interscript-maps 2.0.5
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +7 -0
- data/README.adoc +28 -0
- data/interscript-maps.gemspec +28 -0
- data/interscript-maps.yaml +235 -0
- data/libs/posix.iml +11 -0
- data/libs/unicode.iml +13 -0
- data/libs/var-Cyrl.iml +7 -0
- data/libs/var-kor.iml +17 -0
- data/maps-staging/royin-tha-Thai-Latn-1939-generic.imp +98 -0
- data/maps-staging/royin-tha-Thai-Latn-1968.imp +156 -0
- data/maps-staging/royin-tha-Thai-Latn-1999-chained.imp +161 -0
- data/maps-staging/royin-tha-Thai-Latn-1999.imp +78 -0
- data/maps-staging/var-tha-Thai-Thai-phonemic.imp +53 -0
- data/maps-staging/var-tha-Thai-Zsym-ipa.imp +273 -0
- data/maps/acadsin-zho-Hani-Latn-2002.imp +27515 -0
- data/maps/alalc-amh-Ethi-Latn-1997.imp +392 -0
- data/maps/alalc-amh-Ethi-Latn-2011.imp +85 -0
- data/maps/alalc-ara-Arab-Latn-1997.imp +1171 -0
- data/maps/alalc-asm-Deva-Latn-1997.imp +214 -0
- data/maps/alalc-asm-Deva-Latn-2012.imp +53 -0
- data/maps/alalc-aze-Arab-Latn-1997.imp +321 -0
- data/maps/alalc-aze-Cyrl-Latn-1997.imp +101 -0
- data/maps/alalc-bel-Cyrl-Latn-1997.imp +118 -0
- data/maps/alalc-ben-Beng-Latn-1997.imp +225 -0
- data/maps/alalc-ben-Beng-Latn-2017.imp +135 -0
- data/maps/alalc-bul-Cyrl-Latn-1997.imp +110 -0
- data/maps/alalc-div-Thaa-Latn-1997.imp +171 -0
- data/maps/alalc-ell-Grek-Latn-1997.imp +381 -0
- data/maps/alalc-ell-Grek-Latn-2010.imp +382 -0
- data/maps/alalc-guj-Gujr-Latn-1997.imp +223 -0
- data/maps/alalc-guj-Gujr-Latn-2011.imp +57 -0
- data/maps/alalc-hin-Deva-Latn-1997.imp +248 -0
- data/maps/alalc-hin-Deva-Latn-2011.imp +63 -0
- data/maps/alalc-kan-Kana-Latn-1997.imp +233 -0
- data/maps/alalc-kan-Kana-Latn-2011.imp +58 -0
- data/maps/alalc-kat-Geok-Latn-1997.imp +109 -0
- data/maps/alalc-kat-Geor-Latn-1997.imp +104 -0
- data/maps/alalc-kor-Hang-Latn-1997.imp +68 -0
- data/maps/alalc-mal-Mlym-Latn-1997.imp +260 -0
- data/maps/alalc-mal-Mlym-Latn-2012.imp +65 -0
- data/maps/alalc-mar-Deva-Latn-1997.imp +178 -0
- data/maps/alalc-mar-Deva-Latn-2011.imp +51 -0
- data/maps/alalc-mkd-Cyrl-Latn-1997.imp +125 -0
- data/maps/alalc-mkd-Cyrl-Latn-2013.imp +113 -0
- data/maps/alalc-mon-Cyrl-Latn-1997.imp +161 -0
- data/maps/alalc-ori-Orya-Latn-1997.imp +234 -0
- data/maps/alalc-ori-Orya-Latn-2011.imp +59 -0
- data/maps/alalc-pan-Guru-Latn-1997.imp +241 -0
- data/maps/alalc-pan-Guru-Latn-2011.imp +71 -0
- data/maps/alalc-per-Arab-Latn-1997.imp +318 -0
- data/maps/alalc-pli-Deva-Latn-2012.imp +140 -0
- data/maps/alalc-pra-Deva-Latn-2012.imp +52 -0
- data/maps/alalc-rus-Cyrl-Latn-1997.imp +165 -0
- data/maps/alalc-rus-Cyrl-Latn-2012.imp +107 -0
- data/maps/alalc-san-Deva-Latn-2012.imp +207 -0
- data/maps/alalc-sin-Sinh-Latn-1997.imp +246 -0
- data/maps/alalc-sin-Sinh-Latn-2011.imp +63 -0
- data/maps/alalc-srp-Cyrl-Latn-1997.imp +124 -0
- data/maps/alalc-srp-Cyrl-Latn-2013.imp +115 -0
- data/maps/alalc-tam-Taml-Latn-1997.imp +52 -0
- data/maps/alalc-tam-Taml-Latn-2011.imp +49 -0
- data/maps/alalc-tel-Telu-Latn-1997.imp +237 -0
- data/maps/alalc-tel-Telu-Latn-2011.imp +58 -0
- data/maps/alalc-ukr-Cyrl-Latn-1997.imp +123 -0
- data/maps/alalc-ukr-Cyrl-Latn-2011.imp +32 -0
- data/maps/apcbg-bul-Cyrl-Latn-1995.imp +194 -0
- data/maps/az-aze-Cyrl-Latn-1939.imp +105 -0
- data/maps/az-aze-Cyrl-Latn-1958.imp +50 -0
- data/maps/bas-rus-Cyrl-Latn-2017-bss.imp +160 -0
- data/maps/bas-rus-Cyrl-Latn-2017-oss.imp +165 -0
- data/maps/bgn-jpn-Hrkt-Latn-1962.imp +288 -0
- data/maps/bgn-kor-Hang-Latn-1943.imp +31 -0
- data/maps/bgn-kor-Kore-Latn-1943.imp +33 -0
- data/maps/bgna-bul-Cyrl-Latn-2006.imp +119 -0
- data/maps/bgna-bul-Cyrl-Latn-2009.imp +119 -0
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +393 -0
- data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +472 -0
- data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +125 -0
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +111 -0
- data/maps/bgnpcgn-bak-Cyrl-Latn-2007.imp +169 -0
- data/maps/bgnpcgn-bal-Arab-Latn-2008.imp +296 -0
- data/maps/bgnpcgn-bel-Cyrl-Latn-1979.imp +200 -0
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +137 -0
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +38 -0
- data/maps/bgnpcgn-che-Cyrl-Latn-2008.imp +176 -0
- data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +56 -0
- data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +90 -0
- data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +71 -0
- data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +443 -0
- data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +269 -0
- data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +41 -0
- data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +28 -0
- data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +111 -0
- data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +42 -0
- data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +32 -0
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +191 -0
- data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +116 -0
- data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +43 -0
- data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +193 -0
- data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +170 -0
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +177 -0
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +40 -0
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +41 -0
- data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +240 -0
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +132 -0
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +174 -0
- data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +168 -0
- data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +208 -0
- data/maps/bgnpcgn-per-Arab-Latn-1958.imp +312 -0
- data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +552 -0
- data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +445 -0
- data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +289 -0
- data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +165 -0
- data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +133 -0
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +195 -0
- data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +48 -0
- data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +55 -0
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +146 -0
- data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +185 -0
- data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +188 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +136 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +88 -0
- data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +333 -0
- data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +145 -0
- data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +74 -0
- data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +7463 -0
- data/maps/bis-asm-Beng-Latn-13194-1991.imp +154 -0
- data/maps/bis-ben-Beng-Latn-13194-1991.imp +151 -0
- data/maps/bis-dev-Deva-Latn-13194-1991.imp +178 -0
- data/maps/bis-guj-Gujr-Latn-13194-1991.imp +172 -0
- data/maps/bis-kan-Kana-Latn-13194-1991.imp +166 -0
- data/maps/bis-mlm-Mlym-Latn-13194-1991.imp +170 -0
- data/maps/bis-ori-Orya-Latn-13194-1991.imp +168 -0
- data/maps/bis-pnj-Guru-Latn-13194-1991.imp +169 -0
- data/maps/bis-tel-Telu-Latn-13194-1991.imp +165 -0
- data/maps/bis-tml-Taml-Latn-13194-1991.imp +149 -0
- data/maps/by-bel-Cyrl-Latn-1998.imp +123 -0
- data/maps/by-bel-Cyrl-Latn-2007.imp +77 -0
- data/maps/din-grc-Grek-Latn-31634-2011-t1.imp +627 -0
- data/maps/din-hin-Deva-Latn-33904-2018.imp +101 -0
- data/maps/din-kat-Geor-Latn-32707-2010.imp +103 -0
- data/maps/din-mar-Deva-Latn-33904-2018.imp +83 -0
- data/maps/din-nep-Deva-Latn-33904-2018.imp +110 -0
- data/maps/din-pli-Deva-Latn-33904-2018.imp +72 -0
- data/maps/din-pra-Deva-Latn-33904-2018.imp +66 -0
- data/maps/din-san-Deva-Latn-33904-2018.imp +294 -0
- data/maps/din-tam-Taml-Latn-33903-2016.imp +187 -0
- data/maps/dos-nep-Deva-Latn-1997.imp +47 -0
- data/maps/elot-ell-Grek-Latn-743-1982-tl.imp +399 -0
- data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +397 -0
- data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +34 -0
- data/maps/elot-ell-Grek-Latn-743-2001-ts.imp +178 -0
- data/maps/ggg-kat-Geor-Latn-2002.imp +75 -0
- data/maps/gki-bel-Cyrl-Latn-1992.imp +44 -0
- data/maps/gki-bel-Cyrl-Latn-2000.imp +159 -0
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +179 -0
- data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.imp +132 -0
- data/maps/hk-yue-Hani-Latn-1888.imp +29201 -0
- data/maps/icao-bel-Cyrl-Latn-9303.imp +136 -0
- data/maps/icao-bul-Cyrl-Latn-9303.imp +127 -0
- data/maps/icao-fas-Arab-Latn-9303.imp +112 -0
- data/maps/icao-heb-Hebr-Latn-9303.imp +160 -0
- data/maps/icao-mkd-Cyrl-Latn-9303.imp +126 -0
- data/maps/icao-rus-Cyrl-Latn-9303.imp +126 -0
- data/maps/icao-srp-Cyrl-Latn-9303.imp +126 -0
- data/maps/icao-ukr-Cyrl-Latn-9303.imp +127 -0
- data/maps/iso-ara-Arab-Latn-233-1984.imp +301 -0
- data/maps/iso-asm-Beng-Latn-15919-2001.imp +73 -0
- data/maps/iso-ben-Beng-Latn-15919-2001.imp +171 -0
- data/maps/iso-ell-Grek-Latn-843-1997-t1.imp +365 -0
- data/maps/iso-ell-Grek-Latn-843-1997-t2.imp +43 -0
- data/maps/iso-guj-Gujr-Latn-15919-2001.imp +214 -0
- data/maps/iso-hin-Deva-Latn-15919-2001.imp +73 -0
- data/maps/iso-inc-Deva-Latn-15919-2001.imp +61 -0
- data/maps/iso-jpn-Hrkt-Latn-3602-1989.imp +59 -0
- data/maps/iso-kan-Kana-Latn-15919-2001.imp +212 -0
- data/maps/iso-kat-Geor-Latn-9984-1996.imp +103 -0
- data/maps/iso-kor-Hang-Latn-1996-method1.imp +140 -0
- data/maps/iso-kor-Hang-Latn-1996-method2.imp +132 -0
- data/maps/iso-mal-Mlym-Latn-15919-2001.imp +276 -0
- data/maps/iso-mar-Deva-Latn-15919-2001.imp +68 -0
- data/maps/iso-nep-Deva-Latn-15919-2001.imp +75 -0
- data/maps/iso-ori-Orya-Latn-15919-2001.imp +188 -0
- data/maps/iso-pan-Guru-Latn-15919-2001.imp +217 -0
- data/maps/iso-pli-Beng-Latn-15919-2001.imp +66 -0
- data/maps/iso-pli-Deva-Latn-15919-2001.imp +68 -0
- data/maps/iso-pli-Sinh-Latn-15919-2001.imp +211 -0
- data/maps/iso-pli-Thai-Latn-15919-2001.imp +47 -0
- data/maps/iso-pra-Deva-Latn-15919-2001.imp +60 -0
- data/maps/iso-prs-Arab-Latn-233-3-1999.imp +352 -0
- data/maps/iso-rus-Cyrl-Latn-9-1995.imp +279 -0
- data/maps/iso-san-Deva-Latn-15919-2001.imp +215 -0
- data/maps/iso-tam-Taml-Latn-15919-2001.imp +153 -0
- data/maps/iso-tel-Telu-Latn-15919-2001.imp +214 -0
- data/maps/iso-tha-Thai-Latn-11940-1998.imp +114 -0
- data/maps/kp-kor-Hang-Latn-2002.imp +540 -0
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +29005 -0
- data/maps/masm-mon-Cyrl-Latn-5217-2012.imp +136 -0
- data/maps/masm-mon-Latn-Cyrl-5217-2012.imp +162 -0
- data/maps/mext-jpn-Hrkt-Latn-1954.imp +403 -0
- data/maps/moct-kor-Hang-Latn-2000.imp +475 -0
- data/maps/mofa-jpn-Hrkt-Latn-1989.imp +484 -0
- data/maps/mv-div-Thaa-Latn-1987.imp +144 -0
- data/maps/mvd-bel-Cyrl-Latn-2008.imp +224 -0
- data/maps/mvd-bel-Cyrl-Latn-2010.imp +64 -0
- data/maps/mvd-rus-Cyrl-Latn-2008.imp +110 -0
- data/maps/mvd-rus-Cyrl-Latn-2010.imp +40 -0
- data/maps/odni-ara-Arab-Latn-2004.imp +106 -0
- data/maps/odni-ara-Arab-Latn-2015.imp +281 -0
- data/maps/odni-aze-Cyrl-Latn-2015.imp +158 -0
- data/maps/odni-bel-Cyrl-Latn-2015.imp +138 -0
- data/maps/odni-bul-Cyrl-Latn-2005.imp +90 -0
- data/maps/odni-bul-Cyrl-Latn-2015.imp +103 -0
- data/maps/odni-che-Cyrl-Latn-2015.imp +165 -0
- data/maps/odni-fas-Arab-Latn-2004.imp +268 -0
- data/maps/odni-fas-Arab-Latn-2015.imp +398 -0
- data/maps/odni-hin-Deva-Latn-2004.imp +180 -0
- data/maps/odni-hin-Deva-Latn-2015.imp +256 -0
- data/maps/odni-kat-Geor-Latn-2015.imp +76 -0
- data/maps/odni-kaz-Cyrl-Latn-2015.imp +164 -0
- data/maps/odni-kir-Cyrl-Latn-2015.imp +149 -0
- data/maps/odni-kor-Hang-Latn-2015.imp +307 -0
- data/maps/odni-mkd-Cyrl-Latn-2005.imp +28 -0
- data/maps/odni-mkd-Cyrl-Latn-2015.imp +124 -0
- data/maps/odni-prs-Arab-Latn-2004.imp +120 -0
- data/maps/odni-prs-Arab-Latn-2015.imp +225 -0
- data/maps/odni-pus-Arab-Latn-2011.imp +327 -0
- data/maps/odni-rus-Cyrl-Latn-2015.imp +79 -0
- data/maps/odni-srp-Cyrl-Latn-2005.imp +35 -0
- data/maps/odni-srp-Cyrl-Latn-2015.imp +130 -0
- data/maps/odni-tat-Cyrl-Latn-2015.imp +157 -0
- data/maps/odni-tgk-Cyrl-Latn-2015.imp +161 -0
- data/maps/odni-tuk-Cyrl-Latn-2015.imp +159 -0
- data/maps/odni-uig-Cyrl-Latn-2015.imp +151 -0
- data/maps/odni-ukr-Cyrl-Latn-2015.imp +136 -0
- data/maps/odni-urd-Arab-Latn-2015.imp +220 -0
- data/maps/odni-uzb-Cyrl-Latn-2015.imp +165 -0
- data/maps/sac-zho-Hans-Latn-1979.imp +20940 -0
- data/maps/sasm-mon-Mong-Latn-general-1978.imp +294 -0
- data/maps/sasm-mon-Mong-Latn-phonetic-1978.imp +261 -0
- data/maps/ses-ara-Arab-Latn-1930.imp +225 -0
- data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.imp +171 -0
- data/maps/ua-ukr-Cyrl-Latn-1996.imp +149 -0
- data/maps/ua-ukr-Cyrl-Latn-2007.imp +69 -0
- data/maps/ua-ukr-Cyrl-Latn-2010.imp +128 -0
- data/maps/un-amh-Ethi-Latn-2016.imp +483 -0
- data/maps/un-ara-Arab-Latn-1971.imp +137 -0
- data/maps/un-ara-Arab-Latn-1972.imp +155 -0
- data/maps/un-ara-Arab-Latn-2017.imp +375 -0
- data/maps/un-asm-Beng-Latn-1972.imp +188 -0
- data/maps/un-bel-Cyrl-Latn-2007.imp +78 -0
- data/maps/un-ben-Beng-Latn-2016.imp +516 -0
- data/maps/un-ell-Grek-Latn-1987-phonetic.imp +437 -0
- data/maps/un-ell-Grek-Latn-1987-tl.imp +27 -0
- data/maps/un-ell-Grek-Latn-1987-ts.imp +269 -0
- data/maps/un-guj-Gujr-Latn-1972.imp +196 -0
- data/maps/un-hin-Deva-Latn-2016.imp +356 -0
- data/maps/un-kan-Kana-Latn-2016.imp +214 -0
- data/maps/un-mal-Mlym-Latn-1972.imp +215 -0
- data/maps/un-mar-Deva-Latn-2016.imp +96 -0
- data/maps/un-mon-Mong-Latn-general-2013.imp +170 -0
- data/maps/un-mon-Mong-Latn-phonetic-2013.imp +170 -0
- data/maps/un-nep-Deva-Latn-1972.imp +295 -0
- data/maps/un-nep-Deva-Latn-2013.imp +62 -0
- data/maps/un-ori-Orya-Latn-1972.imp +208 -0
- data/maps/un-pan-Guru-Latn-1972.imp +321 -0
- data/maps/un-prs-Arab-Latn-1967.imp +214 -0
- data/maps/un-rus-Cyrl-Latn-1987.imp +96 -0
- data/maps/un-sin-Sinh-Latn-1972.imp +193 -0
- data/maps/un-tam-Taml-Latn-1972.imp +173 -0
- data/maps/un-tel-Telu-Latn-1972.imp +229 -0
- data/maps/un-ukr-Cyrl-Latn-1998.imp +58 -0
- data/maps/un-ukr-Cyrl-Latn-2012.imp +95 -0
- data/maps/un-urd-Arab-Latn-1972.imp +290 -0
- data/maps/var-amh-Ethi-Latn-eae-2003.imp +414 -0
- data/maps/var-gez-Ethi-Latn-eae-2003.imp +54 -0
- data/maps/var-hin-Deva-Latn-hunterian-1872.imp +212 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1886.imp +399 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1954.imp +382 -0
- data/maps/var-kor-Hang-Hang-jamo.imp +11196 -0
- data/maps/var-kor-Hang-Latn-mr-1939.imp +574 -0
- data/maps/var-kor-Kore-Hang-2013.imp +59764 -0
- data/maps/var-kor-Kore-Latn-mr-1939.imp +36 -0
- data/maps/var-mar-Deva-Latn-hunterian-1872.imp +39 -0
- data/maps/var-mon-Mong-Latn-1930.imp +101 -0
- data/maps/var-mon-Mong-Latn-lessing.imp +181 -0
- data/maps/var-mon-Mong-Latn-vpmc.imp +182 -0
- data/maps/var-pra-Deva-Latn-iast-1912.imp +36 -0
- data/maps/var-san-Deva-Latn-iast-1912.imp +147 -0
- data/maps/var-zho-Hani-Latn-wd-1979.imp +27549 -0
- metadata +335 -0
|
@@ -0,0 +1,156 @@
|
|
|
1
|
+
metadata {
|
|
2
|
+
authority_id: royin
|
|
3
|
+
id: 1968-chained
|
|
4
|
+
language: iso-639-2:tha
|
|
5
|
+
source_script: Thai
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: Royal Thai General System of Transcription (1968)
|
|
8
|
+
url: http://www.royin.go.th/wp-content/uploads/royin-ebook/276/FileUpload/758_6484.pdf
|
|
9
|
+
creation_date: 1968
|
|
10
|
+
adoption_date:
|
|
11
|
+
description: |
|
|
12
|
+
This map loads two external maps to convert Thai text first into phonemic Thai,
|
|
13
|
+
and then into IPA transcription.
|
|
14
|
+
|
|
15
|
+
The IPA transcription will then be handled by this map, and converted into
|
|
16
|
+
Royal Thai General System of Transcription (1968).
|
|
17
|
+
|
|
18
|
+
The first two parts are done via two external maps.
|
|
19
|
+
|
|
20
|
+
notes: |
|
|
21
|
+
The conversion from Thai to Phonemic Thai is still work-in-progress.
|
|
22
|
+
}
|
|
23
|
+
|
|
24
|
+
tests {
|
|
25
|
+
test "สะพาน", "saphan"
|
|
26
|
+
test "ลานตา", "lanta"
|
|
27
|
+
test "บาง", "bang"
|
|
28
|
+
test "สมุทร", "samut"
|
|
29
|
+
test "ลำ", "lam"
|
|
30
|
+
test "สิงห์", "sing"
|
|
31
|
+
test "บุรี", "buri"
|
|
32
|
+
test "สตึก", "satuk"
|
|
33
|
+
test "พืช", "phut"
|
|
34
|
+
test "บรบือ", "borabu"
|
|
35
|
+
test "ภู", "phu"
|
|
36
|
+
test "ปะนาเระ", "panare"
|
|
37
|
+
test "เพ็ญ", "phen"
|
|
38
|
+
# - source: "เขน"
|
|
39
|
+
# expected: "khen"
|
|
40
|
+
test "แซะ", "sae"
|
|
41
|
+
# - source: "สะแก"
|
|
42
|
+
# expected: "sakae"
|
|
43
|
+
test "พะโต๊ะ", "phato"
|
|
44
|
+
test "ลพ", "lop"
|
|
45
|
+
# - source: "สามโก้"
|
|
46
|
+
# expected: "samko"
|
|
47
|
+
test "เกาะ", "ko"
|
|
48
|
+
test "บ่อ", "bo"
|
|
49
|
+
test "เซอะ", "soe"
|
|
50
|
+
test "อำเภอ", "amphoe"
|
|
51
|
+
test "เนิน", "noen"
|
|
52
|
+
# - source: "เพียะ"
|
|
53
|
+
# expected: "phia"
|
|
54
|
+
test "เทียน", "thian"
|
|
55
|
+
# - source: "เกือะ"
|
|
56
|
+
# expected: "kua"
|
|
57
|
+
test "เมือง", "muang"
|
|
58
|
+
# - source: "ผัวะ"
|
|
59
|
+
# expected: "phua"
|
|
60
|
+
test "บัว", "bua"
|
|
61
|
+
# - source: "ควน"
|
|
62
|
+
# expected: "khuan"
|
|
63
|
+
test "ใหญ่", "yai"
|
|
64
|
+
# - source: "ไผ่"
|
|
65
|
+
# expected: "phai"
|
|
66
|
+
test "ชัย", "chai"
|
|
67
|
+
test "ไทย", "thai"
|
|
68
|
+
# - source: "ปาย"
|
|
69
|
+
# expected: "pai"
|
|
70
|
+
test "เจ้า", "chao"
|
|
71
|
+
test "ข้าว", "khao"
|
|
72
|
+
# - source: "กุย"
|
|
73
|
+
# expected: "kui"
|
|
74
|
+
test "โดย", "doi"
|
|
75
|
+
# - source: "ดอย"
|
|
76
|
+
# expected: "doi"
|
|
77
|
+
# - source: "งิ้ว"
|
|
78
|
+
# expected: "ngiu"
|
|
79
|
+
test "เร็ว", "reo"
|
|
80
|
+
# - source: "เลว"
|
|
81
|
+
# expected: "leo"
|
|
82
|
+
# - source: "เลย"
|
|
83
|
+
# expected: "loei"
|
|
84
|
+
# - source: "เดือย"
|
|
85
|
+
# expected: "duai"
|
|
86
|
+
# - source: "ห้วย"
|
|
87
|
+
# expected: "huai"
|
|
88
|
+
test "แมว", "maeo"
|
|
89
|
+
test "เขียว", "khieu"
|
|
90
|
+
}
|
|
91
|
+
|
|
92
|
+
# This map has been partially converted by the bin/maps_v1_to_v2 script.
|
|
93
|
+
# The section below requires human attention. Remember to remove this
|
|
94
|
+
# comment and move the converted map to 'maps/' directory. Please also
|
|
95
|
+
# take note that the maps-staging directory will be cleaned up whenever
|
|
96
|
+
# you run the bin/maps_v1_to_v2 script. You should particularly be
|
|
97
|
+
# concerned about any regular expressions found in this file and about
|
|
98
|
+
# advanced expressions in parallel {} parts, and also about the order
|
|
99
|
+
# of particular parts of the stage.
|
|
100
|
+
|
|
101
|
+
dependency "var-tha-Thai-Thai-phonemic", as: thaiphonemic
|
|
102
|
+
dependency "var-tha-Thai-Zsym-ipa", as: thaizsym
|
|
103
|
+
|
|
104
|
+
stage {
|
|
105
|
+
run map.thaiphonemic.stage.main
|
|
106
|
+
run map.thaizsym.stage.main
|
|
107
|
+
|
|
108
|
+
# DICTIONARY
|
|
109
|
+
parallel {
|
|
110
|
+
|
|
111
|
+
sub "̯", ""
|
|
112
|
+
sub "̚", ""
|
|
113
|
+
|
|
114
|
+
sub "ʔ", ""
|
|
115
|
+
sub "ː", ""
|
|
116
|
+
|
|
117
|
+
sub "t͡ɕʰ", "ch"
|
|
118
|
+
sub "t͡ɕ", "ch"
|
|
119
|
+
sub "ŋ", "ng"
|
|
120
|
+
sub "j", "y"
|
|
121
|
+
sub "ɔ", "o"
|
|
122
|
+
sub "ɤ", "oe"
|
|
123
|
+
sub "ɛ", "ae"
|
|
124
|
+
sub "ɯ", "u"
|
|
125
|
+
sub "ʰ", "h"
|
|
126
|
+
|
|
127
|
+
sub "aːw", "ao"
|
|
128
|
+
sub "aw", "ao"
|
|
129
|
+
sub "a̯w", "eu"
|
|
130
|
+
sub "eːw", "eo"
|
|
131
|
+
sub "ew", "eo"
|
|
132
|
+
sub "ɛːw", "aeo"
|
|
133
|
+
sub "ɛw", "aeo"
|
|
134
|
+
sub "iːw", "iu"
|
|
135
|
+
sub "iw", "iu"
|
|
136
|
+
|
|
137
|
+
sub "aːj", "ai"
|
|
138
|
+
sub "aj", "ai"
|
|
139
|
+
sub "a̯j", "ai"
|
|
140
|
+
sub "ɔːj", "oi"
|
|
141
|
+
sub "ɔj", "oi"
|
|
142
|
+
sub "oːj", "oi"
|
|
143
|
+
sub "oj", "oi"
|
|
144
|
+
sub "ɤːj", "oei"
|
|
145
|
+
sub "ɤj", "oei"
|
|
146
|
+
sub "uːj", "ui"
|
|
147
|
+
sub "uj", "ui"
|
|
148
|
+
}
|
|
149
|
+
|
|
150
|
+
# RULES
|
|
151
|
+
sub any("˩˨˧˦˥"), ""
|
|
152
|
+
sub line_start, "." # inserts a "." at every line start; the POSTRULES rule `sub ".", ""` below strips all "." again
|
|
153
|
+
|
|
154
|
+
# POSTRULES
|
|
155
|
+
sub ".", ""
|
|
156
|
+
}
|
|
@@ -0,0 +1,161 @@
|
|
|
1
|
+
metadata {
|
|
2
|
+
authority_id: royin
|
|
3
|
+
id: 1999-chained
|
|
4
|
+
language: iso-639-2:tha
|
|
5
|
+
source_script: Thai
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: Royal Thai General System of Transcription (1999)
|
|
8
|
+
url: http://www.royin.go.th/wp-content/uploads/royin-ebook/276/FileUpload/758_6484.pdf
|
|
9
|
+
creation_date: 1999
|
|
10
|
+
adoption_date:
|
|
11
|
+
description: |
|
|
12
|
+
This map loads two external maps to convert Thai text first into phonemic Thai,
|
|
13
|
+
and then into IPA transcription.
|
|
14
|
+
|
|
15
|
+
The IPA transcription will then be handled by this map, and converted into
|
|
16
|
+
Royal Thai General System of Transcription (1999).
|
|
17
|
+
|
|
18
|
+
The first two parts are done via two external maps.
|
|
19
|
+
|
|
20
|
+
notes: |
|
|
21
|
+
The conversion from Thai to Phonemic Thai is still work-in-progress.
|
|
22
|
+
}
|
|
23
|
+
|
|
24
|
+
tests {
|
|
25
|
+
test "สะพาน", "saphan"
|
|
26
|
+
test "ลานตา", "lanta"
|
|
27
|
+
test "บาง", "bang"
|
|
28
|
+
test "สมุทร", "samut"
|
|
29
|
+
test "ลำ", "lam"
|
|
30
|
+
test "สิงห์", "sing"
|
|
31
|
+
test "บุรี", "buri"
|
|
32
|
+
test "สตึก", "satuek"
|
|
33
|
+
test "พืช", "phuet"
|
|
34
|
+
test "บรบือ", "borabue"
|
|
35
|
+
test "ภู", "phu"
|
|
36
|
+
test "ปะนาเระ", "panare"
|
|
37
|
+
test "เพ็ญ", "phen"
|
|
38
|
+
# - source: "เขน"
|
|
39
|
+
# expected: "khen"
|
|
40
|
+
test "แซะ", "sae"
|
|
41
|
+
# - source: "สะแก"
|
|
42
|
+
# expected: "sakae"
|
|
43
|
+
test "พะโต๊ะ", "phato"
|
|
44
|
+
test "ลพ", "lop"
|
|
45
|
+
# - source: "สามโก้"
|
|
46
|
+
# expected: "samko"
|
|
47
|
+
test "เกาะ", "ko"
|
|
48
|
+
test "บ่อ", "bo"
|
|
49
|
+
test "เซอะ", "soe"
|
|
50
|
+
test "อำเภอ", "amphoe"
|
|
51
|
+
test "เนิน", "noen"
|
|
52
|
+
# - source: "เพียะ"
|
|
53
|
+
# expected: "phia"
|
|
54
|
+
test "เทียน", "thian"
|
|
55
|
+
# - source: "เกือะ"
|
|
56
|
+
# expected: "kuea"
|
|
57
|
+
test "เมือง", "mueang"
|
|
58
|
+
# - source: "ผัวะ"
|
|
59
|
+
# expected: "phua"
|
|
60
|
+
test "บัว", "bua"
|
|
61
|
+
# - source: "ควน"
|
|
62
|
+
# expected: "khuan"
|
|
63
|
+
test "ใหญ่", "yai"
|
|
64
|
+
# - source: "ไผ่"
|
|
65
|
+
# expected: "phai"
|
|
66
|
+
test "ชัย", "chai"
|
|
67
|
+
test "ไทย", "thai"
|
|
68
|
+
# - source: "ปาย"
|
|
69
|
+
# expected: "pai"
|
|
70
|
+
test "เจ้า", "chao"
|
|
71
|
+
test "ข้าว", "khao"
|
|
72
|
+
# - source: "กุย"
|
|
73
|
+
# expected: "kui"
|
|
74
|
+
test "โดย", "doi"
|
|
75
|
+
# - source: "ดอย"
|
|
76
|
+
# expected: "doi"
|
|
77
|
+
# - source: "งิ้ว"
|
|
78
|
+
# expected: "ngio"
|
|
79
|
+
test "เร็ว", "reo"
|
|
80
|
+
# - source: "เลว"
|
|
81
|
+
# expected: "leo"
|
|
82
|
+
# - source: "เลย"
|
|
83
|
+
# expected: "loei"
|
|
84
|
+
# - source: "เดือย"
|
|
85
|
+
# expected: "dueai"
|
|
86
|
+
# - source: "ห้วย"
|
|
87
|
+
# expected: "huai"
|
|
88
|
+
test "แมว", "maeo"
|
|
89
|
+
test "เขียว", "khiao"
|
|
90
|
+
}
|
|
91
|
+
|
|
92
|
+
# This map has been partially converted by the bin/maps_v1_to_v2 script.
|
|
93
|
+
# The section below requires human attention. Remember to remove this
|
|
94
|
+
# comment and move the converted map to 'maps/' directory. Please also
|
|
95
|
+
# take note that the maps-staging directory will be cleaned up whenever
|
|
96
|
+
# you run the bin/maps_v1_to_v2 script. You should particularly be
|
|
97
|
+
# concerned about any regular expressions found in this file and about
|
|
98
|
+
# advanced expressions in parallel {} parts, and also about the order
|
|
99
|
+
# of particular parts of the stage.
|
|
100
|
+
|
|
101
|
+
dependency "var-tha-Thai-Thai-phonemic", as: thaiphonemic
|
|
102
|
+
dependency "var-tha-Thai-Zsym-ipa", as: thaizsym
|
|
103
|
+
|
|
104
|
+
stage {
|
|
105
|
+
run map.thaiphonemic.stage.main
|
|
106
|
+
run map.thaizsym.stage.main
|
|
107
|
+
|
|
108
|
+
# DICTIONARY
|
|
109
|
+
parallel {
|
|
110
|
+
|
|
111
|
+
sub "̯", ""
|
|
112
|
+
sub "̚", ""
|
|
113
|
+
|
|
114
|
+
sub "ʔ", ""
|
|
115
|
+
sub "ː", ""
|
|
116
|
+
|
|
117
|
+
sub "t͡ɕʰ", "ch"
|
|
118
|
+
sub "t͡ɕ", "ch"
|
|
119
|
+
sub "ŋ", "ng"
|
|
120
|
+
sub "j", "y"
|
|
121
|
+
sub "ɔ", "o"
|
|
122
|
+
sub "ɤ", "oe"
|
|
123
|
+
sub "ɛ", "ae"
|
|
124
|
+
sub "ɯ", "ue" # New spelling, was u in 1968
|
|
125
|
+
sub "ʰ", "h"
|
|
126
|
+
|
|
127
|
+
sub "aːw", "ao"
|
|
128
|
+
sub "aw", "ao"
|
|
129
|
+
sub "a̯w", "ao" # New spelling, was eu in 1968
|
|
130
|
+
sub "eːw", "eo"
|
|
131
|
+
sub "ew", "eo"
|
|
132
|
+
sub "ɛːw", "aeo"
|
|
133
|
+
sub "ɛw", "aeo"
|
|
134
|
+
sub "iːw", "io" # New spelling, was iu in 1968
|
|
135
|
+
sub "iw", "io" # New spelling, was iu in 1968
|
|
136
|
+
|
|
137
|
+
sub "aːj", "ai"
|
|
138
|
+
sub "aj", "ai"
|
|
139
|
+
sub "a̯j", "ai"
|
|
140
|
+
sub "ɔːj", "oi"
|
|
141
|
+
sub "ɔj", "oi"
|
|
142
|
+
sub "oːj", "oi"
|
|
143
|
+
sub "oj", "oi"
|
|
144
|
+
sub "ɤːj", "oei"
|
|
145
|
+
sub "ɤj", "oei"
|
|
146
|
+
sub "uːj", "ui"
|
|
147
|
+
sub "uj", "ui"
|
|
148
|
+
}
|
|
149
|
+
|
|
150
|
+
# RULES
|
|
151
|
+
sub any("˩˨˧˦˥"), ""
|
|
152
|
+
sub line_start, "." # inserts a "." at every line start; the POSTRULES rule `sub ".", ""` below strips all "." again
|
|
153
|
+
|
|
154
|
+
# CHARACTERS
|
|
155
|
+
parallel {
|
|
156
|
+
# Placeholder: no CHARACTERS rules are defined for this map; the block is intentionally empty.
|
|
157
|
+
}
|
|
158
|
+
|
|
159
|
+
# POSTRULES
|
|
160
|
+
sub ".", ""
|
|
161
|
+
}
|
|
@@ -0,0 +1,78 @@
|
|
|
1
|
+
metadata {
|
|
2
|
+
authority_id: royin
|
|
3
|
+
id: 1999
|
|
4
|
+
language: iso-639-2:tha
|
|
5
|
+
source_script: Thai
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: Royal Thai General System of Transcription (1999)
|
|
8
|
+
url: http://www.royin.go.th/wp-content/uploads/royin-ebook/276/FileUpload/758_6484.pdf
|
|
9
|
+
creation_date: 1999
|
|
10
|
+
adoption_date:
|
|
11
|
+
description:
|
|
12
|
+
|
|
13
|
+
notes: |
|
|
14
|
+
}
|
|
15
|
+
|
|
16
|
+
tests {
|
|
17
|
+
test "ภาษาไทย", "phasathai"
|
|
18
|
+
test "ไทย", "thai"
|
|
19
|
+
test "เชียงใหม่", "chiangmai"
|
|
20
|
+
test "ใหม่", "mai"
|
|
21
|
+
test "ใคร", "khrai"
|
|
22
|
+
test "ที่", "thi"
|
|
23
|
+
test "เป็น", "pen"
|
|
24
|
+
test "ใน", "nai"
|
|
25
|
+
test "การ", "kan"
|
|
26
|
+
test "มี", "mi"
|
|
27
|
+
test "ได้", "dai"
|
|
28
|
+
test "ของ", "khong"
|
|
29
|
+
test "ไม่", "mai"
|
|
30
|
+
test "สถานีปางต้นผึ้ง", "sathanipangtonphueng"
|
|
31
|
+
test "ไพศาลี", "phaisali"
|
|
32
|
+
test "โรงเรียนไม้เรียงประชาสรรค์", "rongrianmairiangprachasan"
|
|
33
|
+
}
|
|
34
|
+
|
|
35
|
+
# This map has been partially converted by the bin/maps_v1_to_v2 script.
|
|
36
|
+
# The section below requires human attention. Remember to remove this
|
|
37
|
+
# comment and move the converted map to 'maps/' directory. Please also
|
|
38
|
+
# take note that the maps-staging directory will be cleaned up whenever
|
|
39
|
+
# you run the bin/maps_v1_to_v2 script. You should particularly be
|
|
40
|
+
# concerned about any regular expressions found in this file and about
|
|
41
|
+
# advanced expressions in parallel {} parts, and also about the order
|
|
42
|
+
# of particular parts of the stage.
|
|
43
|
+
|
|
44
|
+
|
|
45
|
+
stage {
|
|
46
|
+
|
|
47
|
+
# DICTIONARY
|
|
48
|
+
parallel {
|
|
49
|
+
sub "ʰ", "h"
|
|
50
|
+
sub "c", "ch"
|
|
51
|
+
sub "ː", ""
|
|
52
|
+
sub "ŋ", "ng"
|
|
53
|
+
sub "j", "i"
|
|
54
|
+
sub "w", "o"
|
|
55
|
+
sub "ɔ", "o"
|
|
56
|
+
sub "ɤ", "oe"
|
|
57
|
+
sub "ɛ", "ae"
|
|
58
|
+
sub "ɯ", "ue"
|
|
59
|
+
sub "ʔ", ""
|
|
60
|
+
sub "t͡ɕ", "ch" # emit "ch" directly: rules inside a parallel block are not chained, so the sibling "c" -> "ch" rule never sees this output; aspirated "t͡ɕʰ" yields "chh", which the POSTRULES rule folds back to "ch"
|
|
61
|
+
sub ".", "" # strip the literal "." syllable separator; the previous `any_character` wildcard deleted every character not matched by another rule. NOTE(review): assumes the v1 source entry was a literal dot misread as a regex by the converter — confirm against the v1 map
|
|
62
|
+
}
|
|
63
|
+
|
|
64
|
+
# RULES
|
|
65
|
+
|
|
66
|
+
# CHARACTERS
|
|
67
|
+
parallel {
|
|
68
|
+
sub any("0".."9"), "" # removes every ASCII digit 0-9 (presumably tone numbers left by the transcription step — TODO confirm)
|
|
69
|
+
|
|
70
|
+
}
|
|
71
|
+
|
|
72
|
+
# POSTRULES
|
|
73
|
+
sub "chh", "ch"
|
|
74
|
+
|
|
75
|
+
}
|
|
76
|
+
|
|
77
|
+
# This map contains transcription and probably depends on seq2seq:
|
|
78
|
+
# transcription: sequitur.pythainlp_lexicon
|
|
@@ -0,0 +1,53 @@
|
|
|
1
|
+
metadata {
|
|
2
|
+
authority_id: var
|
|
3
|
+
id: phonemic
|
|
4
|
+
language: iso-639-2:tha
|
|
5
|
+
source_script: Thai
|
|
6
|
+
destination_script: Thai
|
|
7
|
+
name: Phonemic Thai (Royal Thai General Dictionary)
|
|
8
|
+
url:
|
|
9
|
+
creation_date:
|
|
10
|
+
adoption_date:
|
|
11
|
+
description: |
|
|
12
|
+
This map performs two tasks.
|
|
13
|
+
|
|
14
|
+
First the text is segmented using a dictionary.
|
|
15
|
+
Then the Thai text is sent to an external module to be converted into
|
|
16
|
+
Phonemic Thai.
|
|
17
|
+
|
|
18
|
+
Note that the accuracy for vowel-length distinctions and certain tonal alternations
|
|
19
|
+
is low.
|
|
20
|
+
|
|
21
|
+
notes: |
|
|
22
|
+
}
|
|
23
|
+
|
|
24
|
+
tests {
|
|
25
|
+
test "ที่เปิดขวด", "ที่-เปิด-ขวด"
|
|
26
|
+
test "พื้นหลัง", "พื้น-หฺลัง"
|
|
27
|
+
test "สมชาย", "สม-ชาย"
|
|
28
|
+
test "อ่อนข้อ", "อ็่อน-ค่อ"
|
|
29
|
+
test "โครยอ", "โค-ระ-ยอ"
|
|
30
|
+
test "ไล่ออก", "ไล่-ออก"
|
|
31
|
+
test "ไส้เลื่อน", "ไส้-เลื่อน"
|
|
32
|
+
test "ความวาว", "คฺวาม-วาว"
|
|
33
|
+
test "ไอกรน", "ไอ-กฺรน"
|
|
34
|
+
test "ไอซียู", "ไอ-ซี-ยู"
|
|
35
|
+
test "ไอซ์แลนด์", "ไอ๊ส-แลน"
|
|
36
|
+
}
|
|
37
|
+
|
|
38
|
+
# This map has been partially converted by the bin/maps_v1_to_v2 script.
|
|
39
|
+
# The section below requires human attention. Remember to remove this
|
|
40
|
+
# comment and move the converted map to 'maps/' directory. Please also
|
|
41
|
+
# take note that the maps-staging directory will be cleaned up whenever
|
|
42
|
+
# you run the bin/maps_v1_to_v2 script. You should particularly be
|
|
43
|
+
# concerned about any regular expressions found in this file and about
|
|
44
|
+
# advanced expressions in parallel {} parts, and also about the order
|
|
45
|
+
# of particular parts of the stage.
|
|
46
|
+
|
|
47
|
+
# Not yet implemented
|
|
48
|
+
|
|
49
|
+
stage {
|
|
50
|
+
}
|
|
51
|
+
|
|
52
|
+
# This map contains transcription and probably depends on seq2seq:
|
|
53
|
+
# transcription: sequitur.wiktionary_phonemic
|