interscript-maps 2.0.5
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +7 -0
- data/README.adoc +28 -0
- data/interscript-maps.gemspec +28 -0
- data/interscript-maps.yaml +235 -0
- data/libs/posix.iml +11 -0
- data/libs/unicode.iml +13 -0
- data/libs/var-Cyrl.iml +7 -0
- data/libs/var-kor.iml +17 -0
- data/maps-staging/royin-tha-Thai-Latn-1939-generic.imp +98 -0
- data/maps-staging/royin-tha-Thai-Latn-1968.imp +156 -0
- data/maps-staging/royin-tha-Thai-Latn-1999-chained.imp +161 -0
- data/maps-staging/royin-tha-Thai-Latn-1999.imp +78 -0
- data/maps-staging/var-tha-Thai-Thai-phonemic.imp +53 -0
- data/maps-staging/var-tha-Thai-Zsym-ipa.imp +273 -0
- data/maps/acadsin-zho-Hani-Latn-2002.imp +27515 -0
- data/maps/alalc-amh-Ethi-Latn-1997.imp +392 -0
- data/maps/alalc-amh-Ethi-Latn-2011.imp +85 -0
- data/maps/alalc-ara-Arab-Latn-1997.imp +1171 -0
- data/maps/alalc-asm-Deva-Latn-1997.imp +214 -0
- data/maps/alalc-asm-Deva-Latn-2012.imp +53 -0
- data/maps/alalc-aze-Arab-Latn-1997.imp +321 -0
- data/maps/alalc-aze-Cyrl-Latn-1997.imp +101 -0
- data/maps/alalc-bel-Cyrl-Latn-1997.imp +118 -0
- data/maps/alalc-ben-Beng-Latn-1997.imp +225 -0
- data/maps/alalc-ben-Beng-Latn-2017.imp +135 -0
- data/maps/alalc-bul-Cyrl-Latn-1997.imp +110 -0
- data/maps/alalc-div-Thaa-Latn-1997.imp +171 -0
- data/maps/alalc-ell-Grek-Latn-1997.imp +381 -0
- data/maps/alalc-ell-Grek-Latn-2010.imp +382 -0
- data/maps/alalc-guj-Gujr-Latn-1997.imp +223 -0
- data/maps/alalc-guj-Gujr-Latn-2011.imp +57 -0
- data/maps/alalc-hin-Deva-Latn-1997.imp +248 -0
- data/maps/alalc-hin-Deva-Latn-2011.imp +63 -0
- data/maps/alalc-kan-Kana-Latn-1997.imp +233 -0
- data/maps/alalc-kan-Kana-Latn-2011.imp +58 -0
- data/maps/alalc-kat-Geok-Latn-1997.imp +109 -0
- data/maps/alalc-kat-Geor-Latn-1997.imp +104 -0
- data/maps/alalc-kor-Hang-Latn-1997.imp +68 -0
- data/maps/alalc-mal-Mlym-Latn-1997.imp +260 -0
- data/maps/alalc-mal-Mlym-Latn-2012.imp +65 -0
- data/maps/alalc-mar-Deva-Latn-1997.imp +178 -0
- data/maps/alalc-mar-Deva-Latn-2011.imp +51 -0
- data/maps/alalc-mkd-Cyrl-Latn-1997.imp +125 -0
- data/maps/alalc-mkd-Cyrl-Latn-2013.imp +113 -0
- data/maps/alalc-mon-Cyrl-Latn-1997.imp +161 -0
- data/maps/alalc-ori-Orya-Latn-1997.imp +234 -0
- data/maps/alalc-ori-Orya-Latn-2011.imp +59 -0
- data/maps/alalc-pan-Guru-Latn-1997.imp +241 -0
- data/maps/alalc-pan-Guru-Latn-2011.imp +71 -0
- data/maps/alalc-per-Arab-Latn-1997.imp +318 -0
- data/maps/alalc-pli-Deva-Latn-2012.imp +140 -0
- data/maps/alalc-pra-Deva-Latn-2012.imp +52 -0
- data/maps/alalc-rus-Cyrl-Latn-1997.imp +165 -0
- data/maps/alalc-rus-Cyrl-Latn-2012.imp +107 -0
- data/maps/alalc-san-Deva-Latn-2012.imp +207 -0
- data/maps/alalc-sin-Sinh-Latn-1997.imp +246 -0
- data/maps/alalc-sin-Sinh-Latn-2011.imp +63 -0
- data/maps/alalc-srp-Cyrl-Latn-1997.imp +124 -0
- data/maps/alalc-srp-Cyrl-Latn-2013.imp +115 -0
- data/maps/alalc-tam-Taml-Latn-1997.imp +52 -0
- data/maps/alalc-tam-Taml-Latn-2011.imp +49 -0
- data/maps/alalc-tel-Telu-Latn-1997.imp +237 -0
- data/maps/alalc-tel-Telu-Latn-2011.imp +58 -0
- data/maps/alalc-ukr-Cyrl-Latn-1997.imp +123 -0
- data/maps/alalc-ukr-Cyrl-Latn-2011.imp +32 -0
- data/maps/apcbg-bul-Cyrl-Latn-1995.imp +194 -0
- data/maps/az-aze-Cyrl-Latn-1939.imp +105 -0
- data/maps/az-aze-Cyrl-Latn-1958.imp +50 -0
- data/maps/bas-rus-Cyrl-Latn-2017-bss.imp +160 -0
- data/maps/bas-rus-Cyrl-Latn-2017-oss.imp +165 -0
- data/maps/bgn-jpn-Hrkt-Latn-1962.imp +288 -0
- data/maps/bgn-kor-Hang-Latn-1943.imp +31 -0
- data/maps/bgn-kor-Kore-Latn-1943.imp +33 -0
- data/maps/bgna-bul-Cyrl-Latn-2006.imp +119 -0
- data/maps/bgna-bul-Cyrl-Latn-2009.imp +119 -0
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +393 -0
- data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +472 -0
- data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +125 -0
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +111 -0
- data/maps/bgnpcgn-bak-Cyrl-Latn-2007.imp +169 -0
- data/maps/bgnpcgn-bal-Arab-Latn-2008.imp +296 -0
- data/maps/bgnpcgn-bel-Cyrl-Latn-1979.imp +200 -0
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +137 -0
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +38 -0
- data/maps/bgnpcgn-che-Cyrl-Latn-2008.imp +176 -0
- data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +56 -0
- data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +90 -0
- data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +71 -0
- data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +443 -0
- data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +269 -0
- data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +41 -0
- data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +28 -0
- data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +111 -0
- data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +42 -0
- data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +32 -0
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +191 -0
- data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +116 -0
- data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +43 -0
- data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +193 -0
- data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +170 -0
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +177 -0
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +40 -0
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +41 -0
- data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +240 -0
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +132 -0
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +174 -0
- data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +168 -0
- data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +208 -0
- data/maps/bgnpcgn-per-Arab-Latn-1958.imp +312 -0
- data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +552 -0
- data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +445 -0
- data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +289 -0
- data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +165 -0
- data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +133 -0
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +195 -0
- data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +48 -0
- data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +55 -0
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +146 -0
- data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +185 -0
- data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +188 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +136 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +88 -0
- data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +333 -0
- data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +145 -0
- data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +74 -0
- data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +7463 -0
- data/maps/bis-asm-Beng-Latn-13194-1991.imp +154 -0
- data/maps/bis-ben-Beng-Latn-13194-1991.imp +151 -0
- data/maps/bis-dev-Deva-Latn-13194-1991.imp +178 -0
- data/maps/bis-guj-Gujr-Latn-13194-1991.imp +172 -0
- data/maps/bis-kan-Kana-Latn-13194-1991.imp +166 -0
- data/maps/bis-mlm-Mlym-Latn-13194-1991.imp +170 -0
- data/maps/bis-ori-Orya-Latn-13194-1991.imp +168 -0
- data/maps/bis-pnj-Guru-Latn-13194-1991.imp +169 -0
- data/maps/bis-tel-Telu-Latn-13194-1991.imp +165 -0
- data/maps/bis-tml-Taml-Latn-13194-1991.imp +149 -0
- data/maps/by-bel-Cyrl-Latn-1998.imp +123 -0
- data/maps/by-bel-Cyrl-Latn-2007.imp +77 -0
- data/maps/din-grc-Grek-Latn-31634-2011-t1.imp +627 -0
- data/maps/din-hin-Deva-Latn-33904-2018.imp +101 -0
- data/maps/din-kat-Geor-Latn-32707-2010.imp +103 -0
- data/maps/din-mar-Deva-Latn-33904-2018.imp +83 -0
- data/maps/din-nep-Deva-Latn-33904-2018.imp +110 -0
- data/maps/din-pli-Deva-Latn-33904-2018.imp +72 -0
- data/maps/din-pra-Deva-Latn-33904-2018.imp +66 -0
- data/maps/din-san-Deva-Latn-33904-2018.imp +294 -0
- data/maps/din-tam-Taml-Latn-33903-2016.imp +187 -0
- data/maps/dos-nep-Deva-Latn-1997.imp +47 -0
- data/maps/elot-ell-Grek-Latn-743-1982-tl.imp +399 -0
- data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +397 -0
- data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +34 -0
- data/maps/elot-ell-Grek-Latn-743-2001-ts.imp +178 -0
- data/maps/ggg-kat-Geor-Latn-2002.imp +75 -0
- data/maps/gki-bel-Cyrl-Latn-1992.imp +44 -0
- data/maps/gki-bel-Cyrl-Latn-2000.imp +159 -0
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +179 -0
- data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.imp +132 -0
- data/maps/hk-yue-Hani-Latn-1888.imp +29201 -0
- data/maps/icao-bel-Cyrl-Latn-9303.imp +136 -0
- data/maps/icao-bul-Cyrl-Latn-9303.imp +127 -0
- data/maps/icao-fas-Arab-Latn-9303.imp +112 -0
- data/maps/icao-heb-Hebr-Latn-9303.imp +160 -0
- data/maps/icao-mkd-Cyrl-Latn-9303.imp +126 -0
- data/maps/icao-rus-Cyrl-Latn-9303.imp +126 -0
- data/maps/icao-srp-Cyrl-Latn-9303.imp +126 -0
- data/maps/icao-ukr-Cyrl-Latn-9303.imp +127 -0
- data/maps/iso-ara-Arab-Latn-233-1984.imp +301 -0
- data/maps/iso-asm-Beng-Latn-15919-2001.imp +73 -0
- data/maps/iso-ben-Beng-Latn-15919-2001.imp +171 -0
- data/maps/iso-ell-Grek-Latn-843-1997-t1.imp +365 -0
- data/maps/iso-ell-Grek-Latn-843-1997-t2.imp +43 -0
- data/maps/iso-guj-Gujr-Latn-15919-2001.imp +214 -0
- data/maps/iso-hin-Deva-Latn-15919-2001.imp +73 -0
- data/maps/iso-inc-Deva-Latn-15919-2001.imp +61 -0
- data/maps/iso-jpn-Hrkt-Latn-3602-1989.imp +59 -0
- data/maps/iso-kan-Kana-Latn-15919-2001.imp +212 -0
- data/maps/iso-kat-Geor-Latn-9984-1996.imp +103 -0
- data/maps/iso-kor-Hang-Latn-1996-method1.imp +140 -0
- data/maps/iso-kor-Hang-Latn-1996-method2.imp +132 -0
- data/maps/iso-mal-Mlym-Latn-15919-2001.imp +276 -0
- data/maps/iso-mar-Deva-Latn-15919-2001.imp +68 -0
- data/maps/iso-nep-Deva-Latn-15919-2001.imp +75 -0
- data/maps/iso-ori-Orya-Latn-15919-2001.imp +188 -0
- data/maps/iso-pan-Guru-Latn-15919-2001.imp +217 -0
- data/maps/iso-pli-Beng-Latn-15919-2001.imp +66 -0
- data/maps/iso-pli-Deva-Latn-15919-2001.imp +68 -0
- data/maps/iso-pli-Sinh-Latn-15919-2001.imp +211 -0
- data/maps/iso-pli-Thai-Latn-15919-2001.imp +47 -0
- data/maps/iso-pra-Deva-Latn-15919-2001.imp +60 -0
- data/maps/iso-prs-Arab-Latn-233-3-1999.imp +352 -0
- data/maps/iso-rus-Cyrl-Latn-9-1995.imp +279 -0
- data/maps/iso-san-Deva-Latn-15919-2001.imp +215 -0
- data/maps/iso-tam-Taml-Latn-15919-2001.imp +153 -0
- data/maps/iso-tel-Telu-Latn-15919-2001.imp +214 -0
- data/maps/iso-tha-Thai-Latn-11940-1998.imp +114 -0
- data/maps/kp-kor-Hang-Latn-2002.imp +540 -0
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +29005 -0
- data/maps/masm-mon-Cyrl-Latn-5217-2012.imp +136 -0
- data/maps/masm-mon-Latn-Cyrl-5217-2012.imp +162 -0
- data/maps/mext-jpn-Hrkt-Latn-1954.imp +403 -0
- data/maps/moct-kor-Hang-Latn-2000.imp +475 -0
- data/maps/mofa-jpn-Hrkt-Latn-1989.imp +484 -0
- data/maps/mv-div-Thaa-Latn-1987.imp +144 -0
- data/maps/mvd-bel-Cyrl-Latn-2008.imp +224 -0
- data/maps/mvd-bel-Cyrl-Latn-2010.imp +64 -0
- data/maps/mvd-rus-Cyrl-Latn-2008.imp +110 -0
- data/maps/mvd-rus-Cyrl-Latn-2010.imp +40 -0
- data/maps/odni-ara-Arab-Latn-2004.imp +106 -0
- data/maps/odni-ara-Arab-Latn-2015.imp +281 -0
- data/maps/odni-aze-Cyrl-Latn-2015.imp +158 -0
- data/maps/odni-bel-Cyrl-Latn-2015.imp +138 -0
- data/maps/odni-bul-Cyrl-Latn-2005.imp +90 -0
- data/maps/odni-bul-Cyrl-Latn-2015.imp +103 -0
- data/maps/odni-che-Cyrl-Latn-2015.imp +165 -0
- data/maps/odni-fas-Arab-Latn-2004.imp +268 -0
- data/maps/odni-fas-Arab-Latn-2015.imp +398 -0
- data/maps/odni-hin-Deva-Latn-2004.imp +180 -0
- data/maps/odni-hin-Deva-Latn-2015.imp +256 -0
- data/maps/odni-kat-Geor-Latn-2015.imp +76 -0
- data/maps/odni-kaz-Cyrl-Latn-2015.imp +164 -0
- data/maps/odni-kir-Cyrl-Latn-2015.imp +149 -0
- data/maps/odni-kor-Hang-Latn-2015.imp +307 -0
- data/maps/odni-mkd-Cyrl-Latn-2005.imp +28 -0
- data/maps/odni-mkd-Cyrl-Latn-2015.imp +124 -0
- data/maps/odni-prs-Arab-Latn-2004.imp +120 -0
- data/maps/odni-prs-Arab-Latn-2015.imp +225 -0
- data/maps/odni-pus-Arab-Latn-2011.imp +327 -0
- data/maps/odni-rus-Cyrl-Latn-2015.imp +79 -0
- data/maps/odni-srp-Cyrl-Latn-2005.imp +35 -0
- data/maps/odni-srp-Cyrl-Latn-2015.imp +130 -0
- data/maps/odni-tat-Cyrl-Latn-2015.imp +157 -0
- data/maps/odni-tgk-Cyrl-Latn-2015.imp +161 -0
- data/maps/odni-tuk-Cyrl-Latn-2015.imp +159 -0
- data/maps/odni-uig-Cyrl-Latn-2015.imp +151 -0
- data/maps/odni-ukr-Cyrl-Latn-2015.imp +136 -0
- data/maps/odni-urd-Arab-Latn-2015.imp +220 -0
- data/maps/odni-uzb-Cyrl-Latn-2015.imp +165 -0
- data/maps/sac-zho-Hans-Latn-1979.imp +20940 -0
- data/maps/sasm-mon-Mong-Latn-general-1978.imp +294 -0
- data/maps/sasm-mon-Mong-Latn-phonetic-1978.imp +261 -0
- data/maps/ses-ara-Arab-Latn-1930.imp +225 -0
- data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.imp +171 -0
- data/maps/ua-ukr-Cyrl-Latn-1996.imp +149 -0
- data/maps/ua-ukr-Cyrl-Latn-2007.imp +69 -0
- data/maps/ua-ukr-Cyrl-Latn-2010.imp +128 -0
- data/maps/un-amh-Ethi-Latn-2016.imp +483 -0
- data/maps/un-ara-Arab-Latn-1971.imp +137 -0
- data/maps/un-ara-Arab-Latn-1972.imp +155 -0
- data/maps/un-ara-Arab-Latn-2017.imp +375 -0
- data/maps/un-asm-Beng-Latn-1972.imp +188 -0
- data/maps/un-bel-Cyrl-Latn-2007.imp +78 -0
- data/maps/un-ben-Beng-Latn-2016.imp +516 -0
- data/maps/un-ell-Grek-Latn-1987-phonetic.imp +437 -0
- data/maps/un-ell-Grek-Latn-1987-tl.imp +27 -0
- data/maps/un-ell-Grek-Latn-1987-ts.imp +269 -0
- data/maps/un-guj-Gujr-Latn-1972.imp +196 -0
- data/maps/un-hin-Deva-Latn-2016.imp +356 -0
- data/maps/un-kan-Kana-Latn-2016.imp +214 -0
- data/maps/un-mal-Mlym-Latn-1972.imp +215 -0
- data/maps/un-mar-Deva-Latn-2016.imp +96 -0
- data/maps/un-mon-Mong-Latn-general-2013.imp +170 -0
- data/maps/un-mon-Mong-Latn-phonetic-2013.imp +170 -0
- data/maps/un-nep-Deva-Latn-1972.imp +295 -0
- data/maps/un-nep-Deva-Latn-2013.imp +62 -0
- data/maps/un-ori-Orya-Latn-1972.imp +208 -0
- data/maps/un-pan-Guru-Latn-1972.imp +321 -0
- data/maps/un-prs-Arab-Latn-1967.imp +214 -0
- data/maps/un-rus-Cyrl-Latn-1987.imp +96 -0
- data/maps/un-sin-Sinh-Latn-1972.imp +193 -0
- data/maps/un-tam-Taml-Latn-1972.imp +173 -0
- data/maps/un-tel-Telu-Latn-1972.imp +229 -0
- data/maps/un-ukr-Cyrl-Latn-1998.imp +58 -0
- data/maps/un-ukr-Cyrl-Latn-2012.imp +95 -0
- data/maps/un-urd-Arab-Latn-1972.imp +290 -0
- data/maps/var-amh-Ethi-Latn-eae-2003.imp +414 -0
- data/maps/var-gez-Ethi-Latn-eae-2003.imp +54 -0
- data/maps/var-hin-Deva-Latn-hunterian-1872.imp +212 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1886.imp +399 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1954.imp +382 -0
- data/maps/var-kor-Hang-Hang-jamo.imp +11196 -0
- data/maps/var-kor-Hang-Latn-mr-1939.imp +574 -0
- data/maps/var-kor-Kore-Hang-2013.imp +59764 -0
- data/maps/var-kor-Kore-Latn-mr-1939.imp +36 -0
- data/maps/var-mar-Deva-Latn-hunterian-1872.imp +39 -0
- data/maps/var-mon-Mong-Latn-1930.imp +101 -0
- data/maps/var-mon-Mong-Latn-lessing.imp +181 -0
- data/maps/var-mon-Mong-Latn-vpmc.imp +182 -0
- data/maps/var-pra-Deva-Latn-iast-1912.imp +36 -0
- data/maps/var-san-Deva-Latn-iast-1912.imp +147 -0
- data/maps/var-zho-Hani-Latn-wd-1979.imp +27549 -0
- metadata +335 -0
@@ -0,0 +1,63 @@
|
|
1
|
+
metadata {
|
2
|
+
authority_id: alalc
|
3
|
+
id: 2011
|
4
|
+
language: iso-639-2:sin
|
5
|
+
source_script: Sinh
|
6
|
+
destination_script: Latn
|
7
|
+
name: Sinhalese Romanization, 2011
|
8
|
+
url: https://www.loc.gov/catdir/cpso/romanization/sinhales.pdf
|
9
|
+
creation_date: 2011
|
10
|
+
description: |
|
11
|
+
ALA-LC Romanization table for Sinhalese
|
12
|
+
|
13
|
+
|
14
|
+
notes:
|
15
|
+
|
16
|
+
- Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
|
17
|
+
vowels following a consonant can be found in grammars; no distinction between the two is
|
18
|
+
made in transliteration.
|
19
|
+
|
20
|
+
- |
|
21
|
+
The vowel a is implicit after all consonants and consonant clusters and is supplied in
|
22
|
+
transliteration, with the following exceptions:
|
23
|
+
|
24
|
+
a) when another vowel is indicated by its appropriate sign; and
|
25
|
+
b) when the absence of any vowel is indicated by the sign ් called virāma.
|
26
|
+
|
27
|
+
- |
|
28
|
+
Exceptions: Anusvāra is transliterated by:
|
29
|
+
|
30
|
+
a) ṅ before gutturals,
|
31
|
+
b) ñ before palatals,
|
32
|
+
c) ṇ before cerebrals,
|
33
|
+
d) n before dentals, and
|
34
|
+
e) m before labials.
|
35
|
+
|
36
|
+
- |
|
37
|
+
Exceptions:
|
38
|
+
a) when saññaka represents a nasal, it is romanized according to the rule for anusvāra.
|
39
|
+
b) when saññaka is combined with an aspirated consonant, the combination is romanized as a non-aspirated, followed by an aspirated consonant.
|
40
|
+
}
|
41
|
+
|
42
|
+
tests {
|
43
|
+
test "හිටපු අග්රාමාත්ය රනිල් වික්රමසිංහ අප්රේල් 21 ප්රහාරය සම්බන්ධයෙන් විමර්ශනය කරන ජනාධිපති පරීක්ෂණ කොමිසම හමුවේ දෙවෙනි දිනටත් සාක්ෂි ලබාදීමට පැමිණෙයි", "hiṭapu agrāmātya ranil vikramasiṃha aprēl 21 prahāraya sambanandhayen vimarśanaya karana janādhipati parīkṣaṇa komisama hamuvē deveni dinaṭat sākṣi labādīmaṭa pămiṇeyi"
|
44
|
+
test "පෑලියගොඩ මත්ස්ය තොග වෙළෙදපොළට පිවිසෙන පිවිසුම් මාර්ගය පුළුල් කර සංවර්ධනයට පියවර - මහාමාර්ග අමාත්ය ජොන්ස්ටන් ප්රනාන්දු", "pâliyagoḍa matsya toga veḷedapoḷaṭa pivisena pivisum māraṅgaya puḷul kara saṃvarandhanayaṭa piyavara - mahāmāraṅga amātya jonsaṇṭan pranānandu"
|
45
|
+
test "මව්බිමටත් රට වැසියන්ටත් ආශිර්වාද කරමින් විශේෂ ආගමික වැඩසටහන් මාලාවක්", "mavbimaṭat raṭa văsiyanaṇṭat āśirvāda karamin viśēṣa āgamika văḍasaṭahan mālāvak"
|
46
|
+
test "මිනුවන්ගොඩ කොරෝනා පොකුරින් තවත් ආසාදිතයින් 49 දෙනකු හඳුනා ගෙන", "minuvanaṅgoḍa korōnā pokurin tavat āsāditayin 49 denaku handunā gena"
|
47
|
+
test "ඉරණවිල වෙරළේ නාඳුනන ධීවර යාත්රා දෙකක්", "iraṇavila veraḷē nāndunana dhīvara yātarā dekak"
|
48
|
+
test "මඩකලපුව මංගලාරාමේ හාමුදුරුවන්ට මරණ තර්ජන - ආරක්ෂාවත් අඩුකරලා", "maḍakalapuva maṃgalārāmē hāmuduruvanaṇṭa maraṇa tarañjana - ārakṣāvat aḍukaralā"
|
49
|
+
test "හොරට කහ කුඩු හැදූ දෙදෙනෙක් බඩුත් එක්ක දැලේ", "horaṭa kaha kuḍu hădū dedenek baḍut ekaṅka dălē"
|
50
|
+
test "ඉංගිරියේ ජලභීතිකාව වැළඳුනු නරියෙකු තෙදිනක මෙහෙයුමකින් අල්ලා ගනී", "iṃgiriyē jalabhītikāva văḷandunu nariyeku tedinaka meheyumakin allā ganī"
|
51
|
+
test "බෞද්ධ දර්ශනයට අනුව අපි උපයන ධනය බුද්ධිමත් ලෙස විසර්ජනය කරන්නේ කෙසේ ද?", "baudandha darśanayaṭa anuva api upayana dhanaya budandhimat lesa visarañjanaya karanannē kesē da?"
|
52
|
+
test "ඉන්දීය ජාතිකයන් සමග එක්වන මන්නාරමේ ධීවරයන්ට අනතුරු අගවයි", "inandīya jātikayan samaga ekvana manannāramē dhīvarayanaṇṭa anaturu agavayi"
|
53
|
+
test "තේ නැවත වගාවට පෙර පස පුනරුත්ථාපනයට කෙටි මග", "tē năvata vagāvaṭa pera pasa punarutanthāpanayaṭa keṭi maga"
|
54
|
+
}
|
55
|
+
|
56
|
+
dependency "alalc-sin-Sinh-Latn-1997", as: sinhlatn
|
57
|
+
|
58
|
+
stage {
|
59
|
+
|
60
|
+
run map.sinhlatn.stage.main
|
61
|
+
|
62
|
+
}
|
63
|
+
|
@@ -0,0 +1,124 @@
|
|
1
|
+
metadata {
|
2
|
+
authority_id: alalc
|
3
|
+
id: 1997
|
4
|
+
language: iso-639-2:srp
|
5
|
+
source_script: Cyrl
|
6
|
+
destination_script: Latn
|
7
|
+
name: Serbian and Macedonian Romanization, ALA-LC 1997 System
|
8
|
+
url: http://catdir.loc.gov/catdir/cpso/romanization/serbian.pdf
|
9
|
+
creation_date: 1997
|
10
|
+
description: ALA-LC Romanization table for Serbian and Macedonian.
|
11
|
+
|
12
|
+
notes:
|
13
|
+
- Special characters in romanization
|
14
|
+
Đ - D with crossbar (upper case). USMARC hexadecimal code A3.
|
15
|
+
đ - d with crossbar (lower case). USMARC hexadecimal code B3.
|
16
|
+
|
17
|
+
- Character modifiers in romanization
|
18
|
+
´ - acute. USMARC hexadecimal code E2.
|
19
|
+
ˇ - hachek. USMARC hexadecimal code E9.
|
20
|
+
}
|
21
|
+
|
22
|
+
tests {
|
23
|
+
test "Општина Ердут", "Opština Erdut"
|
24
|
+
test "Општина Двор", "Opština Dvor"
|
25
|
+
test "ЛУЃЕ луѓе", "LUǴE luǵe"
|
26
|
+
test "ЅВЕЗДА ѕвезда Ѕвезда", "DZVEZDA dzvezda Dzvezda"
|
27
|
+
test "ЌАРУВАЊЕ ќарување", "ḰARUVANJE ḱaruvanje"
|
28
|
+
}
|
29
|
+
|
30
|
+
dependency "posix", import: true
|
31
|
+
|
32
|
+
stage {
|
33
|
+
|
34
|
+
|
35
|
+
# CHARACTERS
|
36
|
+
parallel {
|
37
|
+
sub "А", "A"
|
38
|
+
sub "Б", "B"
|
39
|
+
sub "В", "V"
|
40
|
+
sub "Г", "G"
|
41
|
+
sub "Ѓ", "Ǵ" # Ǵ
|
42
|
+
sub "Д", "D"
|
43
|
+
sub "Ђ", "Đ" # Đ
|
44
|
+
sub "Е", "E"
|
45
|
+
sub "Ж", "Ž" # Ž
|
46
|
+
sub "З", "Z"
|
47
|
+
sub "Ѕ", "Dz"
|
48
|
+
sub "И", "I"
|
49
|
+
sub "Ј", "J"
|
50
|
+
sub "К", "K"
|
51
|
+
sub "Ќ", "Ḱ" # Ḱ
|
52
|
+
sub "Л", "L"
|
53
|
+
sub "Љ", "Lj"
|
54
|
+
sub "М", "M"
|
55
|
+
sub "Н", "N"
|
56
|
+
sub "Њ", "Nj"
|
57
|
+
sub "О", "O"
|
58
|
+
sub "П", "P"
|
59
|
+
sub "Р", "R"
|
60
|
+
sub "С", "S"
|
61
|
+
sub "Т", "T"
|
62
|
+
sub "Ћ", "Ć" # Ć
|
63
|
+
sub "У", "U"
|
64
|
+
sub "Ф", "F"
|
65
|
+
sub "Х", "H"
|
66
|
+
sub "Ц", "C"
|
67
|
+
sub "Ч", "Č" # Č
|
68
|
+
sub "Џ", "Dž" # Dž
|
69
|
+
sub "Ш", "Š" # Š
|
70
|
+
sub "а", "a"
|
71
|
+
sub "б", "b"
|
72
|
+
sub "в", "v"
|
73
|
+
sub "г", "g"
|
74
|
+
sub "ѓ", "ǵ" # ǵ
|
75
|
+
sub "д", "d"
|
76
|
+
sub "ђ", "đ" # đ
|
77
|
+
sub "е", "e"
|
78
|
+
sub "ж", "ž" # ž
|
79
|
+
sub "з", "z"
|
80
|
+
sub "ѕ", "dz"
|
81
|
+
sub "и", "i"
|
82
|
+
sub "ј", "j"
|
83
|
+
sub "к", "k"
|
84
|
+
sub "ќ", "ḱ" # ḱ
|
85
|
+
sub "л", "l"
|
86
|
+
sub "љ", "lj"
|
87
|
+
sub "м", "m"
|
88
|
+
sub "н", "n"
|
89
|
+
sub "њ", "nj"
|
90
|
+
sub "о", "o"
|
91
|
+
sub "п", "p"
|
92
|
+
sub "р", "r"
|
93
|
+
sub "с", "s"
|
94
|
+
sub "т", "t"
|
95
|
+
sub "ћ", "ć" # ć
|
96
|
+
sub "у", "u"
|
97
|
+
sub "ф", "f"
|
98
|
+
sub "х", "h"
|
99
|
+
sub "ц", "c"
|
100
|
+
sub "ч", "č" # č
|
101
|
+
sub "џ", "dž" # dž
|
102
|
+
sub "ш", "š" # š
|
103
|
+
}
|
104
|
+
# POSTRULES
|
105
|
+
# rewritten by hand to work properly
|
106
|
+
# DZ
|
107
|
+
sub capture(maybe(upper)) + "Dz" + capture(upper), ref(1) + "DZ" + ref(2)
|
108
|
+
sub capture(upper) + "Dz" + capture(maybe(upper)), ref(1) + "DZ" + ref(2)
|
109
|
+
|
110
|
+
#LJ
|
111
|
+
sub capture(upper) + "Lj" + capture(maybe(upper)), ref(1) + "LJ" + ref(2)
|
112
|
+
sub capture(maybe(upper)) + "Lj" + capture(upper), ref(1) + "LJ" + ref(2)
|
113
|
+
|
114
|
+
#NJ
|
115
|
+
sub capture(upper) + "Nj" + capture(maybe(upper)), ref(1) + "NJ" + ref(2)
|
116
|
+
sub capture(maybe(upper)) + "Nj" + capture(upper), ref(1) + "NJ" + ref(2)
|
117
|
+
|
118
|
+
#DŽ
|
119
|
+
sub capture(upper) + "Dž" + capture(maybe(upper)), ref(1) + "DŽ" + ref(2)
|
120
|
+
sub capture(maybe(upper)) + "Dž" + capture(upper), ref(1) + "DŽ" + ref(2)
|
121
|
+
|
122
|
+
compose
|
123
|
+
}
|
124
|
+
|
@@ -0,0 +1,115 @@
|
|
1
|
+
metadata {
|
2
|
+
authority_id: alalc
|
3
|
+
id: 2013
|
4
|
+
language: iso-639-2:srp
|
5
|
+
source_script: Cyrl
|
6
|
+
destination_script: Latn
|
7
|
+
name: ROMANIZATION OF SERBIAN, ALA-LC 2013 System
|
8
|
+
url: https://www.loc.gov/catdir/cpso/romanization/serbian.pdf
|
9
|
+
creation_date: 2013
|
10
|
+
description: |
|
11
|
+
Serbian uses the Cyrillic and Roman alphabets. When the Roman alphabet is used it is the same as Croatian.
|
12
|
+
}
|
13
|
+
|
14
|
+
tests {
|
15
|
+
test "Шупља Стена", "Šuplja Stena"
|
16
|
+
test "Чукарица", "Čukarica"
|
17
|
+
test "Црна Трава", "Crna Trava"
|
18
|
+
test "Херцег Нови", "Herceg Novi"
|
19
|
+
test "Улцињ", "Ulcinj"
|
20
|
+
test "Ужице", "Užice"
|
21
|
+
test "Тресаначка Река", "Tresanačka Reka"
|
22
|
+
test "Сјеница", "Sjenica"
|
23
|
+
test "Рожаје", "Rožaje"
|
24
|
+
test "Пљевља", "Pljevlja"
|
25
|
+
test "Оџаци", "Odžaci"
|
26
|
+
test "Никшић", "Nikšić"
|
27
|
+
test "Медвеђа", "Medveđa"
|
28
|
+
test "Лозница", "Loznica"
|
29
|
+
test "Књажевац", "Knjaževac"
|
30
|
+
test "Зрењанин", "Zrenjanin"
|
31
|
+
test "Житорађа", "Žitorađa"
|
32
|
+
test "Ервеник", "Ervenik"
|
33
|
+
test "Доње Љупче", "Donje Ljupče"
|
34
|
+
test "Гусиње", "Gusinje"
|
35
|
+
test "ГУСИЊЕ", "GUSINJE"
|
36
|
+
test "Врњачка Бања", "Vrnjačka Banja"
|
37
|
+
test "Бијело Поље", "Bijelo Polje"
|
38
|
+
test "Алибунар", "Alibunar"
|
39
|
+
}
|
40
|
+
|
41
|
+
aliases {
|
42
|
+
def_alias srp_multichar, any(["Lj", "Nj", "Dž"])
|
43
|
+
def_alias srp_latupper, any("A".."Z")
|
44
|
+
}
|
45
|
+
|
46
|
+
stage {
|
47
|
+
# CHARACTERS
|
48
|
+
parallel {
|
49
|
+
sub "А", "A"
|
50
|
+
sub "Б", "B"
|
51
|
+
sub "В", "V"
|
52
|
+
sub "Г", "G"
|
53
|
+
sub "Д", "D"
|
54
|
+
sub "Ђ", "Đ" # Đ
|
55
|
+
sub "Е", "E"
|
56
|
+
sub "Ж", "Ž" # Ž
|
57
|
+
sub "З", "Z"
|
58
|
+
sub "И", "I"
|
59
|
+
sub "Ј", "J"
|
60
|
+
sub "К", "K"
|
61
|
+
sub "Л", "L"
|
62
|
+
sub "Љ", "Lj"
|
63
|
+
sub "М", "M"
|
64
|
+
sub "Н", "N"
|
65
|
+
sub "Њ", "Nj"
|
66
|
+
sub "О", "O"
|
67
|
+
sub "П", "P"
|
68
|
+
sub "Р", "R"
|
69
|
+
sub "С", "S"
|
70
|
+
sub "Т", "T"
|
71
|
+
sub "Ћ", "Ć" # Ć
|
72
|
+
sub "У", "U"
|
73
|
+
sub "Ф", "F"
|
74
|
+
sub "Х", "H"
|
75
|
+
sub "Ц", "C"
|
76
|
+
sub "Ч", "Č" # Č
|
77
|
+
sub "Џ", "Dž" # Dž
|
78
|
+
sub "Ш", "Š" # Š
|
79
|
+
sub "а", "a"
|
80
|
+
sub "б", "b"
|
81
|
+
sub "в", "v"
|
82
|
+
sub "г", "g"
|
83
|
+
sub "д", "d"
|
84
|
+
sub "ђ", "đ" # đ
|
85
|
+
sub "е", "e"
|
86
|
+
sub "ж", "ž" # ž
|
87
|
+
sub "з", "z"
|
88
|
+
sub "и", "i"
|
89
|
+
sub "ј", "j"
|
90
|
+
sub "к", "k"
|
91
|
+
sub "л", "l"
|
92
|
+
sub "љ", "lj"
|
93
|
+
sub "м", "m"
|
94
|
+
sub "н", "n"
|
95
|
+
sub "њ", "nj"
|
96
|
+
sub "о", "o"
|
97
|
+
sub "п", "p"
|
98
|
+
sub "р", "r"
|
99
|
+
sub "с", "s"
|
100
|
+
sub "т", "t"
|
101
|
+
sub "ћ", "ć" # ć́
|
102
|
+
sub "у", "u"
|
103
|
+
sub "ф", "f"
|
104
|
+
sub "х", "h"
|
105
|
+
sub "ц", "c"
|
106
|
+
sub "ч", "č" # č
|
107
|
+
sub "џ", "dž" # dž
|
108
|
+
sub "ш", "š" # š
|
109
|
+
}
|
110
|
+
|
111
|
+
# POSTRULES
|
112
|
+
sub srp_multichar, upcase, before: srp_latupper
|
113
|
+
sub srp_multichar, upcase, after: srp_latupper
|
114
|
+
compose
|
115
|
+
}
|
@@ -0,0 +1,52 @@
|
|
1
|
+
metadata {
|
2
|
+
authority_id: alalc
|
3
|
+
id: 1997
|
4
|
+
language: iso-639-2:tam
|
5
|
+
source_script: Taml
|
6
|
+
destination_script: Latn
|
7
|
+
name: Tamil Romanization, 1997
|
8
|
+
url: http://catdir.loc.gov/catdir/cpso/romanization/tamil.pdf
|
9
|
+
creation_date: 1997
|
10
|
+
description: |
|
11
|
+
ALA-LC Romanization table for Tamil
|
12
|
+
|
13
|
+
notes:
|
14
|
+
|
15
|
+
- Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
|
16
|
+
vowels following a consonant can be found in grammars; no distinction between the two is
|
17
|
+
made in transliteration.
|
18
|
+
|
19
|
+
- |
|
20
|
+
The vowel a is implicit after all consonants and consonant clusters and is supplied in
|
21
|
+
transliteration, with the following exceptions:
|
22
|
+
|
23
|
+
a) when another vowel is indicated by its appropriate sign; and
|
24
|
+
b) when the absence of any vowel is indicated by the superscript dot ( ் ) called puḷḷi.
|
25
|
+
|
26
|
+
- This letter has the same form as the vowel sign for ā appearing after a consonant. Where ambiguity arises, it is written.
|
27
|
+
}
|
28
|
+
|
29
|
+
tests {
|
30
|
+
test "அழிந்து போன நகரத்தில் , தொலைந்து போன நான்", "aḻintu pōṉa nakarattil , tolaintu pōṉa nāṉ"
|
31
|
+
test "முதன் முதலாக - மை ஃபர்ஸ்ட் சோலோ ட்ராவல்", "mutaṉ mutalāka - mai ḵaparsṭ cōlō ṭrāval"
|
32
|
+
test "வாழ்க்கையில் அவன் போன முதல் சோலோ டிரிப் அது தான்.", "vāḻkkaiyil avaṉ pōṉa mutal cōlō ṭirip atu tāṉ."
|
33
|
+
test "ஸ்கூல் ப்ரெண்ட் கார்த்திக் வீட்டுக்கு போய்ட்டு", "skūl preṇṭ kārttik vīṭṭukku pōyṭṭu"
|
34
|
+
test "நாசா வெளியிட்ட வெடிக்கும் நட்சத்திரத்தின் வீடியோ", "nācā veḷiyiṭṭa veṭikkum naṭcattirattiṉ vīṭiyō"
|
35
|
+
test "நாசா வெளியிட்ட வெடிக்கும் நட்சத்திரத்தின் வீடியோ", "nācā veḷiyiṭṭa veṭikkum naṭcattirattiṉ vīṭiyō"
|
36
|
+
test "டார்பிடோவை ஏவ உதவும் சூப்பர்சானிக் ஏவுகணையான ஸ்மார்ட் சோதனை வெற்றி", "ṭārpiṭōvai ēva utavum cūpparcāṉik ēvukaṇaiyāṉa smārṭ cōtaṉai veṟṟi"
|
37
|
+
test "இந்த ஆண்டு மருத்துவத்துக்கான நோபல் பரிசு பெறுபவர்களின் பெயர்கள் அறிவிப்பு", "inta āṇṭu maruttuvattukkāṉa nōpal paricu peṟupavarkaḷiṉ peyarkaḷ aṟivippu"
|
38
|
+
test "மல்லையா விவகாரம்: பிரிட்டன் அரசின் நடவடிக்கைகள் தங்களுக்கு தெரியவில்லை - மத்திய அரசு தகவல்", "mallaiyā vivakāram: piriṭṭaṉ araciṉ naṭavaṭikkaikaḷ taṅkaḷukku teriyavillai - mattiya aracu takaval"
|
39
|
+
test "ஆலோசனைக்குப் பிறகு தேனியில் இருந்து சென்னை புறப்பட்டார் துணை முதலமைச்சர் பன்னீர்செல்வம்", "ālōcaṉaikkup piṟaku tēṉiyil iruntu ceṉṉai puṟappaṭṭār tuṇai mutalamaiccar paṉṉīrcelvam"
|
40
|
+
test "இன்று தான் பேரன் பிறந்தநாள் முடிந்து ஃப்ரீ ஆகி இருக்கிறேன்", "iṉṟu tāṉ pēraṉ piṟantanāḷ muṭintu ḵaprī āki irukkiṟēṉ"
|
41
|
+
}
|
42
|
+
|
43
|
+
dependency "din-tam-Taml-Latn-33903-2016", as: tamllatn
|
44
|
+
|
45
|
+
stage {
|
46
|
+
# CHARACTERS
|
47
|
+
parallel {
|
48
|
+
sub "ஃ", "ḵa"
|
49
|
+
}
|
50
|
+
|
51
|
+
run map.tamllatn.stage.main
|
52
|
+
}
|
@@ -0,0 +1,49 @@
|
|
1
|
+
metadata {
|
2
|
+
authority_id: alalc
|
3
|
+
id: 2011
|
4
|
+
language: iso-639-2:tam
|
5
|
+
source_script: Taml
|
6
|
+
destination_script: Latn
|
7
|
+
name: Tamil Romanization, 2011
|
8
|
+
url: https://www.loc.gov/catdir/cpso/romanization/tamil.pdf
|
9
|
+
creation_date: 2011
|
10
|
+
description: |
|
11
|
+
ALA-LC Romanization table for Tamil
|
12
|
+
|
13
|
+
notes:
|
14
|
+
|
15
|
+
- Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
|
16
|
+
vowels following a consonant can be found in grammars; no distinction between the two is
|
17
|
+
made in transliteration.
|
18
|
+
|
19
|
+
- |
|
20
|
+
The vowel a is implicit after all consonants and consonant clusters and is supplied in
|
21
|
+
transliteration, with the following exceptions:
|
22
|
+
|
23
|
+
a) when another vowel is indicated by its appropriate sign; and
|
24
|
+
b) when the absence of any vowel is indicated by the superscript dot ( ் ) called puḷḷi.
|
25
|
+
|
26
|
+
- This letter has the same form as the vowel sign for ā appearing after a consonant. Where ambiguity arises, it is written.
|
27
|
+
}
|
28
|
+
|
29
|
+
tests {
|
30
|
+
test "மலையாள நடிகர் சங்கத்திலிருந்து நடிகை பார்வதி திடீர் விலகல்.", "malaiyāḷa naṭikar caṅkattiliruntu naṭikai pārvati tiṭīr vilakal."
|
31
|
+
test "சச்சின் டெண்டுல்கரை அலுவலக உதவியாளராக நியமிப்பீர்களா?", "cacciṉ ṭeṇṭulkarai aluvalaka utaviyāḷarāka niyamippīrkaḷā?"
|
32
|
+
test "அமீரகத்தில் தொலைநோக்கி இல்லாமல் நாளை பார்க்கலாம்", "amīrakattil tolainōkki illāmal nāḷai pārkkalām"
|
33
|
+
test "லடாக் யூனியன் பிரதேசம் இந்தியா சட்டவிரோதமாக நிறுவிய ஒரு பகுதி- சீனா மீண்டும் பிடிவாதம்", "laṭāk yūṉiyaṉ piratēcam intiyā caṭṭavirōtamāka niṟuviya oru pakuti- cīṉā mīṇṭum piṭivātam"
|
34
|
+
test "பாலியல் குற்றங்களில் ஈடுபடுவோருக்கு மரண தண்டனை புதிய சட்டம்", "pāliyal kuṟṟaṅkaḷil īṭupaṭuvōrukku maraṇa taṇṭaṉai putiya caṭṭam"
|
35
|
+
test "புதுடெல்லி", "putuṭelli"
|
36
|
+
test "அப்படி விளம்பரத்தில என்ன இருக்கு...?", "appaṭi viḷamparattila eṉṉa irukku...?"
|
37
|
+
test "பூமிக்கும், செவ்வாய் கிரகத்துக்கும் இடையிலான அதிகபட்ச தூரம் ௪௦ கோடியே ௧௩ லட்சம் கி.மீ தொலைவு ஆகும்.", "pūmikkum, cevvāy kirakattukkum iṭaiyilāṉa atikapaṭca tūram 40 kōṭiyē 13 laṭcam ki.mī tolaivu ākum."
|
38
|
+
test "அமீரகத்தில் செவ்வாய் கிரகம் குறித்த ஆய்வில் ஈடுபடுவோர் மற்றும் வானியல் நிபுணர்களுக்கு இது ஒரு நல்ல வாய்ப்பாக அமையும்.", "amīrakattil cevvāy kirakam kuṟitta āyvil īṭupaṭuvōr maṟṟum vāṉiyal nipuṇarkaḷukku itu oru nalla vāyppāka amaiyum."
|
39
|
+
test "நள்ளிரவு நேரமாக இருந்தால் நமது தலைக்கு மேலே காணலாம். காலை நேரத்தில் மேற்கு மற்றும் தென்மேற்கு திசையில் செவ்வாய் கிரகத்தை பார்க்கலாம்.", "naḷḷiravu nēramāka iruntāl namatu talaikku mēlē kāṇalām. kālai nērattil mēṟku maṟṟum teṉmēṟku ticaiyil cevvāy kirakattai pārkkalām."
|
40
|
+
test "வெறும் கண்ணால் பார்க்கும்போது புள்ளியாக ஆரஞ்சு நிறத்தில் பிரகாசமாக தெரியும்.", "veṟum kaṇṇāl pārkkumpōtu puḷḷiyāka ārañcu niṟattil pirakācamāka teriyum."
|
41
|
+
}
|
42
|
+
|
43
|
+
dependency "alalc-tam-Taml-Latn-1997", as: tamllatn
|
44
|
+
|
45
|
+
stage {
|
46
|
+
|
47
|
+
run map.tamllatn.stage.main
|
48
|
+
|
49
|
+
}
|
@@ -0,0 +1,237 @@
|
|
1
|
+
metadata {
|
2
|
+
authority_id: alalc
|
3
|
+
id: 1997
|
4
|
+
language: iso-639-2:tel
|
5
|
+
source_script: Telu
|
6
|
+
destination_script: Latn
|
7
|
+
name: Telugu Romanization, 1997
|
8
|
+
url: http://catdir.loc.gov/catdir/cpso/romanization/telugu.pdf
|
9
|
+
creation_date: 1997
|
10
|
+
description: |
|
11
|
+
ALA-LC Romanization table for Telugu
|
12
|
+
|
13
|
+
notes:
|
14
|
+
|
15
|
+
- |
|
16
|
+
Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
|
17
|
+
vowels following a consonant can be found in grammars; no distinction between the two is
|
18
|
+
made in transliteration.
|
19
|
+
- |
|
20
|
+
The vowel a is implicit after all consonants and consonant clusters and is supplied in
|
21
|
+
transliteration, with the following exceptions:
|
22
|
+
a) when another vowel is indicated by its appropriate sign; and
|
23
|
+
b) when the absence of any vowel is indicated by the superscript sign ( ్ ) called valapalagilaka.
|
24
|
+
- |
|
25
|
+
Exception: Sunna is transliterated by:
|
26
|
+
a) ṅ before gutturals,
|
27
|
+
b) ñ before palatals,
|
28
|
+
c) ṇ before cerebrals,
|
29
|
+
d) n before dentals, and
|
30
|
+
e) m before labials.
|
31
|
+
- |
|
32
|
+
Ardhasunna before gutturals and palatal, cerebral, and dental occlusives is transliterated n̐.
|
33
|
+
Before labials, sibilants, semivowels, the aspirate, vowels, and in final position it is
|
34
|
+
transliterated m̐.
|
35
|
+
}
|
36
|
+
|
37
|
+
tests {
|
38
|
+
test "తమిళనాడు", "tamiḷanāḍu"
|
39
|
+
test "తంటికొండ ఘటన: ఆగని మృత్యుఘోష", "taṃṭikoṇḍa ghaṭana: āgani mṛtayughŏṣa"
|
40
|
+
test "మళ్లీ వివాదం: అమితాబ్పై కేసు", "maḷalī vivādaṃ: amitābapai kēsu"
|
41
|
+
test "‘వరద సాయం పేరుతో వైట్ కాలర్ దోపిడీ’", "‘varada sāyaṃ pērutŏ vaiṭa kālara dŏpiḍī’"
|
42
|
+
test "రెండో విడత జీఎస్టీ పరిహారం", "reṃḍŏ viḍata jīesaṭī parihāraṃ"
|
43
|
+
test "నితీష్ కుమార్ అధ్యాయం ముగిసినట్లేనా?!", "nitīṣa kumāra adhayāyaṃ mugisinaṭalēnā?!"
|
44
|
+
test "వారిపై జీవితాంతం నిషేధం విధించండి!", "vāripai jīvitāntaṃ niṣēdhaṃ vidhiñcaṃḍi!"
|
45
|
+
test "మరో లాక్డౌన్ వల్ల అన్నీ అనర్థాలే!", "marŏ lākaḍauna valala ananī anarathālē!"
|
46
|
+
test "జెసిండా మరో సంచలనం", "jesiṃḍā marŏ sañcalanaṃ"
|
47
|
+
test "స్వీయ నిర్బంధంలోకి డబ్ల్యూహెచ్ఓ డైరెక్టర్", "savīya nirabandhaṃlŏki ḍabalayūhecaō ḍairekaṭara"
|
48
|
+
test "కరోనాపై యుద్ధంలో సమిధలు", "karŏnāpai yudadhaṃlŏ samidhalu"
|
49
|
+
test "అమెరికా ఎన్నికలు: ‘పెద్దన్న’ ఎవరో?!", "amerikā enanikalu: ‘pedadanana’ evarŏ?!"
|
50
|
+
test "౪౬౨౬౯", "46269"
|
51
|
+
}
|
52
|
+
|
53
|
+
aliases {
|
54
|
+
# Characters that, when they follow a consonant, suppress the implicit "a" (see rule II).
# NOTE(review): the last entry, \u0c6c, is the character mapped to "6" under "# numbers";
# the halanta \u0c4d may have been intended here — confirm against the romanization table.
def_alias telu_chars_1, any("\u0c3e\u0c3f\u0c40\u0c41\u0c42\u0c43\u0c46\u0c47\u0c48\u0c4a\u0c4b\u0c4c\u0c6c")
|
55
|
+
}
|
56
|
+
|
57
|
+
stage {
|
58
|
+
|
59
|
+
# RULES
|
60
|
+
# rule II
|
61
|
+
sub "క", "k", after: telu_chars_1
|
62
|
+
sub "ఖ", "kh", after: telu_chars_1
|
63
|
+
sub "గ", "g", after: telu_chars_1
|
64
|
+
sub "ఘ", "gh", after: telu_chars_1
|
65
|
+
sub "ఙ", "ṅ", after: telu_chars_1
|
66
|
+
sub "చ", "c", after: telu_chars_1
|
67
|
+
sub "ౘ", "ĉ", after: telu_chars_1
|
68
|
+
sub "ఛ", "ch", after: telu_chars_1
|
69
|
+
sub "జ", "j", after: telu_chars_1
|
70
|
+
sub "ౙ", "ĵ", after: telu_chars_1
|
71
|
+
sub "ఝ", "jh", after: telu_chars_1
|
72
|
+
sub "ఞ", "ñ", after: telu_chars_1
|
73
|
+
sub "ట", "ṭ", after: telu_chars_1
|
74
|
+
sub "ఠ", "ṭh", after: telu_chars_1
|
75
|
+
sub "డ", "ḍ", after: telu_chars_1
|
76
|
+
sub "ఢ", "ḍh", after: telu_chars_1
|
77
|
+
sub "ణ", "ṇ", after: telu_chars_1
|
78
|
+
sub "త", "t", after: telu_chars_1
|
79
|
+
sub "థ", "th", after: telu_chars_1
|
80
|
+
sub "ద", "d", after: telu_chars_1
|
81
|
+
sub "ధ", "dh", after: telu_chars_1
|
82
|
+
sub "న", "n", after: telu_chars_1
|
83
|
+
sub "ప", "p", after: telu_chars_1
|
84
|
+
sub "ఫ", "ph", after: telu_chars_1
|
85
|
+
sub "బ", "b", after: telu_chars_1
|
86
|
+
sub "భ", "bh", after: telu_chars_1
|
87
|
+
sub "మ", "m", after: telu_chars_1
|
88
|
+
sub "య", "y", after: telu_chars_1
|
89
|
+
sub "ర", "r", after: telu_chars_1
|
90
|
+
sub "ఱ", "ṛ", after: telu_chars_1
|
91
|
+
sub "ల", "l", after: telu_chars_1
|
92
|
+
sub "ళ", "ḷ", after: telu_chars_1
|
93
|
+
sub "వ", "v", after: telu_chars_1
|
94
|
+
sub "శ", "ś", after: telu_chars_1
|
95
|
+
sub "ష", "ṣ", after: telu_chars_1
|
96
|
+
sub "స", "s", after: telu_chars_1
|
97
|
+
sub "హ", "h", after: telu_chars_1
|
98
|
+
|
99
|
+
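# rule III
# NOTE(review): these sunna rules run after rule II, which has already romanized every
# consonant that carries a vowel sign, so the lookahead below only sees bare consonants.
# A sunna before such a consonant falls through to "ṃ" (the tests expect "reṃḍŏ") —
# confirm this ordering is intended.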
|
100
|
+
sub "\u0C02", "ṅ", after: any("కఖగఘఙ")
|
101
|
+
sub "\u0C02", "ñ", after: any("చౘఛజౙఝఞ")
|
102
|
+
sub "\u0C02", "ṇ", after: any("టఠడఢణ")
|
103
|
+
sub "\u0C02", "n", after: any("తథదధన")
|
104
|
+
sub "\u0C02", "m", after: any("పఫబభమ")
|
105
|
+
|
106
|
+
# rule IV
|
107
|
+
sub "\u0C01", "n̐", after: any("కఖగఘఙచౘఛజౙఝఞటఠడఢణతథదధన") # before guttural, palatal, cerebral, and dental
|
108
|
+
|
109
|
+
|
110
|
+
# CHARACTERS
|
111
|
+
parallel {
|
112
|
+
|
113
|
+
sub "అ", "a"
|
114
|
+
sub "ఆ", "ā"
|
115
|
+
sub "ఇ", "i"
|
116
|
+
sub "ఈ", "ī"
|
117
|
+
sub "ఉ", "u"
|
118
|
+
sub "ఊ", "ū"
|
119
|
+
sub "ఋ", "ṛ"
|
120
|
+
sub "ౠ", "ṝ"
|
121
|
+
sub "ఌ", "ḻ"
|
122
|
+
sub "ఎ", "e"
|
123
|
+
sub "ఏ", "ē"
|
124
|
+
sub "ఐ", "ai"
|
125
|
+
sub "ఒ", "o"
|
126
|
+
sub "ఓ", "ō"
|
127
|
+
sub "ఔ", "au"
|
128
|
+
|
129
|
+
# Gutturals
|
130
|
+
sub "క", "ka"
|
131
|
+
sub "ఖ", "kha"
|
132
|
+
sub "గ", "ga"
|
133
|
+
sub "ఘ", "gha"
|
134
|
+
sub "ఙ", "ṅa"
|
135
|
+
|
136
|
+
# Palatals
|
137
|
+
sub "చ", "ca"
|
138
|
+
sub "ౘ", "ĉa"
|
139
|
+
sub "ఛ", "cha"
|
140
|
+
sub "జ", "ja"
|
141
|
+
sub "ౙ", "ĵa"
|
142
|
+
sub "ఝ", "jha"
|
143
|
+
sub "ఞ", "ña"
|
144
|
+
|
145
|
+
# Cerebrals
|
146
|
+
sub "ట", "ṭa"
|
147
|
+
sub "ఠ", "ṭha"
|
148
|
+
sub "డ", "ḍa"
|
149
|
+
sub "ఢ", "ḍha"
|
150
|
+
sub "ణ", "ṇa"
|
151
|
+
|
152
|
+
# Dentals
|
153
|
+
sub "త", "ta"
|
154
|
+
sub "థ", "tha"
|
155
|
+
sub "ద", "da"
|
156
|
+
sub "ధ", "dha"
|
157
|
+
sub "న", "na"
|
158
|
+
|
159
|
+
# Labials
|
160
|
+
sub "ప", "pa"
|
161
|
+
sub "ఫ", "pha"
|
162
|
+
sub "బ", "ba"
|
163
|
+
sub "భ", "bha"
|
164
|
+
sub "మ", "ma"
|
165
|
+
|
166
|
+
# Semivowels
|
167
|
+
sub "య", "ya"
|
168
|
+
sub "ర", "ra"
|
169
|
+
sub "ఱ", "ṛa"
|
170
|
+
sub "ల", "la"
|
171
|
+
sub "ళ", "ḷa"
|
172
|
+
sub "వ", "va"
|
173
|
+
|
174
|
+
# Sibilants
|
175
|
+
sub "శ", "śa"
|
176
|
+
sub "ష", "ṣa"
|
177
|
+
sub "స", "sa"
|
178
|
+
|
179
|
+
|
180
|
+
|
181
|
+
# Aspirate
|
182
|
+
sub "హ", "ha"
|
183
|
+
|
184
|
+
|
185
|
+
|
186
|
+
# Chandrabindu
|
187
|
+
sub "ঁ", "m̐"
|
188
|
+
sub "ఁ", "m̐"
|
189
|
+
|
190
|
+
# Bisarga
|
191
|
+
sub "ః", "ḥ"
|
192
|
+
|
193
|
+
# Anusvāra
|
194
|
+
sub "ం", "ṃ"
|
195
|
+
|
196
|
+
# Medials # Needed for connecting consonants
|
197
|
+
|
198
|
+
sub "ా", "ā"
|
199
|
+
sub "ి", "i"
|
200
|
+
sub "ీ", "ī"
|
201
|
+
sub "ు", "u"
|
202
|
+
sub "ూ", "ū"
|
203
|
+
sub "ృ", "ṛ"
|
204
|
+
sub "ె", "e"
|
205
|
+
sub "ే", "ē"
|
206
|
+
sub "ై", "ai"
|
207
|
+
sub "ొ", "o"
|
208
|
+
sub "ో", "ŏ" # NOTE(review): the independent vowel "ఓ" above maps to "ō" while this sign maps to "ŏ" (the tests expect "ŏ") — confirm against the ALA-LC table
|
209
|
+
sub "ౌ", "au"
|
210
|
+
sub "\u09CD", "" # Used for joining; NOTE(review): U+09CD is the Bengali virama, not a Telugu code point — confirm it is needed in this map
|
211
|
+
|
212
|
+
|
213
|
+
sub "\u0c4d", "" # virama sign (halanta): dropped from the output
|
214
|
+
sub "ౕ\t", "" # NOTE(review): the pattern is the length mark followed by a tab ("\t"), so the mark on its own is not matched — confirm the tab is intended
|
215
|
+
sub "ౖ\t", "" # NOTE(review): the pattern is the ai length mark followed by a tab ("\t"), so the mark on its own is not matched — confirm the tab is intended
|
216
|
+
sub "्", ""
|
217
|
+
sub "़", ""
|
218
|
+
sub "\u200D", "" # Used for joining: strip the zero-width joiner (written as an escape so the pattern is visible)
|
219
|
+
sub "\u200C", "" # Used for non joining: strip the zero-width non-joiner (written as an escape so the pattern is visible)
|
220
|
+
|
221
|
+
# numbers
|
222
|
+
|
223
|
+
sub "౦", "0"
|
224
|
+
sub "౧", "1"
|
225
|
+
sub "౨", "2"
|
226
|
+
sub "౩", "3"
|
227
|
+
sub "౪", "4"
|
228
|
+
sub "౫", "5"
|
229
|
+
sub "౬", "6"
|
230
|
+
sub "౭", "7"
|
231
|
+
sub "౮", "8"
|
232
|
+
sub "౯", "9"
|
233
|
+
}
|
234
|
+
|
235
|
+
compose
|
236
|
+
}
|
237
|
+
|