interscript-maps 2.0.5
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +7 -0
- data/README.adoc +28 -0
- data/interscript-maps.gemspec +28 -0
- data/interscript-maps.yaml +235 -0
- data/libs/posix.iml +11 -0
- data/libs/unicode.iml +13 -0
- data/libs/var-Cyrl.iml +7 -0
- data/libs/var-kor.iml +17 -0
- data/maps-staging/royin-tha-Thai-Latn-1939-generic.imp +98 -0
- data/maps-staging/royin-tha-Thai-Latn-1968.imp +156 -0
- data/maps-staging/royin-tha-Thai-Latn-1999-chained.imp +161 -0
- data/maps-staging/royin-tha-Thai-Latn-1999.imp +78 -0
- data/maps-staging/var-tha-Thai-Thai-phonemic.imp +53 -0
- data/maps-staging/var-tha-Thai-Zsym-ipa.imp +273 -0
- data/maps/acadsin-zho-Hani-Latn-2002.imp +27515 -0
- data/maps/alalc-amh-Ethi-Latn-1997.imp +392 -0
- data/maps/alalc-amh-Ethi-Latn-2011.imp +85 -0
- data/maps/alalc-ara-Arab-Latn-1997.imp +1171 -0
- data/maps/alalc-asm-Deva-Latn-1997.imp +214 -0
- data/maps/alalc-asm-Deva-Latn-2012.imp +53 -0
- data/maps/alalc-aze-Arab-Latn-1997.imp +321 -0
- data/maps/alalc-aze-Cyrl-Latn-1997.imp +101 -0
- data/maps/alalc-bel-Cyrl-Latn-1997.imp +118 -0
- data/maps/alalc-ben-Beng-Latn-1997.imp +225 -0
- data/maps/alalc-ben-Beng-Latn-2017.imp +135 -0
- data/maps/alalc-bul-Cyrl-Latn-1997.imp +110 -0
- data/maps/alalc-div-Thaa-Latn-1997.imp +171 -0
- data/maps/alalc-ell-Grek-Latn-1997.imp +381 -0
- data/maps/alalc-ell-Grek-Latn-2010.imp +382 -0
- data/maps/alalc-guj-Gujr-Latn-1997.imp +223 -0
- data/maps/alalc-guj-Gujr-Latn-2011.imp +57 -0
- data/maps/alalc-hin-Deva-Latn-1997.imp +248 -0
- data/maps/alalc-hin-Deva-Latn-2011.imp +63 -0
- data/maps/alalc-kan-Kana-Latn-1997.imp +233 -0
- data/maps/alalc-kan-Kana-Latn-2011.imp +58 -0
- data/maps/alalc-kat-Geok-Latn-1997.imp +109 -0
- data/maps/alalc-kat-Geor-Latn-1997.imp +104 -0
- data/maps/alalc-kor-Hang-Latn-1997.imp +68 -0
- data/maps/alalc-mal-Mlym-Latn-1997.imp +260 -0
- data/maps/alalc-mal-Mlym-Latn-2012.imp +65 -0
- data/maps/alalc-mar-Deva-Latn-1997.imp +178 -0
- data/maps/alalc-mar-Deva-Latn-2011.imp +51 -0
- data/maps/alalc-mkd-Cyrl-Latn-1997.imp +125 -0
- data/maps/alalc-mkd-Cyrl-Latn-2013.imp +113 -0
- data/maps/alalc-mon-Cyrl-Latn-1997.imp +161 -0
- data/maps/alalc-ori-Orya-Latn-1997.imp +234 -0
- data/maps/alalc-ori-Orya-Latn-2011.imp +59 -0
- data/maps/alalc-pan-Guru-Latn-1997.imp +241 -0
- data/maps/alalc-pan-Guru-Latn-2011.imp +71 -0
- data/maps/alalc-per-Arab-Latn-1997.imp +318 -0
- data/maps/alalc-pli-Deva-Latn-2012.imp +140 -0
- data/maps/alalc-pra-Deva-Latn-2012.imp +52 -0
- data/maps/alalc-rus-Cyrl-Latn-1997.imp +165 -0
- data/maps/alalc-rus-Cyrl-Latn-2012.imp +107 -0
- data/maps/alalc-san-Deva-Latn-2012.imp +207 -0
- data/maps/alalc-sin-Sinh-Latn-1997.imp +246 -0
- data/maps/alalc-sin-Sinh-Latn-2011.imp +63 -0
- data/maps/alalc-srp-Cyrl-Latn-1997.imp +124 -0
- data/maps/alalc-srp-Cyrl-Latn-2013.imp +115 -0
- data/maps/alalc-tam-Taml-Latn-1997.imp +52 -0
- data/maps/alalc-tam-Taml-Latn-2011.imp +49 -0
- data/maps/alalc-tel-Telu-Latn-1997.imp +237 -0
- data/maps/alalc-tel-Telu-Latn-2011.imp +58 -0
- data/maps/alalc-ukr-Cyrl-Latn-1997.imp +123 -0
- data/maps/alalc-ukr-Cyrl-Latn-2011.imp +32 -0
- data/maps/apcbg-bul-Cyrl-Latn-1995.imp +194 -0
- data/maps/az-aze-Cyrl-Latn-1939.imp +105 -0
- data/maps/az-aze-Cyrl-Latn-1958.imp +50 -0
- data/maps/bas-rus-Cyrl-Latn-2017-bss.imp +160 -0
- data/maps/bas-rus-Cyrl-Latn-2017-oss.imp +165 -0
- data/maps/bgn-jpn-Hrkt-Latn-1962.imp +288 -0
- data/maps/bgn-kor-Hang-Latn-1943.imp +31 -0
- data/maps/bgn-kor-Kore-Latn-1943.imp +33 -0
- data/maps/bgna-bul-Cyrl-Latn-2006.imp +119 -0
- data/maps/bgna-bul-Cyrl-Latn-2009.imp +119 -0
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +393 -0
- data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +472 -0
- data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +125 -0
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +111 -0
- data/maps/bgnpcgn-bak-Cyrl-Latn-2007.imp +169 -0
- data/maps/bgnpcgn-bal-Arab-Latn-2008.imp +296 -0
- data/maps/bgnpcgn-bel-Cyrl-Latn-1979.imp +200 -0
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +137 -0
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +38 -0
- data/maps/bgnpcgn-che-Cyrl-Latn-2008.imp +176 -0
- data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +56 -0
- data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +90 -0
- data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +71 -0
- data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +443 -0
- data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +269 -0
- data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +41 -0
- data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +28 -0
- data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +111 -0
- data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +42 -0
- data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +32 -0
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +191 -0
- data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +116 -0
- data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +43 -0
- data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +193 -0
- data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +170 -0
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +177 -0
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +40 -0
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +41 -0
- data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +240 -0
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +132 -0
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +174 -0
- data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +168 -0
- data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +208 -0
- data/maps/bgnpcgn-per-Arab-Latn-1958.imp +312 -0
- data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +552 -0
- data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +445 -0
- data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +289 -0
- data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +165 -0
- data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +133 -0
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +195 -0
- data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +48 -0
- data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +55 -0
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +146 -0
- data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +185 -0
- data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +188 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +136 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +88 -0
- data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +333 -0
- data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +145 -0
- data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +74 -0
- data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +7463 -0
- data/maps/bis-asm-Beng-Latn-13194-1991.imp +154 -0
- data/maps/bis-ben-Beng-Latn-13194-1991.imp +151 -0
- data/maps/bis-dev-Deva-Latn-13194-1991.imp +178 -0
- data/maps/bis-guj-Gujr-Latn-13194-1991.imp +172 -0
- data/maps/bis-kan-Kana-Latn-13194-1991.imp +166 -0
- data/maps/bis-mlm-Mlym-Latn-13194-1991.imp +170 -0
- data/maps/bis-ori-Orya-Latn-13194-1991.imp +168 -0
- data/maps/bis-pnj-Guru-Latn-13194-1991.imp +169 -0
- data/maps/bis-tel-Telu-Latn-13194-1991.imp +165 -0
- data/maps/bis-tml-Taml-Latn-13194-1991.imp +149 -0
- data/maps/by-bel-Cyrl-Latn-1998.imp +123 -0
- data/maps/by-bel-Cyrl-Latn-2007.imp +77 -0
- data/maps/din-grc-Grek-Latn-31634-2011-t1.imp +627 -0
- data/maps/din-hin-Deva-Latn-33904-2018.imp +101 -0
- data/maps/din-kat-Geor-Latn-32707-2010.imp +103 -0
- data/maps/din-mar-Deva-Latn-33904-2018.imp +83 -0
- data/maps/din-nep-Deva-Latn-33904-2018.imp +110 -0
- data/maps/din-pli-Deva-Latn-33904-2018.imp +72 -0
- data/maps/din-pra-Deva-Latn-33904-2018.imp +66 -0
- data/maps/din-san-Deva-Latn-33904-2018.imp +294 -0
- data/maps/din-tam-Taml-Latn-33903-2016.imp +187 -0
- data/maps/dos-nep-Deva-Latn-1997.imp +47 -0
- data/maps/elot-ell-Grek-Latn-743-1982-tl.imp +399 -0
- data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +397 -0
- data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +34 -0
- data/maps/elot-ell-Grek-Latn-743-2001-ts.imp +178 -0
- data/maps/ggg-kat-Geor-Latn-2002.imp +75 -0
- data/maps/gki-bel-Cyrl-Latn-1992.imp +44 -0
- data/maps/gki-bel-Cyrl-Latn-2000.imp +159 -0
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +179 -0
- data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.imp +132 -0
- data/maps/hk-yue-Hani-Latn-1888.imp +29201 -0
- data/maps/icao-bel-Cyrl-Latn-9303.imp +136 -0
- data/maps/icao-bul-Cyrl-Latn-9303.imp +127 -0
- data/maps/icao-fas-Arab-Latn-9303.imp +112 -0
- data/maps/icao-heb-Hebr-Latn-9303.imp +160 -0
- data/maps/icao-mkd-Cyrl-Latn-9303.imp +126 -0
- data/maps/icao-rus-Cyrl-Latn-9303.imp +126 -0
- data/maps/icao-srp-Cyrl-Latn-9303.imp +126 -0
- data/maps/icao-ukr-Cyrl-Latn-9303.imp +127 -0
- data/maps/iso-ara-Arab-Latn-233-1984.imp +301 -0
- data/maps/iso-asm-Beng-Latn-15919-2001.imp +73 -0
- data/maps/iso-ben-Beng-Latn-15919-2001.imp +171 -0
- data/maps/iso-ell-Grek-Latn-843-1997-t1.imp +365 -0
- data/maps/iso-ell-Grek-Latn-843-1997-t2.imp +43 -0
- data/maps/iso-guj-Gujr-Latn-15919-2001.imp +214 -0
- data/maps/iso-hin-Deva-Latn-15919-2001.imp +73 -0
- data/maps/iso-inc-Deva-Latn-15919-2001.imp +61 -0
- data/maps/iso-jpn-Hrkt-Latn-3602-1989.imp +59 -0
- data/maps/iso-kan-Kana-Latn-15919-2001.imp +212 -0
- data/maps/iso-kat-Geor-Latn-9984-1996.imp +103 -0
- data/maps/iso-kor-Hang-Latn-1996-method1.imp +140 -0
- data/maps/iso-kor-Hang-Latn-1996-method2.imp +132 -0
- data/maps/iso-mal-Mlym-Latn-15919-2001.imp +276 -0
- data/maps/iso-mar-Deva-Latn-15919-2001.imp +68 -0
- data/maps/iso-nep-Deva-Latn-15919-2001.imp +75 -0
- data/maps/iso-ori-Orya-Latn-15919-2001.imp +188 -0
- data/maps/iso-pan-Guru-Latn-15919-2001.imp +217 -0
- data/maps/iso-pli-Beng-Latn-15919-2001.imp +66 -0
- data/maps/iso-pli-Deva-Latn-15919-2001.imp +68 -0
- data/maps/iso-pli-Sinh-Latn-15919-2001.imp +211 -0
- data/maps/iso-pli-Thai-Latn-15919-2001.imp +47 -0
- data/maps/iso-pra-Deva-Latn-15919-2001.imp +60 -0
- data/maps/iso-prs-Arab-Latn-233-3-1999.imp +352 -0
- data/maps/iso-rus-Cyrl-Latn-9-1995.imp +279 -0
- data/maps/iso-san-Deva-Latn-15919-2001.imp +215 -0
- data/maps/iso-tam-Taml-Latn-15919-2001.imp +153 -0
- data/maps/iso-tel-Telu-Latn-15919-2001.imp +214 -0
- data/maps/iso-tha-Thai-Latn-11940-1998.imp +114 -0
- data/maps/kp-kor-Hang-Latn-2002.imp +540 -0
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +29005 -0
- data/maps/masm-mon-Cyrl-Latn-5217-2012.imp +136 -0
- data/maps/masm-mon-Latn-Cyrl-5217-2012.imp +162 -0
- data/maps/mext-jpn-Hrkt-Latn-1954.imp +403 -0
- data/maps/moct-kor-Hang-Latn-2000.imp +475 -0
- data/maps/mofa-jpn-Hrkt-Latn-1989.imp +484 -0
- data/maps/mv-div-Thaa-Latn-1987.imp +144 -0
- data/maps/mvd-bel-Cyrl-Latn-2008.imp +224 -0
- data/maps/mvd-bel-Cyrl-Latn-2010.imp +64 -0
- data/maps/mvd-rus-Cyrl-Latn-2008.imp +110 -0
- data/maps/mvd-rus-Cyrl-Latn-2010.imp +40 -0
- data/maps/odni-ara-Arab-Latn-2004.imp +106 -0
- data/maps/odni-ara-Arab-Latn-2015.imp +281 -0
- data/maps/odni-aze-Cyrl-Latn-2015.imp +158 -0
- data/maps/odni-bel-Cyrl-Latn-2015.imp +138 -0
- data/maps/odni-bul-Cyrl-Latn-2005.imp +90 -0
- data/maps/odni-bul-Cyrl-Latn-2015.imp +103 -0
- data/maps/odni-che-Cyrl-Latn-2015.imp +165 -0
- data/maps/odni-fas-Arab-Latn-2004.imp +268 -0
- data/maps/odni-fas-Arab-Latn-2015.imp +398 -0
- data/maps/odni-hin-Deva-Latn-2004.imp +180 -0
- data/maps/odni-hin-Deva-Latn-2015.imp +256 -0
- data/maps/odni-kat-Geor-Latn-2015.imp +76 -0
- data/maps/odni-kaz-Cyrl-Latn-2015.imp +164 -0
- data/maps/odni-kir-Cyrl-Latn-2015.imp +149 -0
- data/maps/odni-kor-Hang-Latn-2015.imp +307 -0
- data/maps/odni-mkd-Cyrl-Latn-2005.imp +28 -0
- data/maps/odni-mkd-Cyrl-Latn-2015.imp +124 -0
- data/maps/odni-prs-Arab-Latn-2004.imp +120 -0
- data/maps/odni-prs-Arab-Latn-2015.imp +225 -0
- data/maps/odni-pus-Arab-Latn-2011.imp +327 -0
- data/maps/odni-rus-Cyrl-Latn-2015.imp +79 -0
- data/maps/odni-srp-Cyrl-Latn-2005.imp +35 -0
- data/maps/odni-srp-Cyrl-Latn-2015.imp +130 -0
- data/maps/odni-tat-Cyrl-Latn-2015.imp +157 -0
- data/maps/odni-tgk-Cyrl-Latn-2015.imp +161 -0
- data/maps/odni-tuk-Cyrl-Latn-2015.imp +159 -0
- data/maps/odni-uig-Cyrl-Latn-2015.imp +151 -0
- data/maps/odni-ukr-Cyrl-Latn-2015.imp +136 -0
- data/maps/odni-urd-Arab-Latn-2015.imp +220 -0
- data/maps/odni-uzb-Cyrl-Latn-2015.imp +165 -0
- data/maps/sac-zho-Hans-Latn-1979.imp +20940 -0
- data/maps/sasm-mon-Mong-Latn-general-1978.imp +294 -0
- data/maps/sasm-mon-Mong-Latn-phonetic-1978.imp +261 -0
- data/maps/ses-ara-Arab-Latn-1930.imp +225 -0
- data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.imp +171 -0
- data/maps/ua-ukr-Cyrl-Latn-1996.imp +149 -0
- data/maps/ua-ukr-Cyrl-Latn-2007.imp +69 -0
- data/maps/ua-ukr-Cyrl-Latn-2010.imp +128 -0
- data/maps/un-amh-Ethi-Latn-2016.imp +483 -0
- data/maps/un-ara-Arab-Latn-1971.imp +137 -0
- data/maps/un-ara-Arab-Latn-1972.imp +155 -0
- data/maps/un-ara-Arab-Latn-2017.imp +375 -0
- data/maps/un-asm-Beng-Latn-1972.imp +188 -0
- data/maps/un-bel-Cyrl-Latn-2007.imp +78 -0
- data/maps/un-ben-Beng-Latn-2016.imp +516 -0
- data/maps/un-ell-Grek-Latn-1987-phonetic.imp +437 -0
- data/maps/un-ell-Grek-Latn-1987-tl.imp +27 -0
- data/maps/un-ell-Grek-Latn-1987-ts.imp +269 -0
- data/maps/un-guj-Gujr-Latn-1972.imp +196 -0
- data/maps/un-hin-Deva-Latn-2016.imp +356 -0
- data/maps/un-kan-Kana-Latn-2016.imp +214 -0
- data/maps/un-mal-Mlym-Latn-1972.imp +215 -0
- data/maps/un-mar-Deva-Latn-2016.imp +96 -0
- data/maps/un-mon-Mong-Latn-general-2013.imp +170 -0
- data/maps/un-mon-Mong-Latn-phonetic-2013.imp +170 -0
- data/maps/un-nep-Deva-Latn-1972.imp +295 -0
- data/maps/un-nep-Deva-Latn-2013.imp +62 -0
- data/maps/un-ori-Orya-Latn-1972.imp +208 -0
- data/maps/un-pan-Guru-Latn-1972.imp +321 -0
- data/maps/un-prs-Arab-Latn-1967.imp +214 -0
- data/maps/un-rus-Cyrl-Latn-1987.imp +96 -0
- data/maps/un-sin-Sinh-Latn-1972.imp +193 -0
- data/maps/un-tam-Taml-Latn-1972.imp +173 -0
- data/maps/un-tel-Telu-Latn-1972.imp +229 -0
- data/maps/un-ukr-Cyrl-Latn-1998.imp +58 -0
- data/maps/un-ukr-Cyrl-Latn-2012.imp +95 -0
- data/maps/un-urd-Arab-Latn-1972.imp +290 -0
- data/maps/var-amh-Ethi-Latn-eae-2003.imp +414 -0
- data/maps/var-gez-Ethi-Latn-eae-2003.imp +54 -0
- data/maps/var-hin-Deva-Latn-hunterian-1872.imp +212 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1886.imp +399 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1954.imp +382 -0
- data/maps/var-kor-Hang-Hang-jamo.imp +11196 -0
- data/maps/var-kor-Hang-Latn-mr-1939.imp +574 -0
- data/maps/var-kor-Kore-Hang-2013.imp +59764 -0
- data/maps/var-kor-Kore-Latn-mr-1939.imp +36 -0
- data/maps/var-mar-Deva-Latn-hunterian-1872.imp +39 -0
- data/maps/var-mon-Mong-Latn-1930.imp +101 -0
- data/maps/var-mon-Mong-Latn-lessing.imp +181 -0
- data/maps/var-mon-Mong-Latn-vpmc.imp +182 -0
- data/maps/var-pra-Deva-Latn-iast-1912.imp +36 -0
- data/maps/var-san-Deva-Latn-iast-1912.imp +147 -0
- data/maps/var-zho-Hani-Latn-wd-1979.imp +27549 -0
- metadata +335 -0
|
@@ -0,0 +1,356 @@
|
|
|
1
|
+
metadata {
|
|
2
|
+
authority_id: ungegn
|
|
3
|
+
id: 2016
|
|
4
|
+
language: iso-639-2:hin
|
|
5
|
+
source_script: Deva
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Hindi Romanization, 1972
|
|
8
|
+
url: https://www.eki.ee/wgrs/rom1_hi.pdf
|
|
9
|
+
creation_date: 1972
|
|
10
|
+
confirmation_date: 2016
|
|
11
|
+
description: |
|
|
12
|
+
The United Nations recommended system was approved in 1972 (II/11) and amended in 1977
|
|
13
|
+
(III/12), based on a report prepared by D. N. Sharma. The tables and their corrections were
|
|
14
|
+
published in volume II of the conference reports.
|
|
15
|
+
|
|
16
|
+
There is no evidence of the use of the system either in India or in international cartographic
|
|
17
|
+
products. It was stated in 1987 that the appropriate resolution had not been implemented in
|
|
18
|
+
India and the Hunterian system was still in use in large-scale mapping.
|
|
19
|
+
|
|
20
|
+
Hindi uses the alphasyllabic script Devanāgarī whereby each character represents a syllable
|
|
21
|
+
rather than one sound. Vowels and diphthongs are marked in two ways: as independent
|
|
22
|
+
characters (used syllable-initially) and in an abbreviated form, to denote vowels after
|
|
23
|
+
consonants. The romanization table is unambiguous but the user would have to recognize
|
|
24
|
+
many ligatures not given in the original table (only three are given). The system is mostly
|
|
25
|
+
reversible but there may exist some ambiguities in the romanization of vowels (independent
|
|
26
|
+
vs. abbreviated characters) and consonants.
|
|
27
|
+
|
|
28
|
+
notes:
|
|
29
|
+
- |
|
|
30
|
+
It is recommended that the vowel अ (a) should always be romanized except when it ends a
|
|
31
|
+
name. If a name ends with a consonant, the consonant should carry a sub-macron. Such
|
|
32
|
+
cases, however, will be very rare. For example, कानपुर Kānapur (not Kānapura), जगत्
|
|
33
|
+
Jagat.
|
|
34
|
+
- |
|
|
35
|
+
If each letter of a digraph or any two parts of a trigraph has a distinct independent sound
|
|
36
|
+
then it should be indicated by a hyphen, thus d-h.
|
|
37
|
+
|
|
38
|
+
######################################## Additional Note ############################################################
|
|
39
|
+
# It is recommended that the vowel अ (a) should always be romanized except when it ends a #
|
|
40
|
+
# name. In the scheme we are not yet able to detect a name. Analysing language pattern and the example #
|
|
41
|
+
# we found that actually when a word ends with a consonant it should be transliterated without the vowel in it. #
|
|
42
|
+
# so we are applying this rule as if a word ends with a consonant, in this case we are removing the ending 'a'. #
|
|
43
|
+
#####################################################################################################################
|
|
44
|
+
}
|
|
45
|
+
|
|
46
|
+
tests {
|
|
47
|
+
test "दिल्ली", "dillī"
|
|
48
|
+
test "भारत", "bhārat"
|
|
49
|
+
test "परिपक्क", "paripakk"
|
|
50
|
+
test "जगत्", "jagat"
|
|
51
|
+
test "संख्या", "saṁkhyā"
|
|
52
|
+
test "गंभीर मरीजों के मामले में भारत दूसरे नंबर पर", "gaṁbhīr marījoṁ ke māmale meṁ bhārat dūsare naṁbar par"
|
|
53
|
+
test "कोरोना अपडेट्स", "koronā apaḍeṭs"
|
|
54
|
+
test "सीडीसी चीफ का बयान अहम", "sīḍīsī chīph kā bayān aham"
|
|
55
|
+
test "गूगल प्ले स्टोर पर पेटीएम की वापसी", "gūgal ple sṭor par peṭīem kī vāpasī"
|
|
56
|
+
test "भारत में गैंबलिंग की इजाजत नहीं", "bhārat meṁ gaiṁbaliṁg kī ijājat nahīṁ"
|
|
57
|
+
test "कोरोना वैक्सीन मुद्दे पर घिरे राष्ट्रपति; जो बाइडेन बोले- मुझे और देश को वैज्ञानिकों पर भरोसा है, डोनाल्ड ट्रम्प पर नहीं", "koronā vaiksīn mudde par ghire rāṣhṭrapati; jo bāiḍen bole- mujhe aur desh ko vaijñānikoṁ par bharosā hai, ḍonālḍ ṭramp par nahīṁ"
|
|
58
|
+
test "गूगल की कार्रवाई पर पेटीएम ने कहा था कि ऐप को अस्थायी तौर पर प्ले-स्टोर से हटाया गया है, आपके पैसे सुरक्षित हैं", "gūgal kī kārravāī par peṭīem ne kahā thā ki aip ko asthāyī taur par ple-sṭor se haṭāyā gayā hai, āpake paise surakṣhit haiṁ"
|
|
59
|
+
}
|
|
60
|
+
|
|
61
|
+
|
|
62
|
+
aliases {
|
|
63
|
+
def_alias deva_characters_1, any("\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d")
|
|
64
|
+
}
|
|
65
|
+
|
|
66
|
+
stage {
|
|
67
|
+
|
|
68
|
+
# RULES
|
|
69
|
+
sub "क" + maybe("="), "k", after: deva_characters_1
|
|
70
|
+
sub "क", "k", after: boundary
|
|
71
|
+
|
|
72
|
+
sub "ख" + maybe("="), "kh", after: deva_characters_1
|
|
73
|
+
sub "ख", "kh", after: boundary
|
|
74
|
+
|
|
75
|
+
sub "ग" + maybe("="), "g", after: deva_characters_1
|
|
76
|
+
sub "ग", "g", after: boundary
|
|
77
|
+
|
|
78
|
+
sub "घ" + maybe("="), "gh", after: deva_characters_1
|
|
79
|
+
sub "घ", "gh", after: boundary
|
|
80
|
+
|
|
81
|
+
sub "ङ" + maybe("="), "ṅ", after: deva_characters_1
|
|
82
|
+
sub "ङ", "ṅ", after: boundary
|
|
83
|
+
|
|
84
|
+
sub "च" + maybe("="), "ch", after: deva_characters_1
|
|
85
|
+
sub "च", "ch", after: boundary
|
|
86
|
+
|
|
87
|
+
sub "छ" + maybe("="), "chh", after: deva_characters_1
|
|
88
|
+
sub "छ", "chh", after: boundary
|
|
89
|
+
|
|
90
|
+
sub "ज" + maybe("="), "j", after: deva_characters_1
|
|
91
|
+
sub "ज", "j", after: boundary
|
|
92
|
+
|
|
93
|
+
sub "झ" + maybe("="), "jh", after: deva_characters_1
|
|
94
|
+
sub "झ", "jh", after: boundary
|
|
95
|
+
|
|
96
|
+
sub "ञ" + maybe("="), "ñ", after: deva_characters_1
|
|
97
|
+
sub "ञ", "ñ", after: boundary
|
|
98
|
+
|
|
99
|
+
sub "ट" + maybe("="), "ṭ", after: deva_characters_1
|
|
100
|
+
sub "ट", "ṭ", after: boundary
|
|
101
|
+
|
|
102
|
+
sub "ठ" + maybe("="), "ṭh", after: deva_characters_1
|
|
103
|
+
sub "ठ", "ṭh", after: boundary
|
|
104
|
+
|
|
105
|
+
sub "ड" + maybe("="), "ḍ", after: deva_characters_1
|
|
106
|
+
sub "ड", "ḍ", after: boundary
|
|
107
|
+
|
|
108
|
+
sub "ढ" + maybe("="), "ḍh", after: deva_characters_1
|
|
109
|
+
sub "ढ", "ḍh", after: boundary
|
|
110
|
+
|
|
111
|
+
sub "ण" + maybe("="), "ṇ", after: deva_characters_1
|
|
112
|
+
sub "ण", "ṇ", after: boundary
|
|
113
|
+
|
|
114
|
+
sub "त" + maybe("="), "t", after: deva_characters_1
|
|
115
|
+
sub "त", "t", after: boundary
|
|
116
|
+
|
|
117
|
+
sub "थ" + maybe("="), "th", after: deva_characters_1
|
|
118
|
+
sub "थ", "th", after: boundary
|
|
119
|
+
|
|
120
|
+
sub "द" + maybe("="), "d", after: deva_characters_1
|
|
121
|
+
sub "द", "d", after: boundary
|
|
122
|
+
|
|
123
|
+
sub "ध" + maybe("="), "dh", after: deva_characters_1
|
|
124
|
+
sub "ध", "dh", after: boundary
|
|
125
|
+
|
|
126
|
+
sub "न" + maybe("="), "n", after: deva_characters_1
|
|
127
|
+
sub "न", "n", after: boundary
|
|
128
|
+
|
|
129
|
+
sub "प" + maybe("="), "p", after: deva_characters_1
|
|
130
|
+
sub "प", "p", after: boundary
|
|
131
|
+
|
|
132
|
+
sub "फ" + maybe("="), "ph", after: deva_characters_1
|
|
133
|
+
sub "फ", "ph", after: boundary
|
|
134
|
+
|
|
135
|
+
sub "ब" + maybe("="), "b", after: deva_characters_1
|
|
136
|
+
sub "ब", "b", after: boundary
|
|
137
|
+
|
|
138
|
+
sub "भ" + maybe("="), "bh", after: deva_characters_1
|
|
139
|
+
sub "भ", "bh", after: boundary
|
|
140
|
+
|
|
141
|
+
sub "म" + maybe("="), "m", after: deva_characters_1
|
|
142
|
+
sub "म", "m", after: boundary
|
|
143
|
+
|
|
144
|
+
sub "य" + maybe("="), "y", after: deva_characters_1
|
|
145
|
+
sub "य", "y", after: boundary
|
|
146
|
+
|
|
147
|
+
sub "र" + maybe("="), "r", after: deva_characters_1
|
|
148
|
+
sub "र", "r", after: boundary
|
|
149
|
+
|
|
150
|
+
sub "ल" + maybe("="), "l", after: deva_characters_1
|
|
151
|
+
sub "ल", "l", after: boundary
|
|
152
|
+
|
|
153
|
+
sub "व" + maybe("="), "v", after: deva_characters_1
|
|
154
|
+
sub "व", "v", after: boundary
|
|
155
|
+
|
|
156
|
+
sub "श" + maybe("="), "sh", after: deva_characters_1
|
|
157
|
+
sub "श", "sh", after: boundary
|
|
158
|
+
|
|
159
|
+
sub "ष" + maybe("="), "ṣh", after: deva_characters_1
|
|
160
|
+
sub "ष", "ṣh", after: boundary
|
|
161
|
+
|
|
162
|
+
sub "स" + maybe("="), "s", after: deva_characters_1
|
|
163
|
+
sub "स", "s", after: boundary
|
|
164
|
+
|
|
165
|
+
sub "क़" + maybe("="), "q", after: deva_characters_1
|
|
166
|
+
sub "क़", "q", after: boundary
|
|
167
|
+
|
|
168
|
+
sub "ख़" + maybe("="), "ḳh", after: deva_characters_1
|
|
169
|
+
sub "ख़", "ḳh", after: boundary
|
|
170
|
+
|
|
171
|
+
sub "ग़" + maybe("="), "g", after: deva_characters_1
|
|
172
|
+
sub "ग़", "g", after: boundary
|
|
173
|
+
|
|
174
|
+
sub "ज़" + maybe("="), "z", after: deva_characters_1
|
|
175
|
+
sub "ज़", "z", after: boundary
|
|
176
|
+
|
|
177
|
+
sub "ड़" + maybe("="), "ṙ", after: deva_characters_1
|
|
178
|
+
sub "ड़", "ṙ", after: boundary
|
|
179
|
+
|
|
180
|
+
sub "ढ़" + maybe("="), "ṙh", after: deva_characters_1
|
|
181
|
+
sub "ढ़", "ṙh", after: boundary
|
|
182
|
+
|
|
183
|
+
sub "फ़" + maybe("="), "f", after: deva_characters_1
|
|
184
|
+
sub "फ़", "f", after: boundary
|
|
185
|
+
|
|
186
|
+
sub "ह" + maybe("="), "h", after: deva_characters_1
|
|
187
|
+
sub "ह", "h", after: boundary
|
|
188
|
+
|
|
189
|
+
|
|
190
|
+
# CHARACTERS
|
|
191
|
+
parallel {
|
|
192
|
+
|
|
193
|
+
# I. Independent vowel characters
|
|
194
|
+
sub "अ", "a"
|
|
195
|
+
sub "आ", "ā"
|
|
196
|
+
sub "इ", "i"
|
|
197
|
+
sub "ई", "ī"
|
|
198
|
+
sub "उ", "u"
|
|
199
|
+
sub "ऊ", "ū"
|
|
200
|
+
sub "ऋ", "ṛ"
|
|
201
|
+
sub "ॠ", "ṝ"
|
|
202
|
+
sub "ऌ", "l̤"
|
|
203
|
+
sub "ए", "e"
|
|
204
|
+
sub "ऐ", "ai"
|
|
205
|
+
sub "ओ", "o"
|
|
206
|
+
sub "औ", "au"
|
|
207
|
+
|
|
208
|
+
# II. Abbreviated vowel characters
|
|
209
|
+
|
|
210
|
+
sub "ा", "ā" # का
|
|
211
|
+
sub "ॉ", "ā̆" # additional mark: कॉ (no trailing space, so the word is not split)
|
|
212
|
+
sub "ि", "i" # कि i
|
|
213
|
+
sub "ी", "ī" # की
|
|
214
|
+
sub "ु", "u" # कु
|
|
215
|
+
sub "ू", "ū" # कू
|
|
216
|
+
sub "ृ", "ṛ" # कृ
|
|
217
|
+
sub "े", "e" # के
|
|
218
|
+
sub "ै", "ai" # कै
|
|
219
|
+
sub "ो", "o" # को
|
|
220
|
+
sub "ौ", "au" # कौ
|
|
221
|
+
|
|
222
|
+
|
|
223
|
+
# Consonants (see Note 1)
|
|
224
|
+
|
|
225
|
+
# Gutturals
|
|
226
|
+
sub "क", "ka"
|
|
227
|
+
sub "ख", "kha"
|
|
228
|
+
sub "ग", "ga"
|
|
229
|
+
sub "घ", "gha"
|
|
230
|
+
sub "ङ", "ṅa"
|
|
231
|
+
|
|
232
|
+
# Palatals
|
|
233
|
+
sub "च", "cha"
|
|
234
|
+
sub "छ", "chha"
|
|
235
|
+
sub "ज", "ja"
|
|
236
|
+
sub "झ", "jha"
|
|
237
|
+
sub "ञ", "ña"
|
|
238
|
+
|
|
239
|
+
# Cerebrals
|
|
240
|
+
sub "ट", "ṭa"
|
|
241
|
+
sub "ठ", "ṭha"
|
|
242
|
+
sub "ड", "ḍa"
|
|
243
|
+
sub "ढ", "ḍha"
|
|
244
|
+
sub "ण", "ṇa"
|
|
245
|
+
|
|
246
|
+
# Dentals
|
|
247
|
+
sub "त", "ta"
|
|
248
|
+
sub "थ", "tha"
|
|
249
|
+
sub "द", "da"
|
|
250
|
+
sub "ध", "dha"
|
|
251
|
+
sub "न", "na"
|
|
252
|
+
|
|
253
|
+
# Labials
|
|
254
|
+
sub "प", "pa"
|
|
255
|
+
sub "फ", "pha"
|
|
256
|
+
sub "ब", "ba"
|
|
257
|
+
sub "भ", "bha"
|
|
258
|
+
sub "म", "ma"
|
|
259
|
+
|
|
260
|
+
# Semivowels
|
|
261
|
+
sub "य", "ya"
|
|
262
|
+
sub "र", "ra"
|
|
263
|
+
sub "ल", "la"
|
|
264
|
+
sub "व", "va"
|
|
265
|
+
|
|
266
|
+
# Sibilants
|
|
267
|
+
sub "श", "sha"
|
|
268
|
+
sub "ष", "ṣha"
|
|
269
|
+
sub "स", "sa"
|
|
270
|
+
|
|
271
|
+
# Dotted variants
|
|
272
|
+
sub "क़", "qa"
|
|
273
|
+
sub "ख़", "ḳha"
|
|
274
|
+
sub "ग़", "ġa"
|
|
275
|
+
sub "ज़", "za"
|
|
276
|
+
sub "ड़", "ṙa"
|
|
277
|
+
sub "ढ़", "ṙha"
|
|
278
|
+
sub "फ़", "fa"
|
|
279
|
+
|
|
280
|
+
|
|
281
|
+
# Aspirate
|
|
282
|
+
sub "ह", "ha"
|
|
283
|
+
|
|
284
|
+
# Anusvāra
|
|
285
|
+
sub "ं", "ṁ"
|
|
286
|
+
|
|
287
|
+
# Anunāsika
|
|
288
|
+
sub "ँ", "m̐"
|
|
289
|
+
|
|
290
|
+
# halanta
|
|
291
|
+
sub "्", ""
|
|
292
|
+
|
|
293
|
+
# bisharga
|
|
294
|
+
sub "ः", "ḥ"
|
|
295
|
+
|
|
296
|
+
# V. Ligatures (covers the consonant + halanta sequences that form ligatures in Unicode)
|
|
297
|
+
# Implementing pronunciation without a vowel: क् k.
|
|
298
|
+
|
|
299
|
+
# Gutturals
|
|
300
|
+
sub "क्", "k"
|
|
301
|
+
sub "ख्", "kh"
|
|
302
|
+
sub "ग्", "g"
|
|
303
|
+
sub "घ्", "gh"
|
|
304
|
+
sub "ङ्", "ṅ"
|
|
305
|
+
|
|
306
|
+
# Palatals
|
|
307
|
+
sub "च्", "ch"
|
|
308
|
+
sub "छ्", "chh"
|
|
309
|
+
sub "ज्", "j"
|
|
310
|
+
sub "झ्", "jh"
|
|
311
|
+
sub "ञ्", "ñ"
|
|
312
|
+
|
|
313
|
+
# Cerebrals
|
|
314
|
+
sub "ट्", "ṭ"
|
|
315
|
+
sub "ठ्", "ṭh"
|
|
316
|
+
sub "ड्", "ḍ"
|
|
317
|
+
sub "ढ्", "ḍh"
|
|
318
|
+
sub "ण्", "ṇ"
|
|
319
|
+
|
|
320
|
+
# Dentals
|
|
321
|
+
sub "त्", "t"
|
|
322
|
+
sub "थ्", "th"
|
|
323
|
+
sub "द्", "d"
|
|
324
|
+
sub "ध्", "dh"
|
|
325
|
+
sub "न्", "n"
|
|
326
|
+
|
|
327
|
+
# Labials
|
|
328
|
+
sub "प्", "p"
|
|
329
|
+
sub "फ्", "ph"
|
|
330
|
+
sub "ब्", "b"
|
|
331
|
+
sub "भ्", "bh"
|
|
332
|
+
sub "म्", "m"
|
|
333
|
+
|
|
334
|
+
# Semivowels
|
|
335
|
+
sub "य्", "y"
|
|
336
|
+
sub "र्", "r"
|
|
337
|
+
sub "ल्", "l"
|
|
338
|
+
sub "व्", "v"
|
|
339
|
+
|
|
340
|
+
# Sibilants
|
|
341
|
+
sub "श्", "sh"
|
|
342
|
+
sub "ष्", "ṣh"
|
|
343
|
+
sub "स्", "s"
|
|
344
|
+
|
|
345
|
+
# Dotted variants
|
|
346
|
+
sub "क़्", "q"
|
|
347
|
+
sub "ख़्", "ḳh"
|
|
348
|
+
sub "ग़्", "ġ"
|
|
349
|
+
sub "ज़्", "z"
|
|
350
|
+
sub "ड़्", "ṙ"
|
|
351
|
+
sub "ढ़्", "ṙh"
|
|
352
|
+
sub "फ़्", "f"
|
|
353
|
+
}
|
|
354
|
+
compose
|
|
355
|
+
}
|
|
356
|
+
|
|
@@ -0,0 +1,214 @@
|
|
|
1
|
+
metadata {
|
|
2
|
+
authority_id: ungegn
|
|
3
|
+
id: 2016
|
|
4
|
+
language: iso-639-2:kan
|
|
5
|
+
source_script: Kana
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Kannada Romanization, 1972
|
|
8
|
+
url: https://www.eki.ee/wgrs/rom1_kn.pdf
|
|
9
|
+
creation_date: 1972
|
|
10
|
+
confirmation_date: 2016
|
|
11
|
+
description: |
|
|
12
|
+
The United Nations recommended system was approved in 1972 (II/11) and amended in 1977
|
|
13
|
+
(III/12), based on a report prepared by D. N. Sharma. The tables and their corrections were
|
|
14
|
+
published in volume II of the conference reports.
|
|
15
|
+
|
|
16
|
+
There is no evidence of the use of the system either in India or in international cartographic
|
|
17
|
+
products.
|
|
18
|
+
|
|
19
|
+
Kannada uses an alphasyllabic script whereby each character represents a syllable rather than
|
|
20
|
+
one sound. Vowels and diphthongs are marked in two ways: as independent characters (used
|
|
21
|
+
syllable-initially) and in an abbreviated form, to denote vowels after consonants. The
|
|
22
|
+
romanization table is unambiguous. The system is mostly reversible but there may exist some
|
|
23
|
+
ambiguities in the romanization of vowels (independent vs. abbreviated characters) and
|
|
24
|
+
consonants (combinations with subscript consonants vs. character sequences).
|
|
25
|
+
|
|
26
|
+
notes:
|
|
27
|
+
- |
|
|
28
|
+
While most consonants have a diacritic in the upper right corner of the character (like ಕ),
|
|
29
|
+
some do not, e.g. ಖ kha, ಜ ja, ನ na, ಬ ba, ಲ la.
|
|
30
|
+
- |
|
|
31
|
+
Combinations with r as the first component are written by adding a special symbol after the
|
|
32
|
+
second consonant: ರ್ಗ rga.
|
|
33
|
+
}
|
|
34
|
+
|
|
35
|
+
tests {
|
|
36
|
+
test "ಕರ್ಣಾಟಕ", "karṇāṭaka"
|
|
37
|
+
test "ಬೆಂಗಳೂರು", "bĕṁgaḷūru"
|
|
38
|
+
test "ಮಹಾರಾಷ್ಟ್ರದ ಯಾವುದೇ ಪ್ರಕರಣದ ತನಿಖೆಗೆ ಇನ್ನು ಸಿಬಿಐ ಪಡೆಯಬೇಕು ಅನುಮತಿ", "mahārāṣhṭrada yāvude prakaraṇada tanikhĕgĕ innu sibiai paḍĕyabeku anumati"
|
|
39
|
+
test "ಹರಕು ಬಾಯಿ: ಈಶ್ವರಪ್ಪಗೆ ಶಾಸಕ ಯತ್ನಾಳ ತಿರುಗೇಟು", "haraku bāyi: īshvarappagĕ shāsaka yatnāḷa tirugeṭu"
|
|
40
|
+
test "ಹಾಥರಸ್ ಪ್ರಕರಣ: ೨೯ರಂದು ರಾಷ್ಟ್ರವ್ಯಾಪಿ ಪ್ರತಿಭಟನೆಗೆ ಮಹಿಳಾ ಸಂಘಟನೆಗಳ ಕರೆ", "hātharas prakaraṇa: 29raṁdu rāṣhṭravyāpi pratibhaṭanĕgĕ mahiḷā saṁghaṭanĕgaḷa karĕ"
|
|
41
|
+
test "ಪೊಲೀಸ್ ಮಕ್ಕಳ ಶಾಲೆ ಮುಚ್ಚುವ ಯತ್ನಕ್ಕೆ ಹೊರಟ್ಟಿ ತೀವ್ರ ವಿರೋಧ", "pŏlīs makkaḷa shālĕ muchchuva yatnakkĕ hŏraṭṭi tīvra virodha"
|
|
42
|
+
test "ಅಮೆರಿಕ ಅಧ್ಯಕ್ಷೀಯ ಚುನಾವಣೆ: ಟ್ರಂಪ್–ಬೈಡನ್ ಅಂತಿಮ ಮುಖಾಮುಖಿಗೆ ವೇದಿಕೆ ಸಿದ್ಧ", "amĕrika adhyakṣhīya chunāvaṇĕ: ṭraṁp–baiḍan aṁtima mukhāmukhigĕ vedikĕ siddha"
|
|
43
|
+
test "ಅಂಜನಾದ್ರಿ ಆಂಜನೇಯನ ದರ್ಶನ ಪಡೆದ ಪವರ್ ಸ್ಟಾರ್ ಪುನೀತ್ ರಾಜ್ ಕುಮಾರ್", "aṁjanādri āṁjaneyana darshana paḍĕda pavar sṭār punīt rāj kumār"
|
|
44
|
+
test "ಇನ್ನು ಹಿಂದೂ ದೇವಸ್ಥಾನದ ಧಾರ್ಮಿಕ ಕಾರ್ಯದಲ್ಲಿ ಭಾಗಿಯಾಗಿದ್ದಕ್ಕೆ ಮೋಯಿದ್ದೀನ್ ಬಾವಾಗೆ ಬೆದರಿಕೆ ಒಡ್ಡಲಾಗಿದೆ", "innu hiṁdū devasthānada dhārmika kāryadalli bhāgiyāgiddakkĕ moyiddīn bāvāgĕ bĕdarikĕ ŏḍḍalāgidĕ"
|
|
45
|
+
test "ಇದು ಮೋದಿ ದೇಶ - ದನ ತಿಂದು ಹೋದ್ರೆ ಹುಷಾರ್ : ದೇಗುಲಕ್ಕೆ ಹೋಗಿದ್ದ ಬಾವಾಗೆ ಬೆದರಿಕೆ", "idu modi desha - dana tiṁdu hodrĕ huṣhār : degulakkĕ hogidda bāvāgĕ bĕdarikĕ"
|
|
46
|
+
}
|
|
47
|
+
|
|
48
|
+
aliases {
|
|
49
|
+
def_alias characters_set1, any("\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd")
|
|
50
|
+
}
|
|
51
|
+
|
|
52
|
+
stage {
|
|
53
|
+
|
|
54
|
+
# RULES
|
|
55
|
+
# to cover diacritic and vowel less consonants
|
|
56
|
+
sub "ಕ", "k", after: characters_set1
|
|
57
|
+
sub "ಖ", "kh", after: characters_set1
|
|
58
|
+
sub "ಗ", "g", after: characters_set1
|
|
59
|
+
sub "ಘ", "gh", after: characters_set1
|
|
60
|
+
sub "ಙ", "ṅ", after: characters_set1
|
|
61
|
+
sub "ಚ", "ch", after: characters_set1
|
|
62
|
+
sub "ಛ", "chh", after: characters_set1
|
|
63
|
+
sub "ಜ", "j", after: characters_set1
|
|
64
|
+
sub "ಝ", "jh", after: characters_set1
|
|
65
|
+
sub "ಞ", "ñ", after: characters_set1
|
|
66
|
+
sub "ಟ", "ṭ", after: characters_set1
|
|
67
|
+
sub "ಠ", "ṭh", after: characters_set1
|
|
68
|
+
sub "ಡ", "ḍ", after: characters_set1
|
|
69
|
+
sub "ಢ", "ḍh", after: characters_set1
|
|
70
|
+
sub "ಣ", "ṇ", after: characters_set1
|
|
71
|
+
sub "ತ", "t", after: characters_set1
|
|
72
|
+
sub "ಥ", "th", after: characters_set1
|
|
73
|
+
sub "ದ", "d", after: characters_set1
|
|
74
|
+
sub "ಧ", "dh", after: characters_set1
|
|
75
|
+
sub "ನ", "n", after: characters_set1
|
|
76
|
+
sub "ಪ", "p", after: characters_set1
|
|
77
|
+
sub "ಫ", "ph", after: characters_set1
|
|
78
|
+
sub "ಬ", "b", after: characters_set1
|
|
79
|
+
sub "ಭ", "bh", after: characters_set1
|
|
80
|
+
sub "ಮ", "m", after: characters_set1
|
|
81
|
+
sub "ಯ", "y", after: characters_set1
|
|
82
|
+
sub "ರ", "r", after: characters_set1
|
|
83
|
+
sub "ಲ", "l", after: characters_set1
|
|
84
|
+
sub "ಳ", "ḷ", after: characters_set1
|
|
85
|
+
sub "ವ", "v", after: characters_set1
|
|
86
|
+
sub "ಶ", "sh", after: characters_set1
|
|
87
|
+
sub "ಷ", "ṣh", after: characters_set1
|
|
88
|
+
sub "ಸ", "s", after: characters_set1
|
|
89
|
+
sub "ಹ", "h", after: characters_set1
|
|
90
|
+
|
|
91
|
+
|
|
92
|
+
# CHARACTERS
|
|
93
|
+
parallel {
|
|
94
|
+
sub "ಅ", "a"
|
|
95
|
+
sub "ಆ", "ā"
|
|
96
|
+
sub "ಇ", "i"
|
|
97
|
+
sub "ಈ", "ī"
|
|
98
|
+
sub "ಉ", "u"
|
|
99
|
+
sub "ಊ", "ū"
|
|
100
|
+
sub "ಋ", "ṛ"
|
|
101
|
+
|
|
102
|
+
sub "ಎ", "ĕ"
|
|
103
|
+
sub "ಏ", "e"
|
|
104
|
+
sub "ಐ", "ai"
|
|
105
|
+
|
|
106
|
+
sub "ಒ", "ŏ"
|
|
107
|
+
sub "ಓ", "o"
|
|
108
|
+
sub "ಔ", "au"
|
|
109
|
+
|
|
110
|
+
# Gutturals
|
|
111
|
+
sub "ಕ", "ka"
|
|
112
|
+
sub "ಖ", "kha"
|
|
113
|
+
sub "ಗ", "ga"
|
|
114
|
+
sub "ಘ", "gha"
|
|
115
|
+
sub "ಙ", "ṅa"
|
|
116
|
+
|
|
117
|
+
# Palatals
|
|
118
|
+
sub "ಚ", "cha"
|
|
119
|
+
sub "ಛ", "chha"
|
|
120
|
+
sub "ಜ", "ja"
|
|
121
|
+
sub "ಝ", "jha"
|
|
122
|
+
sub "ಞ", "ña"
|
|
123
|
+
|
|
124
|
+
# Cerebrals
|
|
125
|
+
sub "ಟ", "ṭa"
|
|
126
|
+
sub "ಠ", "ṭha"
|
|
127
|
+
sub "ಡ", "ḍa"
|
|
128
|
+
sub "ಢ", "ḍha"
|
|
129
|
+
sub "ಣ", "ṇa"
|
|
130
|
+
|
|
131
|
+
# Dentals
|
|
132
|
+
sub "ತ", "ta"
|
|
133
|
+
sub "ಥ", "tha"
|
|
134
|
+
sub "ದ", "da"
|
|
135
|
+
sub "ಧ", "dha"
|
|
136
|
+
sub "ನ", "na"
|
|
137
|
+
|
|
138
|
+
# Labials
|
|
139
|
+
sub "ಪ", "pa"
|
|
140
|
+
sub "ಫ", "pha"
|
|
141
|
+
sub "ಬ", "ba"
|
|
142
|
+
sub "ಭ", "bha"
|
|
143
|
+
sub "ಮ", "ma"
|
|
144
|
+
|
|
145
|
+
# Semivowels
|
|
146
|
+
sub "ಯ", "ya"
|
|
147
|
+
sub "ರ", "ra"
|
|
148
|
+
sub "ಲ", "la"
|
|
149
|
+
sub "ಳ", "ḷa"
|
|
150
|
+
|
|
151
|
+
|
|
152
|
+
sub "ವ", "va"
|
|
153
|
+
|
|
154
|
+
# Sibilants
|
|
155
|
+
sub "ಶ", "sha"
|
|
156
|
+
sub "ಷ", "ṣha"
|
|
157
|
+
sub "ಸ", "sa"
|
|
158
|
+
|
|
159
|
+
|
|
160
|
+
# Aspirate
|
|
161
|
+
sub "ಹ", "ha"
|
|
162
|
+
|
|
163
|
+
|
|
164
|
+
# Bisarga
|
|
165
|
+
sub "ಃ", "ḥ"
|
|
166
|
+
|
|
167
|
+
# Anusvāra
|
|
168
|
+
sub "ಂ", "ṁ"
|
|
169
|
+
|
|
170
|
+
sub "\u0cbc", "" #nukta
|
|
171
|
+
|
|
172
|
+
# Medials (dependent vowel signs), needed for connecting consonants
|
|
173
|
+
sub "ಾ", "ā"
|
|
174
|
+
sub "ಿ", "i"
|
|
175
|
+
sub "ೀ", "ī"
|
|
176
|
+
sub "ು", "u"
|
|
177
|
+
sub "ೂ", "ū"
|
|
178
|
+
sub "ೃ", "ṛ"
|
|
179
|
+
|
|
180
|
+
|
|
181
|
+
sub "ೆ", "ĕ"
|
|
182
|
+
sub "ೇ", "e"
|
|
183
|
+
sub "ೈ", "ai"
|
|
184
|
+
|
|
185
|
+
|
|
186
|
+
sub "ೊ", "ŏ"
|
|
187
|
+
sub "ೋ", "o"
|
|
188
|
+
sub "ೌ", "au"
|
|
189
|
+
|
|
190
|
+
|
|
191
|
+
sub "्", ""
|
|
192
|
+
sub "़", ""
|
|
193
|
+
sub "್", "" # used for pronounciation without vowel
|
|
194
|
+
sub "", "" # no need for zero with joiner
|
|
195
|
+
sub "", "" # no need for zero with non joiner
|
|
196
|
+
|
|
197
|
+
|
|
198
|
+
|
|
199
|
+
# Digits
|
|
200
|
+
|
|
201
|
+
sub "೦", "0"
|
|
202
|
+
sub "೧", "1"
|
|
203
|
+
sub "೨", "2"
|
|
204
|
+
sub "೩", "3"
|
|
205
|
+
sub "೪", "4"
|
|
206
|
+
sub "೫", "5"
|
|
207
|
+
sub "೬", "6"
|
|
208
|
+
sub "೭", "7"
|
|
209
|
+
sub "೮", "8"
|
|
210
|
+
sub "೯", "9"
|
|
211
|
+
}
|
|
212
|
+
|
|
213
|
+
compose
|
|
214
|
+
}
|