interscript-maps 2.0.5
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +7 -0
- data/README.adoc +28 -0
- data/interscript-maps.gemspec +28 -0
- data/interscript-maps.yaml +235 -0
- data/libs/posix.iml +11 -0
- data/libs/unicode.iml +13 -0
- data/libs/var-Cyrl.iml +7 -0
- data/libs/var-kor.iml +17 -0
- data/maps-staging/royin-tha-Thai-Latn-1939-generic.imp +98 -0
- data/maps-staging/royin-tha-Thai-Latn-1968.imp +156 -0
- data/maps-staging/royin-tha-Thai-Latn-1999-chained.imp +161 -0
- data/maps-staging/royin-tha-Thai-Latn-1999.imp +78 -0
- data/maps-staging/var-tha-Thai-Thai-phonemic.imp +53 -0
- data/maps-staging/var-tha-Thai-Zsym-ipa.imp +273 -0
- data/maps/acadsin-zho-Hani-Latn-2002.imp +27515 -0
- data/maps/alalc-amh-Ethi-Latn-1997.imp +392 -0
- data/maps/alalc-amh-Ethi-Latn-2011.imp +85 -0
- data/maps/alalc-ara-Arab-Latn-1997.imp +1171 -0
- data/maps/alalc-asm-Deva-Latn-1997.imp +214 -0
- data/maps/alalc-asm-Deva-Latn-2012.imp +53 -0
- data/maps/alalc-aze-Arab-Latn-1997.imp +321 -0
- data/maps/alalc-aze-Cyrl-Latn-1997.imp +101 -0
- data/maps/alalc-bel-Cyrl-Latn-1997.imp +118 -0
- data/maps/alalc-ben-Beng-Latn-1997.imp +225 -0
- data/maps/alalc-ben-Beng-Latn-2017.imp +135 -0
- data/maps/alalc-bul-Cyrl-Latn-1997.imp +110 -0
- data/maps/alalc-div-Thaa-Latn-1997.imp +171 -0
- data/maps/alalc-ell-Grek-Latn-1997.imp +381 -0
- data/maps/alalc-ell-Grek-Latn-2010.imp +382 -0
- data/maps/alalc-guj-Gujr-Latn-1997.imp +223 -0
- data/maps/alalc-guj-Gujr-Latn-2011.imp +57 -0
- data/maps/alalc-hin-Deva-Latn-1997.imp +248 -0
- data/maps/alalc-hin-Deva-Latn-2011.imp +63 -0
- data/maps/alalc-kan-Kana-Latn-1997.imp +233 -0
- data/maps/alalc-kan-Kana-Latn-2011.imp +58 -0
- data/maps/alalc-kat-Geok-Latn-1997.imp +109 -0
- data/maps/alalc-kat-Geor-Latn-1997.imp +104 -0
- data/maps/alalc-kor-Hang-Latn-1997.imp +68 -0
- data/maps/alalc-mal-Mlym-Latn-1997.imp +260 -0
- data/maps/alalc-mal-Mlym-Latn-2012.imp +65 -0
- data/maps/alalc-mar-Deva-Latn-1997.imp +178 -0
- data/maps/alalc-mar-Deva-Latn-2011.imp +51 -0
- data/maps/alalc-mkd-Cyrl-Latn-1997.imp +125 -0
- data/maps/alalc-mkd-Cyrl-Latn-2013.imp +113 -0
- data/maps/alalc-mon-Cyrl-Latn-1997.imp +161 -0
- data/maps/alalc-ori-Orya-Latn-1997.imp +234 -0
- data/maps/alalc-ori-Orya-Latn-2011.imp +59 -0
- data/maps/alalc-pan-Guru-Latn-1997.imp +241 -0
- data/maps/alalc-pan-Guru-Latn-2011.imp +71 -0
- data/maps/alalc-per-Arab-Latn-1997.imp +318 -0
- data/maps/alalc-pli-Deva-Latn-2012.imp +140 -0
- data/maps/alalc-pra-Deva-Latn-2012.imp +52 -0
- data/maps/alalc-rus-Cyrl-Latn-1997.imp +165 -0
- data/maps/alalc-rus-Cyrl-Latn-2012.imp +107 -0
- data/maps/alalc-san-Deva-Latn-2012.imp +207 -0
- data/maps/alalc-sin-Sinh-Latn-1997.imp +246 -0
- data/maps/alalc-sin-Sinh-Latn-2011.imp +63 -0
- data/maps/alalc-srp-Cyrl-Latn-1997.imp +124 -0
- data/maps/alalc-srp-Cyrl-Latn-2013.imp +115 -0
- data/maps/alalc-tam-Taml-Latn-1997.imp +52 -0
- data/maps/alalc-tam-Taml-Latn-2011.imp +49 -0
- data/maps/alalc-tel-Telu-Latn-1997.imp +237 -0
- data/maps/alalc-tel-Telu-Latn-2011.imp +58 -0
- data/maps/alalc-ukr-Cyrl-Latn-1997.imp +123 -0
- data/maps/alalc-ukr-Cyrl-Latn-2011.imp +32 -0
- data/maps/apcbg-bul-Cyrl-Latn-1995.imp +194 -0
- data/maps/az-aze-Cyrl-Latn-1939.imp +105 -0
- data/maps/az-aze-Cyrl-Latn-1958.imp +50 -0
- data/maps/bas-rus-Cyrl-Latn-2017-bss.imp +160 -0
- data/maps/bas-rus-Cyrl-Latn-2017-oss.imp +165 -0
- data/maps/bgn-jpn-Hrkt-Latn-1962.imp +288 -0
- data/maps/bgn-kor-Hang-Latn-1943.imp +31 -0
- data/maps/bgn-kor-Kore-Latn-1943.imp +33 -0
- data/maps/bgna-bul-Cyrl-Latn-2006.imp +119 -0
- data/maps/bgna-bul-Cyrl-Latn-2009.imp +119 -0
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +393 -0
- data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +472 -0
- data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +125 -0
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +111 -0
- data/maps/bgnpcgn-bak-Cyrl-Latn-2007.imp +169 -0
- data/maps/bgnpcgn-bal-Arab-Latn-2008.imp +296 -0
- data/maps/bgnpcgn-bel-Cyrl-Latn-1979.imp +200 -0
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +137 -0
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +38 -0
- data/maps/bgnpcgn-che-Cyrl-Latn-2008.imp +176 -0
- data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +56 -0
- data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +90 -0
- data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +71 -0
- data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +443 -0
- data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +269 -0
- data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +41 -0
- data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +28 -0
- data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +111 -0
- data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +42 -0
- data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +32 -0
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +191 -0
- data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +116 -0
- data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +43 -0
- data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +193 -0
- data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +170 -0
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +177 -0
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +40 -0
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +41 -0
- data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +240 -0
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +132 -0
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +174 -0
- data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +168 -0
- data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +208 -0
- data/maps/bgnpcgn-per-Arab-Latn-1958.imp +312 -0
- data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +552 -0
- data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +445 -0
- data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +289 -0
- data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +165 -0
- data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +133 -0
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +195 -0
- data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +48 -0
- data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +55 -0
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +146 -0
- data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +185 -0
- data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +188 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +136 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +88 -0
- data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +333 -0
- data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +145 -0
- data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +74 -0
- data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +7463 -0
- data/maps/bis-asm-Beng-Latn-13194-1991.imp +154 -0
- data/maps/bis-ben-Beng-Latn-13194-1991.imp +151 -0
- data/maps/bis-dev-Deva-Latn-13194-1991.imp +178 -0
- data/maps/bis-guj-Gujr-Latn-13194-1991.imp +172 -0
- data/maps/bis-kan-Kana-Latn-13194-1991.imp +166 -0
- data/maps/bis-mlm-Mlym-Latn-13194-1991.imp +170 -0
- data/maps/bis-ori-Orya-Latn-13194-1991.imp +168 -0
- data/maps/bis-pnj-Guru-Latn-13194-1991.imp +169 -0
- data/maps/bis-tel-Telu-Latn-13194-1991.imp +165 -0
- data/maps/bis-tml-Taml-Latn-13194-1991.imp +149 -0
- data/maps/by-bel-Cyrl-Latn-1998.imp +123 -0
- data/maps/by-bel-Cyrl-Latn-2007.imp +77 -0
- data/maps/din-grc-Grek-Latn-31634-2011-t1.imp +627 -0
- data/maps/din-hin-Deva-Latn-33904-2018.imp +101 -0
- data/maps/din-kat-Geor-Latn-32707-2010.imp +103 -0
- data/maps/din-mar-Deva-Latn-33904-2018.imp +83 -0
- data/maps/din-nep-Deva-Latn-33904-2018.imp +110 -0
- data/maps/din-pli-Deva-Latn-33904-2018.imp +72 -0
- data/maps/din-pra-Deva-Latn-33904-2018.imp +66 -0
- data/maps/din-san-Deva-Latn-33904-2018.imp +294 -0
- data/maps/din-tam-Taml-Latn-33903-2016.imp +187 -0
- data/maps/dos-nep-Deva-Latn-1997.imp +47 -0
- data/maps/elot-ell-Grek-Latn-743-1982-tl.imp +399 -0
- data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +397 -0
- data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +34 -0
- data/maps/elot-ell-Grek-Latn-743-2001-ts.imp +178 -0
- data/maps/ggg-kat-Geor-Latn-2002.imp +75 -0
- data/maps/gki-bel-Cyrl-Latn-1992.imp +44 -0
- data/maps/gki-bel-Cyrl-Latn-2000.imp +159 -0
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +179 -0
- data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.imp +132 -0
- data/maps/hk-yue-Hani-Latn-1888.imp +29201 -0
- data/maps/icao-bel-Cyrl-Latn-9303.imp +136 -0
- data/maps/icao-bul-Cyrl-Latn-9303.imp +127 -0
- data/maps/icao-fas-Arab-Latn-9303.imp +112 -0
- data/maps/icao-heb-Hebr-Latn-9303.imp +160 -0
- data/maps/icao-mkd-Cyrl-Latn-9303.imp +126 -0
- data/maps/icao-rus-Cyrl-Latn-9303.imp +126 -0
- data/maps/icao-srp-Cyrl-Latn-9303.imp +126 -0
- data/maps/icao-ukr-Cyrl-Latn-9303.imp +127 -0
- data/maps/iso-ara-Arab-Latn-233-1984.imp +301 -0
- data/maps/iso-asm-Beng-Latn-15919-2001.imp +73 -0
- data/maps/iso-ben-Beng-Latn-15919-2001.imp +171 -0
- data/maps/iso-ell-Grek-Latn-843-1997-t1.imp +365 -0
- data/maps/iso-ell-Grek-Latn-843-1997-t2.imp +43 -0
- data/maps/iso-guj-Gujr-Latn-15919-2001.imp +214 -0
- data/maps/iso-hin-Deva-Latn-15919-2001.imp +73 -0
- data/maps/iso-inc-Deva-Latn-15919-2001.imp +61 -0
- data/maps/iso-jpn-Hrkt-Latn-3602-1989.imp +59 -0
- data/maps/iso-kan-Kana-Latn-15919-2001.imp +212 -0
- data/maps/iso-kat-Geor-Latn-9984-1996.imp +103 -0
- data/maps/iso-kor-Hang-Latn-1996-method1.imp +140 -0
- data/maps/iso-kor-Hang-Latn-1996-method2.imp +132 -0
- data/maps/iso-mal-Mlym-Latn-15919-2001.imp +276 -0
- data/maps/iso-mar-Deva-Latn-15919-2001.imp +68 -0
- data/maps/iso-nep-Deva-Latn-15919-2001.imp +75 -0
- data/maps/iso-ori-Orya-Latn-15919-2001.imp +188 -0
- data/maps/iso-pan-Guru-Latn-15919-2001.imp +217 -0
- data/maps/iso-pli-Beng-Latn-15919-2001.imp +66 -0
- data/maps/iso-pli-Deva-Latn-15919-2001.imp +68 -0
- data/maps/iso-pli-Sinh-Latn-15919-2001.imp +211 -0
- data/maps/iso-pli-Thai-Latn-15919-2001.imp +47 -0
- data/maps/iso-pra-Deva-Latn-15919-2001.imp +60 -0
- data/maps/iso-prs-Arab-Latn-233-3-1999.imp +352 -0
- data/maps/iso-rus-Cyrl-Latn-9-1995.imp +279 -0
- data/maps/iso-san-Deva-Latn-15919-2001.imp +215 -0
- data/maps/iso-tam-Taml-Latn-15919-2001.imp +153 -0
- data/maps/iso-tel-Telu-Latn-15919-2001.imp +214 -0
- data/maps/iso-tha-Thai-Latn-11940-1998.imp +114 -0
- data/maps/kp-kor-Hang-Latn-2002.imp +540 -0
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +29005 -0
- data/maps/masm-mon-Cyrl-Latn-5217-2012.imp +136 -0
- data/maps/masm-mon-Latn-Cyrl-5217-2012.imp +162 -0
- data/maps/mext-jpn-Hrkt-Latn-1954.imp +403 -0
- data/maps/moct-kor-Hang-Latn-2000.imp +475 -0
- data/maps/mofa-jpn-Hrkt-Latn-1989.imp +484 -0
- data/maps/mv-div-Thaa-Latn-1987.imp +144 -0
- data/maps/mvd-bel-Cyrl-Latn-2008.imp +224 -0
- data/maps/mvd-bel-Cyrl-Latn-2010.imp +64 -0
- data/maps/mvd-rus-Cyrl-Latn-2008.imp +110 -0
- data/maps/mvd-rus-Cyrl-Latn-2010.imp +40 -0
- data/maps/odni-ara-Arab-Latn-2004.imp +106 -0
- data/maps/odni-ara-Arab-Latn-2015.imp +281 -0
- data/maps/odni-aze-Cyrl-Latn-2015.imp +158 -0
- data/maps/odni-bel-Cyrl-Latn-2015.imp +138 -0
- data/maps/odni-bul-Cyrl-Latn-2005.imp +90 -0
- data/maps/odni-bul-Cyrl-Latn-2015.imp +103 -0
- data/maps/odni-che-Cyrl-Latn-2015.imp +165 -0
- data/maps/odni-fas-Arab-Latn-2004.imp +268 -0
- data/maps/odni-fas-Arab-Latn-2015.imp +398 -0
- data/maps/odni-hin-Deva-Latn-2004.imp +180 -0
- data/maps/odni-hin-Deva-Latn-2015.imp +256 -0
- data/maps/odni-kat-Geor-Latn-2015.imp +76 -0
- data/maps/odni-kaz-Cyrl-Latn-2015.imp +164 -0
- data/maps/odni-kir-Cyrl-Latn-2015.imp +149 -0
- data/maps/odni-kor-Hang-Latn-2015.imp +307 -0
- data/maps/odni-mkd-Cyrl-Latn-2005.imp +28 -0
- data/maps/odni-mkd-Cyrl-Latn-2015.imp +124 -0
- data/maps/odni-prs-Arab-Latn-2004.imp +120 -0
- data/maps/odni-prs-Arab-Latn-2015.imp +225 -0
- data/maps/odni-pus-Arab-Latn-2011.imp +327 -0
- data/maps/odni-rus-Cyrl-Latn-2015.imp +79 -0
- data/maps/odni-srp-Cyrl-Latn-2005.imp +35 -0
- data/maps/odni-srp-Cyrl-Latn-2015.imp +130 -0
- data/maps/odni-tat-Cyrl-Latn-2015.imp +157 -0
- data/maps/odni-tgk-Cyrl-Latn-2015.imp +161 -0
- data/maps/odni-tuk-Cyrl-Latn-2015.imp +159 -0
- data/maps/odni-uig-Cyrl-Latn-2015.imp +151 -0
- data/maps/odni-ukr-Cyrl-Latn-2015.imp +136 -0
- data/maps/odni-urd-Arab-Latn-2015.imp +220 -0
- data/maps/odni-uzb-Cyrl-Latn-2015.imp +165 -0
- data/maps/sac-zho-Hans-Latn-1979.imp +20940 -0
- data/maps/sasm-mon-Mong-Latn-general-1978.imp +294 -0
- data/maps/sasm-mon-Mong-Latn-phonetic-1978.imp +261 -0
- data/maps/ses-ara-Arab-Latn-1930.imp +225 -0
- data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.imp +171 -0
- data/maps/ua-ukr-Cyrl-Latn-1996.imp +149 -0
- data/maps/ua-ukr-Cyrl-Latn-2007.imp +69 -0
- data/maps/ua-ukr-Cyrl-Latn-2010.imp +128 -0
- data/maps/un-amh-Ethi-Latn-2016.imp +483 -0
- data/maps/un-ara-Arab-Latn-1971.imp +137 -0
- data/maps/un-ara-Arab-Latn-1972.imp +155 -0
- data/maps/un-ara-Arab-Latn-2017.imp +375 -0
- data/maps/un-asm-Beng-Latn-1972.imp +188 -0
- data/maps/un-bel-Cyrl-Latn-2007.imp +78 -0
- data/maps/un-ben-Beng-Latn-2016.imp +516 -0
- data/maps/un-ell-Grek-Latn-1987-phonetic.imp +437 -0
- data/maps/un-ell-Grek-Latn-1987-tl.imp +27 -0
- data/maps/un-ell-Grek-Latn-1987-ts.imp +269 -0
- data/maps/un-guj-Gujr-Latn-1972.imp +196 -0
- data/maps/un-hin-Deva-Latn-2016.imp +356 -0
- data/maps/un-kan-Kana-Latn-2016.imp +214 -0
- data/maps/un-mal-Mlym-Latn-1972.imp +215 -0
- data/maps/un-mar-Deva-Latn-2016.imp +96 -0
- data/maps/un-mon-Mong-Latn-general-2013.imp +170 -0
- data/maps/un-mon-Mong-Latn-phonetic-2013.imp +170 -0
- data/maps/un-nep-Deva-Latn-1972.imp +295 -0
- data/maps/un-nep-Deva-Latn-2013.imp +62 -0
- data/maps/un-ori-Orya-Latn-1972.imp +208 -0
- data/maps/un-pan-Guru-Latn-1972.imp +321 -0
- data/maps/un-prs-Arab-Latn-1967.imp +214 -0
- data/maps/un-rus-Cyrl-Latn-1987.imp +96 -0
- data/maps/un-sin-Sinh-Latn-1972.imp +193 -0
- data/maps/un-tam-Taml-Latn-1972.imp +173 -0
- data/maps/un-tel-Telu-Latn-1972.imp +229 -0
- data/maps/un-ukr-Cyrl-Latn-1998.imp +58 -0
- data/maps/un-ukr-Cyrl-Latn-2012.imp +95 -0
- data/maps/un-urd-Arab-Latn-1972.imp +290 -0
- data/maps/var-amh-Ethi-Latn-eae-2003.imp +414 -0
- data/maps/var-gez-Ethi-Latn-eae-2003.imp +54 -0
- data/maps/var-hin-Deva-Latn-hunterian-1872.imp +212 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1886.imp +399 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1954.imp +382 -0
- data/maps/var-kor-Hang-Hang-jamo.imp +11196 -0
- data/maps/var-kor-Hang-Latn-mr-1939.imp +574 -0
- data/maps/var-kor-Kore-Hang-2013.imp +59764 -0
- data/maps/var-kor-Kore-Latn-mr-1939.imp +36 -0
- data/maps/var-mar-Deva-Latn-hunterian-1872.imp +39 -0
- data/maps/var-mon-Mong-Latn-1930.imp +101 -0
- data/maps/var-mon-Mong-Latn-lessing.imp +181 -0
- data/maps/var-mon-Mong-Latn-vpmc.imp +182 -0
- data/maps/var-pra-Deva-Latn-iast-1912.imp +36 -0
- data/maps/var-san-Deva-Latn-iast-1912.imp +147 -0
- data/maps/var-zho-Hani-Latn-wd-1979.imp +27549 -0
- metadata +335 -0
|
@@ -0,0 +1,214 @@
|
|
|
1
|
+
metadata {
|
|
2
|
+
authority_id: ungen
|
|
3
|
+
id: 2017
|
|
4
|
+
language: iso-639-3:prs
|
|
5
|
+
# prs stands for Dari (https://iso639-3.sil.org/code/prs)
|
|
6
|
+
source_script: Arab
|
|
7
|
+
destination_script: Latn
|
|
8
|
+
name: Persian UN 1967
|
|
9
|
+
url: http://www.eki.ee/wgrs/v2_2/rom1_fa.htm
|
|
10
|
+
creation_date: 1967
|
|
11
|
+
confirmation_date: 01-2003
|
|
12
|
+
description: |
|
|
13
|
+
The United Nations recommended system was approved in 1967 (
|
|
14
|
+
I/13), based on the official system adopted by Iran and
|
|
15
|
+
published in its English version as Transliteration of
|
|
16
|
+
Farsi Geographic Names to Latin Alphabet (September 1966).
|
|
17
|
+
The romanization table was also published as an annex to
|
|
18
|
+
the Toponymic Guidelines for the Islamic Republic of Iran
|
|
19
|
+
in 2000 (Toponymic Guidelines for map and other editors –
|
|
20
|
+
Revised edition 1998. Submitted by the Islamic Republic of
|
|
21
|
+
Iran. UNGEGN, 20th session. New York, 17-28 January 2000,
|
|
22
|
+
Working Paper No. 41.).
|
|
23
|
+
|
|
24
|
+
The system is used in the Islamic Republic of Iran and in
|
|
25
|
+
international cartographic products.
|
|
26
|
+
|
|
27
|
+
Persian (Farsi) uses the Perso-Arabic script that is
|
|
28
|
+
written from right to left. The Persian script usually
|
|
29
|
+
omits vowel points and diacritical marks from writing which
|
|
30
|
+
makes it difficult to obtain uniform results in the
|
|
31
|
+
romanization of Persian. The romanization is generally
|
|
32
|
+
reversible though there are some ambiguous letter
|
|
33
|
+
sequences (kh, sh, th, zh) which also may represent the
|
|
34
|
+
romanized values of two Persian characters in addition to
|
|
35
|
+
the respective single ones.
|
|
36
|
+
|
|
37
|
+
|
|
38
|
+
notes:
|
|
39
|
+
- A Word-initially.
|
|
40
|
+
- B Not romanized; marks absence of the vowel.
|
|
41
|
+
- C Doubling of the consonant letter.
|
|
42
|
+
- D After a consonant (excl. -ah).
|
|
43
|
+
- E After a vowel (see also note 2).
|
|
44
|
+
- 1-The adjectival ending of Arabic origin -يه in Persian is
|
|
45
|
+
romanized -īyeh. In romanizing the definite article the
|
|
46
|
+
same rules of assimilation of consonants are applied as in
|
|
47
|
+
Arabic, e.g. زين الدين Zeyn od Dīn.
|
|
48
|
+
|
|
49
|
+
- 2-The relational suffix (eẕāfeh) -e is usually not
|
|
50
|
+
expressed in Persian writing after a consonant. After final
|
|
51
|
+
ا or و it is written with ى, e.g. پاى آب Pā-ye Āb. After
|
|
52
|
+
final ى and ه it is expressed by writing hamzeh over the
|
|
53
|
+
character دهانۀ ممبر Dahāneh-ye Mambar.
|
|
54
|
+
|
|
55
|
+
- 3-To point Persian vowels two systems are in use that are
|
|
56
|
+
separated by a column in the table. The first system is a
|
|
57
|
+
Persian one while the other adheres to the Arabic
|
|
58
|
+
tradition. In normal spelling vowel points are not used.
|
|
59
|
+
}
|
|
60
|
+
|
|
61
|
+
tests {
|
|
62
|
+
test "اَنجِيرة", "Anjīrah"
|
|
63
|
+
test "اِيْوَانِي", "Eyvānī"
|
|
64
|
+
test "آبَادَان", "Ābādān"
|
|
65
|
+
test "قُرآن", "Qor’ān"
|
|
66
|
+
test "مَآب", "Ma’āb"
|
|
67
|
+
test "مُحَمَّد", "Moḩammad"
|
|
68
|
+
test "كُوهِ مَرغُوب", "Kūh-e Marghūb"
|
|
69
|
+
test "پَايِ آب", "Pā-ye Āb"
|
|
70
|
+
test "جُويِ آس", "Jū-ye Ās"
|
|
71
|
+
test "دَهَانِهٴ مَمبَر", "Dahāneh-ye Mambar"
|
|
72
|
+
test "سَلَسِيٴ بُذُرگ", "Salasī-ye Boz̄org"
|
|
73
|
+
test "ذُو الفَقَار", "Z̄ū ol Faqār"
|
|
74
|
+
}
|
|
75
|
+
|
|
76
|
+
stage {
|
|
77
|
+
# CHARACTERS
|
|
78
|
+
parallel {
|
|
79
|
+
|
|
80
|
+
sub "\u064e", "a" # َ fatha
|
|
81
|
+
sub "\u064e", "", after: "\u0629" # َ fatha followed by ta' marboota
|
|
82
|
+
sub "\u064e", "", after: "a" + any("ht") # َ fatha followed by ta' marboota, handling different order of conversion
|
|
83
|
+
sub "\u0650", "e" # ِ kasra
|
|
84
|
+
sub "\u064f", "o" # ُ damma
|
|
85
|
+
sub "\u0652", "" # ْ sokoon, see Note B
|
|
86
|
+
|
|
87
|
+
sub "\u064e\u0627", "ā" # ـَا fatha followed by ا
|
|
88
|
+
sub "\u064e\u0649", "á" # ـَى fatha followed by ى which is ا not ي
|
|
89
|
+
sub boundary + "\u0622", "ā" # آ NOTE A
|
|
90
|
+
sub "\u0622", "’ā" # آ
|
|
91
|
+
sub "\u0650\u064a", "ī" # ـِي kasra followed by ي
|
|
92
|
+
sub "\u064f\u0648", "ū" # ـُو damma followed by و
|
|
93
|
+
sub any("\u064e\u0650") + "\u064a\u0652", "ey" # ـَيْ
|
|
94
|
+
sub any("\u064e\u064f") + "\u0648\u0652", "ow" # ـَوْ
|
|
95
|
+
sub "\u0621", "’" # ء
|
|
96
|
+
sub "\u2013", "–"
|
|
97
|
+
sub "\u2013" + any("\u0649\u064a") + "\u0647", "-īyeh"
|
|
98
|
+
sub any("\u0654\u0674"), "-e" # ٴ ezafeh
|
|
99
|
+
sub any("\u0654\u0674"), "-ye", before: any("\u064a\u0647") # ٴ ezafeh
|
|
100
|
+
sub "\u0650" + boundary, "-e" # ِ kasra
|
|
101
|
+
sub any("\u064a\u06cc") + "\u0650" + boundary, "-ye" # ِ kasra
|
|
102
|
+
|
|
103
|
+
# NOTE C
|
|
104
|
+
sub "\u0628\u0651", "bb" # ب
|
|
105
|
+
sub "\u062a\u0651", "tt" # ت
|
|
106
|
+
sub "\u062b\u0651", "s̄s̄" # ث
|
|
107
|
+
sub "\u062c\u0651", "jj" # ج
|
|
108
|
+
sub "\u062d\u0651", "ḩḩ" # ح
|
|
109
|
+
sub "\u062e\u0651", "khkh" # خ with shadda: NOTE C doubles the consonant, so the digraph is written twice
|
|
110
|
+
sub "\u062f\u0651", "dd" # د
|
|
111
|
+
sub "\u0630\u0651", "z̄z̄" # ذ
|
|
112
|
+
sub "\u0631\u0651", "rr" # ر
|
|
113
|
+
sub "\u0632\u0651", "zz" # ز
|
|
114
|
+
sub "\u0633\u0651", "ss" # س
|
|
115
|
+
sub "\u0634\u0651", "shsh" # ش with shadda: NOTE C doubles the consonant, so the digraph is written twice
|
|
116
|
+
sub "\u0635\u0651", "şş" # ص
|
|
117
|
+
sub "\u0636\u0651", "ẕẕ" # ض
|
|
118
|
+
sub "\u0637\u0651", "ţţ" # ط
|
|
119
|
+
sub "\u0638\u0651", "z̧z̧" # ظ
|
|
120
|
+
sub "\u063a\u0651", "ghgh" # غ with shadda: NOTE C doubles the consonant, so the digraph is written twice
|
|
121
|
+
sub "\u0641\u0651", "ff" # ف
|
|
122
|
+
sub "\u0642\u0651", "qq" # ق
|
|
123
|
+
sub "\u0643\u0651", "kk" # ك
|
|
124
|
+
sub "\u0644\u0651", "ll" # ل
|
|
125
|
+
sub "\u0645\u0651", "mm" # م
|
|
126
|
+
sub "\u0646\u0651", "nn" # ن
|
|
127
|
+
sub "\u0647\u0651", "hh" # ه
|
|
128
|
+
sub "\u0648\u0651", "vv" # و
|
|
129
|
+
sub "\u064a\u0651", "yy" # ي
|
|
130
|
+
|
|
131
|
+
# NOTE 1
|
|
132
|
+
# Sun letters
|
|
133
|
+
sub boundary + "\u0627\u0644\u062a", "ot t" # الت
|
|
134
|
+
sub boundary + "\u0627\u0644\u062b", "os̄ s̄" # الث
|
|
135
|
+
sub boundary + "\u0627\u0644\u062f", "od d" # الد
|
|
136
|
+
sub boundary + "\u0627\u0644\u0630", "oz̄ z̄" # الذ
|
|
137
|
+
sub boundary + "\u0627\u0644\u0631", "or r" # الر
|
|
138
|
+
sub boundary + "\u0627\u0644\u0632", "oz z" # الز
|
|
139
|
+
sub boundary + "\u0627\u0644\u0633", "os s" # الس
|
|
140
|
+
sub boundary + "\u0627\u0644\u0634", "osh sh" # الش
|
|
141
|
+
sub boundary + "\u0627\u0644\u0635", "oş ş" # الص
|
|
142
|
+
sub boundary + "\u0627\u0644\u0636", "oẕ ẕ" # الض
|
|
143
|
+
sub boundary + "\u0627\u0644\u0637", "oţ ţ" # الط
|
|
144
|
+
sub boundary + "\u0627\u0644\u0638", "oz̧ z̧" # الظ
|
|
145
|
+
sub boundary + "\u0627\u0644\u0644", "ol l" # الل
|
|
146
|
+
sub boundary + "\u0627\u0644\u0646", "on n" # الن
|
|
147
|
+
|
|
148
|
+
sub "\u0650\u064a\u0651", "īy" # ـِيَّ
|
|
149
|
+
sub "\u0650\u064a", "iy", after: any("\u064e\u064f") # ـِي kasra followed by ي
|
|
150
|
+
|
|
151
|
+
# ta' marboota
|
|
152
|
+
sub "\u0629", "at" # ة in the middle of the sentence
|
|
153
|
+
sub "\u0629" + line_end, "ah"
|
|
154
|
+
sub "\u0629", "ah", before: boundary + "\u0627\u0644" + any("\u0600".."\u06ff") + any("\u0600".."\u06ff")
|
|
155
|
+
sub "\u0629", "ah", before: boundary + "\u0627\u0644" + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff")
|
|
156
|
+
sub "\u0629", "ah", before: boundary + "\u0627\u0644" + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff")
|
|
157
|
+
sub "\u0629", "ah", before: boundary + "\u0627\u0644" + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff")
|
|
158
|
+
sub "\u0629", "ah", before: boundary + "\u0627\u0644" + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff")
|
|
159
|
+
sub "\u0629", "ah", before: boundary + "\u0627\u0644" + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff")
|
|
160
|
+
sub "\u0629", "ah", before: boundary + "\u0627\u0644" + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff")
|
|
161
|
+
sub "\u0629", "ah", before: boundary + "\u0627\u0644" + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff")
|
|
162
|
+
sub "\u0629", "ah", before: boundary + "\u0627\u0644" + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff")
|
|
163
|
+
sub "\u0629", "ah", before: boundary + "\u0627\u0644" + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff")
|
|
164
|
+
sub "\u0629", "ah", before: boundary + "\u0627\u0644" + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff")
|
|
165
|
+
sub "\u0629", "ah", before: boundary + "\u0627\u0644" + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff")
|
|
166
|
+
|
|
167
|
+
sub boundary + "\u0627\u0644", "al " # ال
|
|
168
|
+
sub space + boundary + "\u0627\u0644", " ol " # ال #special Rule 1
|
|
169
|
+
|
|
170
|
+
sub boundary + "\u0627", "" # ا initial
|
|
171
|
+
sub "\u0627", "ā" # ا medial
|
|
172
|
+
sub "\u0627" + boundary, "ā" # ا final
|
|
173
|
+
|
|
174
|
+
sub "\u0628", "b" # ب
|
|
175
|
+
sub "\u067E", "p" # پ
|
|
176
|
+
sub "\u062A", "t" # ت
|
|
177
|
+
sub "\u062B", "s̄" # ث
|
|
178
|
+
sub "\u062C", "j" # ج
|
|
179
|
+
sub "\u0686", "ch" # چ
|
|
180
|
+
sub "\u062D", "ḩ" # ح
|
|
181
|
+
sub "\u062E", "kh" # خ
|
|
182
|
+
sub "\u062F", "d" # د
|
|
183
|
+
sub "\u0630", "z̄" # ذ
|
|
184
|
+
sub "\u0631", "r" # ر
|
|
185
|
+
sub "\u0632", "z" # ز
|
|
186
|
+
sub "\u0698", "zh" # ژ
|
|
187
|
+
sub "\u0633", "s" # س
|
|
188
|
+
sub "\u0634", "sh" # ش
|
|
189
|
+
sub "\u0635", "ş" # ص
|
|
190
|
+
sub "\u0636", "ẕ" # ض
|
|
191
|
+
sub "\u0637", "ţ" # ط
|
|
192
|
+
sub "\u0638", "z̧" # ظ
|
|
193
|
+
sub "\u0639", "’" # ع
|
|
194
|
+
sub "\u063A", "gh" # غ
|
|
195
|
+
sub "\u0641", "f" # ف
|
|
196
|
+
sub "\u0642", "q" # ق
|
|
197
|
+
sub "\u0643", "k" # ك
|
|
198
|
+
sub "\u06A9", "k" # ک
|
|
199
|
+
sub "\u06AF", "g" # گ
|
|
200
|
+
sub "\u0644", "l" # ل
|
|
201
|
+
sub "\u0645", "m" # م
|
|
202
|
+
sub "\u0646", "n" # ن
|
|
203
|
+
sub "\u0648", "v" # و
|
|
204
|
+
sub "\u0647", "h" # ه
|
|
205
|
+
sub "\u0649", "y" # ى (U+0649, alef maksura)
|
|
206
|
+
sub "\u064a", "y" # ي
|
|
207
|
+
}
|
|
208
|
+
|
|
209
|
+
# POSTRULES
|
|
210
|
+
sub any("\u0061".."\uFFFF"), upcase, before: boundary, not_before: boundary + any("‘’'-")
|
|
211
|
+
|
|
212
|
+
sub " Al", " al"
|
|
213
|
+
sub " Ol", " ol"
|
|
214
|
+
}
|
|
@@ -0,0 +1,96 @@
|
|
|
1
|
+
metadata {
|
|
2
|
+
authority_id: ungegn
|
|
3
|
+
id: 1987
|
|
4
|
+
language: iso-639-2:rus
|
|
5
|
+
source_script: Cyrl
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Russian Romanization system
|
|
8
|
+
url: http://www.eki.ee/wgrs/rom1_ru.htm
|
|
9
|
+
creation_date: 1987
|
|
10
|
+
confirmation_date: 2016
|
|
11
|
+
description: |
|
|
12
|
+
The United Nations recommended system was approved in 1987 (V/18),
|
|
13
|
+
based on the official system of the Main Administration of Geodesy and
|
|
14
|
+
Cartography of the former Soviet Union, also known as the GOST 1983
|
|
15
|
+
system (GOST 16876-71). The table was published as an annex to the
|
|
16
|
+
resolution.
|
|
17
|
+
|
|
18
|
+
The system is used in the Russian Federation and increasingly in
|
|
19
|
+
international cartographic products.
|
|
20
|
+
|
|
21
|
+
Russian uses the Cyrillic script which is alphabetic. The
|
|
22
|
+
romanization table is unambiguous and can be applied automatically. The
|
|
23
|
+
system is reversible, although rarely there can be ambiguities.
|
|
24
|
+
|
|
25
|
+
notes:
|
|
26
|
+
- "Cursive forms of some characters might be formed differently: Аа Бб
|
|
27
|
+
Вв Гг Дд Ее Ёё Жж Зз Ии Йй Кк Лл Мм Нн Оо Пп Рр Сс Тт Уу Фф Хх Цц Чч Шш
|
|
28
|
+
Щщ Ъъ Ыы Ьь Ээ Юю Яя."
|
|
29
|
+
|
|
30
|
+
- Fifth United Nations Conference on the Standardization of
|
|
31
|
+
Geographical Names. Montreal, 18–31 August 1987. Vol. I. Report of the
|
|
32
|
+
Conference, pp. 40–41.
|
|
33
|
+
}
|
|
34
|
+
|
|
35
|
+
tests {
|
|
36
|
+
test "Aнaпa", "Anapa"
|
|
37
|
+
test "Бaбушкин", "Babuškin"
|
|
38
|
+
test "Вaвилово", "Vavilovo"
|
|
39
|
+
test "Гaгaрин", "Gagarin"
|
|
40
|
+
test "Дудинкa", "Dudinka"
|
|
41
|
+
test "Елисeeвкa", "Eliseevka"
|
|
42
|
+
test "Ёлкино", "Ëlkino"
|
|
43
|
+
test "Псëл", "Psël"
|
|
44
|
+
test "Жужa", "Žuža"
|
|
45
|
+
test "Звëздный", "Zvëzdnyj"
|
|
46
|
+
test "Идрицa", "Idrica"
|
|
47
|
+
test "Зaрaйск", "Zarajsk"
|
|
48
|
+
test "Кокaнд", "Kokand"
|
|
49
|
+
test "Лaлвaр", "Lalvar"
|
|
50
|
+
test "Мaймaк", "Majmak"
|
|
51
|
+
test "Нeжин", "Nežin"
|
|
52
|
+
test "Обoдoвкa", "Obodovka"
|
|
53
|
+
test "Пaп", "Pap"
|
|
54
|
+
test "Рeбрихa", "Rebriha"
|
|
55
|
+
test "Сaсoвo", "Sasovo"
|
|
56
|
+
test "Тaттa", "Tatta"
|
|
57
|
+
test "Уржум", "Uržum"
|
|
58
|
+
test "Фoфaнoвo", "Fofanovo"
|
|
59
|
+
test "Хoхломa", "Hohloma"
|
|
60
|
+
test "Цвeткoвo", "Cvetkovo"
|
|
61
|
+
test "Чeчeльник", "Čečel’nik"
|
|
62
|
+
test "Шишкинo", "Šiškino"
|
|
63
|
+
test "Щукинo", "Ščukino"
|
|
64
|
+
test "Пoдъячeвo", "Pod”jačevo"
|
|
65
|
+
test "Ыныкчaнский", "Ynykčanskij"
|
|
66
|
+
test "Пaрaньгa", "Paran’ga"
|
|
67
|
+
test "Кaзaнь", "Kazan’"
|
|
68
|
+
test "Щучьe", "Ščuč’e"
|
|
69
|
+
test "Элистa", "Èlista"
|
|
70
|
+
test "Юринo", "Jurino"
|
|
71
|
+
test "Юхнoв", "Juhnov"
|
|
72
|
+
test "Юрюзaнь", "Jurjuzan’"
|
|
73
|
+
test "Ямaл", "Jamal"
|
|
74
|
+
test "Язъявaн", "Jaz”javan"
|
|
75
|
+
test "Яя", "Jaja"
|
|
76
|
+
test "Вязьмa", "Vjaz’ma"
|
|
77
|
+
}
|
|
78
|
+
|
|
79
|
+
dependency "gost-rus-Cyrl-Latn-16876-71-1983", as: cyrllatn
|
|
80
|
+
|
|
81
|
+
|
|
82
|
+
stage {
|
|
83
|
+
# CHARACTERS
|
|
84
|
+
parallel {
|
|
85
|
+
sub "\u042A", "”" # Ъ
|
|
86
|
+
sub "\u042C", "’" # Ь
|
|
87
|
+
sub "\u044A", "”" # ъ
|
|
88
|
+
sub "\u044C", "’" # ь
|
|
89
|
+
sub "\u042E", "Ju" # Ю
|
|
90
|
+
sub "\u044E", "ju" # ю
|
|
91
|
+
sub "\u042F", "Ja" # Я
|
|
92
|
+
sub "\u044F", "ja" # я
|
|
93
|
+
}
|
|
94
|
+
|
|
95
|
+
run map.cyrllatn.stage.main
|
|
96
|
+
}
|
|
@@ -0,0 +1,193 @@
|
|
|
1
|
+
metadata {
|
|
2
|
+
authority_id: un
|
|
3
|
+
id: 1972
|
|
4
|
+
language: iso-639-2:sin
|
|
5
|
+
source_script: Sinh
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES --Sinhalese Romanization Version 4.0
|
|
8
|
+
url: https://www.eki.ee/wgrs/rom1_si.htm
|
|
9
|
+
creation_date: 1972
|
|
10
|
+
confirmation_date: 2016
|
|
11
|
+
description: |
|
|
12
|
+
There does not seem to exist any national system of romanization for Sinhalese (Sinhala) in Sri Lanka.
|
|
13
|
+
|
|
14
|
+
In 1972, D. N. Sharma prepared a romanization table for Sinhalese (Sinhala) which was published in vol. II
|
|
15
|
+
of the conference report together with the other languages of the Indian group.
|
|
16
|
+
|
|
17
|
+
Sinhalese uses an alphasyllabic script whereby each character represents a syllable rather than one sound.
|
|
18
|
+
Vowels and diphthongs are marked in two ways: as independent characters (used syllable-initially) and in an
|
|
19
|
+
abbreviated form, to denote vowels after consonants.
|
|
20
|
+
|
|
21
|
+
|
|
22
|
+
notes:
|
|
23
|
+
- |
|
|
24
|
+
The character ඇ was romanized as a͝i and the character ඈ as ai in Sharma's table, but there was no romanization for the character ඓ which,
|
|
25
|
+
though rarely used, represents the ai proper of the Indian languages; here the romanization of these characters is given in accordance with the pronunciation.
|
|
26
|
+
- |
|
|
27
|
+
ැ ෑ Exceptions: රැ ræ̆, රෑ ræ.
|
|
28
|
+
- |
|
|
29
|
+
ු Exceptions: කු ku, ගු gu, තු tu, භු bhu, රු ru, ශු shu.
|
|
30
|
+
- |
|
|
31
|
+
ූ Exceptions: කූ kū, ගූ gū, තූ tū, භූ bhū, රූ rū, ශූ shū.
|
|
32
|
+
- |
|
|
33
|
+
් Marks absence of the inherent vowel. Special forms: ඛ් kh, ඞ් ṅ, ච් ch, ට් ṭ, ඩ් ḍ, ධ් dh, බ් b, ම් m, ව් v.
|
|
34
|
+
- |
|
|
35
|
+
ඛ ඝ ඞ ච ඡ ඣ ඤ ඨ ඪ ථ ධ ඵ භ ශ ෂ These consonants are used only in Sanskrit and Pali loanwords.
|
|
36
|
+
}
|
|
37
|
+
|
|
38
|
+
tests {
|
|
39
|
+
test "ශී්ර ලංකාවේ කී්රඩාව ඉතිහාසයේ ඉහළම තැනකට ගේන්න කටයුතු කරනවා", "shīra laṁkāve kīraḍāva itihāsaye ihaḷama tæ̆nakaṭa genna kaṭayutu karanavā"
|
|
40
|
+
test "කොච්චිකඬේ මෝයකට අසල නෑමට ගිය තරුණයෝ ෩ක් මරුට - මිතුරාගේ උපන් දිනය සැමරීමට ඇවිත්", "kŏchchikaඬe moyakaṭa asala næmaṭa giya taruṇayo 3k maruṭa - miturāge upan dinaya sæ̆marīmaṭa æ̆vit"
|
|
41
|
+
test "ලෝක ළමා දිනයදා සිසුන් පිරිසක් කසිප්පු බීලා", "loka ḷamā dinayadā sisun pirisak kasippu bīlā"
|
|
42
|
+
test "කෝටි 16ක හෙරොයින් සමග දන්කොටුවේදී 7ක් දැලේ", "koṭi 16ka hĕrŏyin samaga dankŏṭuvedī 7k dæ̆le"
|
|
43
|
+
test "මිනුවන්ගොඩ පීසීආර් දෙදහසක් සිදුකරයි", "minuvangŏḍa pīsīār dĕdahasak sidukarayi"
|
|
44
|
+
test "පාස්කු ප්රහාරය වගේම පාස්කු ප්රෝඩාව ගැනත් සොයන්න කොමිසමක් පත්කළ යුතුයි - විපක්ෂ නායක සජිත් පේ්රමදාස", "pāsku parahāraya vagema pāsku proḍāva gæ̆nat sŏyanna kŏmisamak patkaḷa yutuyi - vipakṣha nāyaka sajit peramadāsa"
|
|
45
|
+
test "ට්රම්ප්ගේ සෞඛ්යය තීරණාත්මකයි - ට්විටර් හරහා ජනතාව අමතයි", "ṭarampge saukhyaya tīraṇātmakayi - ṭviṭar harahā janatāva amatayi"
|
|
46
|
+
test "පාස්කු දා ප්රහාරය පිළිබඳ පරීක්ෂණවලින් කිසිවකුට අසාධාරණයක් වීමට ඉඩ දෙන්නේ නෑ - අගමැති", "pāsku dā parahāraya piḷibaඳ parīkṣhaṇavalin kisivakuṭa asādhāraṇayak vīmaṭa iḍa dĕnne næ - agamæ̆ti"
|
|
47
|
+
test "දිල්ලි කැපිටල්ස් සහ කෝලිගේ බැංගලෝර් තෙවැනි ජය ලබයි", "dilli kæ̆piṭals saha kolige bæ̆ṁgalor tĕvæ̆ni jaya labayi"
|
|
48
|
+
test "ශ්රී ලාංකික සම්භවයක් සහිත ප්රංශයේ පවුලක 5 ක් ඝාතනය කරලා", "sharī lāṁkika sambhavayak sahita paraṁshaye pavulaka 5 k ghātanaya karalā"
|
|
49
|
+
test "පැතිකුදය ඉක්මනින් සුව කරන ප්රතිකාර", "pæ̆tikudaya ikmanin suva karana paratikāra"
|
|
50
|
+
}
|
|
51
|
+
|
|
52
|
+
aliases {
|
|
53
|
+
def_alias sinh_chars_1, any("\u0dcf\u0dd0\u0dd1\u0dd2\u0dd3\u0dd4\u0dd6\u0dd8\u0df2\u0dd9\u0dda\u0ddb\u0ddc\u0ddd\u0dde\u0dca")
|
|
54
|
+
}
|
|
55
|
+
|
|
56
|
+
stage {
|
|
57
|
+
|
|
58
|
+
# RULES
|
|
59
|
+
sub "ක", "k", after: sinh_chars_1
|
|
60
|
+
sub "ඛ", "kh", after: sinh_chars_1
|
|
61
|
+
sub "ග", "g", after: sinh_chars_1
|
|
62
|
+
sub "ඝ", "gh", after: sinh_chars_1
|
|
63
|
+
sub "ඞ", "ṅ", after: sinh_chars_1
|
|
64
|
+
sub "ච", "ch", after: sinh_chars_1
|
|
65
|
+
sub "ඡ", "chh", after: sinh_chars_1
|
|
66
|
+
sub "ජ", "j", after: sinh_chars_1
|
|
67
|
+
sub "ඣ", "jh", after: sinh_chars_1
|
|
68
|
+
sub "ඤ", "ñ", after: sinh_chars_1
|
|
69
|
+
sub "ට", "ṭ", after: sinh_chars_1
|
|
70
|
+
sub "ඨ", "ṭh", after: sinh_chars_1
|
|
71
|
+
sub "ඩ", "ḍ", after: sinh_chars_1
|
|
72
|
+
sub "ඪ", "ḍh", after: sinh_chars_1
|
|
73
|
+
sub "ණ", "ṇ", after: sinh_chars_1
|
|
74
|
+
sub "ත", "t", after: sinh_chars_1
|
|
75
|
+
sub "ථ", "th", after: sinh_chars_1
|
|
76
|
+
sub "ද", "d", after: sinh_chars_1
|
|
77
|
+
sub "ධ", "dh", after: sinh_chars_1
|
|
78
|
+
sub "න", "n", after: sinh_chars_1
|
|
79
|
+
sub "ප", "p", after: sinh_chars_1
|
|
80
|
+
sub "ඵ", "ph", after: sinh_chars_1
|
|
81
|
+
sub "බ", "b", after: sinh_chars_1
|
|
82
|
+
sub "භ", "bh", after: sinh_chars_1
|
|
83
|
+
sub "ම", "m", after: sinh_chars_1
|
|
84
|
+
sub "ය", "y", after: sinh_chars_1
|
|
85
|
+
sub "ර", "r", after: sinh_chars_1
|
|
86
|
+
sub "ල", "l", after: sinh_chars_1
|
|
87
|
+
sub "ව", "v", after: sinh_chars_1
|
|
88
|
+
sub "ශ", "sh", after: sinh_chars_1
|
|
89
|
+
sub "ෂ", "ṣh", after: sinh_chars_1
|
|
90
|
+
sub "ස", "s", after: sinh_chars_1
|
|
91
|
+
sub "හ", "h", after: sinh_chars_1
|
|
92
|
+
sub "ෆ", "f", after: sinh_chars_1
|
|
93
|
+
sub "ළ", "ḷ", after: sinh_chars_1
|
|
94
|
+
|
|
95
|
+
|
|
96
|
+
# CHARACTERS
|
|
97
|
+
parallel {
|
|
98
|
+
# I. Independent vowel characters
|
|
99
|
+
sub "අ", "a"
|
|
100
|
+
sub "ආ", "ā"
|
|
101
|
+
sub "ඇ", "æ̆"
|
|
102
|
+
sub "ඈ", "æ"
|
|
103
|
+
sub "ඉ", "i"
|
|
104
|
+
sub "ඊ", "ī"
|
|
105
|
+
sub "උ", "u"
|
|
106
|
+
sub "ඌ", "ū"
|
|
107
|
+
sub "ඍ", "ṛ"
|
|
108
|
+
sub "ඎ", "ṝ"
|
|
109
|
+
sub "එ", "ĕ"
|
|
110
|
+
sub "ඒ", "e"
|
|
111
|
+
sub "ඓ", "ai"
|
|
112
|
+
sub "ඔ", "ŏ"
|
|
113
|
+
sub "ඕ", "o"
|
|
114
|
+
sub "ඖ", "au"
|
|
115
|
+
|
|
116
|
+
# II. Abbreviated vowel characters and other symbols
|
|
117
|
+
sub "ා", "ā"
|
|
118
|
+
sub "ැ", "æ̆"
|
|
119
|
+
sub "ෑ", "æ"
|
|
120
|
+
sub "ි", "i"
|
|
121
|
+
sub "ී", "ī"
|
|
122
|
+
sub "ු", "u"
|
|
123
|
+
sub "ූ", "ū"
|
|
124
|
+
sub "ෘ", "ṛ"
|
|
125
|
+
sub "ෲ", "ṝ"
|
|
126
|
+
sub "ෙ", "ĕ"
|
|
127
|
+
sub "ේ", "e"
|
|
128
|
+
sub "ෛ", "ai"
|
|
129
|
+
sub "ො", "ŏ"
|
|
130
|
+
sub "ෝ", "o"
|
|
131
|
+
sub "ෞ", "au"
|
|
132
|
+
sub "ඃ", "ḥ"
|
|
133
|
+
sub "ං", "ṁ"
|
|
134
|
+
sub "්", ""
|
|
135
|
+
|
|
136
|
+
|
|
137
|
+
# III. Consonant characters
|
|
138
|
+
sub "ක", "ka"
|
|
139
|
+
sub "ඛ", "kha"
|
|
140
|
+
sub "ග", "ga"
|
|
141
|
+
sub "ඝ", "gha"
|
|
142
|
+
sub "ඞ", "ṅa"
|
|
143
|
+
sub "ච", "cha"
|
|
144
|
+
sub "ඡ", "chha"
|
|
145
|
+
sub "ජ", "ja"
|
|
146
|
+
sub "ඣ", "jha"
|
|
147
|
+
sub "ඤ", "ña"
|
|
148
|
+
sub "ට", "ṭa"
|
|
149
|
+
sub "ඨ", "ṭha"
|
|
150
|
+
sub "ඩ", "ḍa"
|
|
151
|
+
sub "ඪ", "ḍha"
|
|
152
|
+
sub "ණ", "ṇa"
|
|
153
|
+
sub "ත", "ta"
|
|
154
|
+
sub "ථ", "tha"
|
|
155
|
+
sub "ද", "da"
|
|
156
|
+
sub "ධ", "dha"
|
|
157
|
+
sub "න", "na"
|
|
158
|
+
sub "ප", "pa"
|
|
159
|
+
sub "ඵ", "pha"
|
|
160
|
+
sub "බ", "ba"
|
|
161
|
+
sub "භ", "bha"
|
|
162
|
+
sub "ම", "ma"
|
|
163
|
+
sub "ය", "ya"
|
|
164
|
+
sub "ර", "ra"
|
|
165
|
+
sub "ල", "la"
|
|
166
|
+
sub "ව", "va"
|
|
167
|
+
sub "ශ", "sha"
|
|
168
|
+
sub "ෂ", "ṣha"
|
|
169
|
+
sub "ස", "sa"
|
|
170
|
+
sub "හ", "ha"
|
|
171
|
+
sub "ෆ", "fa"
|
|
172
|
+
sub "ළ", "ḷa"
|
|
173
|
+
|
|
174
|
+
# numbers
|
|
175
|
+
sub "\u0DE6", "0"
|
|
176
|
+
sub "\u0DE7", "1"
|
|
177
|
+
sub "\u0DE8", "2"
|
|
178
|
+
sub "\u0DE9", "3"
|
|
179
|
+
sub "\u0DEA", "4"
|
|
180
|
+
sub "\u0DEB", "5"
|
|
181
|
+
sub "\u0DEC", "6"
|
|
182
|
+
sub "\u0DED", "7"
|
|
183
|
+
sub "\u0DEE", "8"
|
|
184
|
+
sub "\u0DEF", "9"
|
|
185
|
+
|
|
186
|
+
|
|
187
|
+
sub "\u200D", ""  # ZWJ (zero-width joiner): used for joining
|
|
188
|
+
sub "\u200C", ""  # ZWNJ (zero-width non-joiner): used for non joining
|
|
189
|
+
}
|
|
190
|
+
|
|
191
|
+
compose
|
|
192
|
+
}
|
|
193
|
+
|