interscript-maps 2.0.5
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +7 -0
- data/README.adoc +28 -0
- data/interscript-maps.gemspec +28 -0
- data/interscript-maps.yaml +235 -0
- data/libs/posix.iml +11 -0
- data/libs/unicode.iml +13 -0
- data/libs/var-Cyrl.iml +7 -0
- data/libs/var-kor.iml +17 -0
- data/maps-staging/royin-tha-Thai-Latn-1939-generic.imp +98 -0
- data/maps-staging/royin-tha-Thai-Latn-1968.imp +156 -0
- data/maps-staging/royin-tha-Thai-Latn-1999-chained.imp +161 -0
- data/maps-staging/royin-tha-Thai-Latn-1999.imp +78 -0
- data/maps-staging/var-tha-Thai-Thai-phonemic.imp +53 -0
- data/maps-staging/var-tha-Thai-Zsym-ipa.imp +273 -0
- data/maps/acadsin-zho-Hani-Latn-2002.imp +27515 -0
- data/maps/alalc-amh-Ethi-Latn-1997.imp +392 -0
- data/maps/alalc-amh-Ethi-Latn-2011.imp +85 -0
- data/maps/alalc-ara-Arab-Latn-1997.imp +1171 -0
- data/maps/alalc-asm-Deva-Latn-1997.imp +214 -0
- data/maps/alalc-asm-Deva-Latn-2012.imp +53 -0
- data/maps/alalc-aze-Arab-Latn-1997.imp +321 -0
- data/maps/alalc-aze-Cyrl-Latn-1997.imp +101 -0
- data/maps/alalc-bel-Cyrl-Latn-1997.imp +118 -0
- data/maps/alalc-ben-Beng-Latn-1997.imp +225 -0
- data/maps/alalc-ben-Beng-Latn-2017.imp +135 -0
- data/maps/alalc-bul-Cyrl-Latn-1997.imp +110 -0
- data/maps/alalc-div-Thaa-Latn-1997.imp +171 -0
- data/maps/alalc-ell-Grek-Latn-1997.imp +381 -0
- data/maps/alalc-ell-Grek-Latn-2010.imp +382 -0
- data/maps/alalc-guj-Gujr-Latn-1997.imp +223 -0
- data/maps/alalc-guj-Gujr-Latn-2011.imp +57 -0
- data/maps/alalc-hin-Deva-Latn-1997.imp +248 -0
- data/maps/alalc-hin-Deva-Latn-2011.imp +63 -0
- data/maps/alalc-kan-Kana-Latn-1997.imp +233 -0
- data/maps/alalc-kan-Kana-Latn-2011.imp +58 -0
- data/maps/alalc-kat-Geok-Latn-1997.imp +109 -0
- data/maps/alalc-kat-Geor-Latn-1997.imp +104 -0
- data/maps/alalc-kor-Hang-Latn-1997.imp +68 -0
- data/maps/alalc-mal-Mlym-Latn-1997.imp +260 -0
- data/maps/alalc-mal-Mlym-Latn-2012.imp +65 -0
- data/maps/alalc-mar-Deva-Latn-1997.imp +178 -0
- data/maps/alalc-mar-Deva-Latn-2011.imp +51 -0
- data/maps/alalc-mkd-Cyrl-Latn-1997.imp +125 -0
- data/maps/alalc-mkd-Cyrl-Latn-2013.imp +113 -0
- data/maps/alalc-mon-Cyrl-Latn-1997.imp +161 -0
- data/maps/alalc-ori-Orya-Latn-1997.imp +234 -0
- data/maps/alalc-ori-Orya-Latn-2011.imp +59 -0
- data/maps/alalc-pan-Guru-Latn-1997.imp +241 -0
- data/maps/alalc-pan-Guru-Latn-2011.imp +71 -0
- data/maps/alalc-per-Arab-Latn-1997.imp +318 -0
- data/maps/alalc-pli-Deva-Latn-2012.imp +140 -0
- data/maps/alalc-pra-Deva-Latn-2012.imp +52 -0
- data/maps/alalc-rus-Cyrl-Latn-1997.imp +165 -0
- data/maps/alalc-rus-Cyrl-Latn-2012.imp +107 -0
- data/maps/alalc-san-Deva-Latn-2012.imp +207 -0
- data/maps/alalc-sin-Sinh-Latn-1997.imp +246 -0
- data/maps/alalc-sin-Sinh-Latn-2011.imp +63 -0
- data/maps/alalc-srp-Cyrl-Latn-1997.imp +124 -0
- data/maps/alalc-srp-Cyrl-Latn-2013.imp +115 -0
- data/maps/alalc-tam-Taml-Latn-1997.imp +52 -0
- data/maps/alalc-tam-Taml-Latn-2011.imp +49 -0
- data/maps/alalc-tel-Telu-Latn-1997.imp +237 -0
- data/maps/alalc-tel-Telu-Latn-2011.imp +58 -0
- data/maps/alalc-ukr-Cyrl-Latn-1997.imp +123 -0
- data/maps/alalc-ukr-Cyrl-Latn-2011.imp +32 -0
- data/maps/apcbg-bul-Cyrl-Latn-1995.imp +194 -0
- data/maps/az-aze-Cyrl-Latn-1939.imp +105 -0
- data/maps/az-aze-Cyrl-Latn-1958.imp +50 -0
- data/maps/bas-rus-Cyrl-Latn-2017-bss.imp +160 -0
- data/maps/bas-rus-Cyrl-Latn-2017-oss.imp +165 -0
- data/maps/bgn-jpn-Hrkt-Latn-1962.imp +288 -0
- data/maps/bgn-kor-Hang-Latn-1943.imp +31 -0
- data/maps/bgn-kor-Kore-Latn-1943.imp +33 -0
- data/maps/bgna-bul-Cyrl-Latn-2006.imp +119 -0
- data/maps/bgna-bul-Cyrl-Latn-2009.imp +119 -0
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +393 -0
- data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +472 -0
- data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +125 -0
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +111 -0
- data/maps/bgnpcgn-bak-Cyrl-Latn-2007.imp +169 -0
- data/maps/bgnpcgn-bal-Arab-Latn-2008.imp +296 -0
- data/maps/bgnpcgn-bel-Cyrl-Latn-1979.imp +200 -0
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +137 -0
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +38 -0
- data/maps/bgnpcgn-che-Cyrl-Latn-2008.imp +176 -0
- data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +56 -0
- data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +90 -0
- data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +71 -0
- data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +443 -0
- data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +269 -0
- data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +41 -0
- data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +28 -0
- data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +111 -0
- data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +42 -0
- data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +32 -0
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +191 -0
- data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +116 -0
- data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +43 -0
- data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +193 -0
- data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +170 -0
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +177 -0
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +40 -0
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +41 -0
- data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +240 -0
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +132 -0
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +174 -0
- data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +168 -0
- data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +208 -0
- data/maps/bgnpcgn-per-Arab-Latn-1958.imp +312 -0
- data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +552 -0
- data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +445 -0
- data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +289 -0
- data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +165 -0
- data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +133 -0
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +195 -0
- data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +48 -0
- data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +55 -0
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +146 -0
- data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +185 -0
- data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +188 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +136 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +88 -0
- data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +333 -0
- data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +145 -0
- data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +74 -0
- data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +7463 -0
- data/maps/bis-asm-Beng-Latn-13194-1991.imp +154 -0
- data/maps/bis-ben-Beng-Latn-13194-1991.imp +151 -0
- data/maps/bis-dev-Deva-Latn-13194-1991.imp +178 -0
- data/maps/bis-guj-Gujr-Latn-13194-1991.imp +172 -0
- data/maps/bis-kan-Kana-Latn-13194-1991.imp +166 -0
- data/maps/bis-mlm-Mlym-Latn-13194-1991.imp +170 -0
- data/maps/bis-ori-Orya-Latn-13194-1991.imp +168 -0
- data/maps/bis-pnj-Guru-Latn-13194-1991.imp +169 -0
- data/maps/bis-tel-Telu-Latn-13194-1991.imp +165 -0
- data/maps/bis-tml-Taml-Latn-13194-1991.imp +149 -0
- data/maps/by-bel-Cyrl-Latn-1998.imp +123 -0
- data/maps/by-bel-Cyrl-Latn-2007.imp +77 -0
- data/maps/din-grc-Grek-Latn-31634-2011-t1.imp +627 -0
- data/maps/din-hin-Deva-Latn-33904-2018.imp +101 -0
- data/maps/din-kat-Geor-Latn-32707-2010.imp +103 -0
- data/maps/din-mar-Deva-Latn-33904-2018.imp +83 -0
- data/maps/din-nep-Deva-Latn-33904-2018.imp +110 -0
- data/maps/din-pli-Deva-Latn-33904-2018.imp +72 -0
- data/maps/din-pra-Deva-Latn-33904-2018.imp +66 -0
- data/maps/din-san-Deva-Latn-33904-2018.imp +294 -0
- data/maps/din-tam-Taml-Latn-33903-2016.imp +187 -0
- data/maps/dos-nep-Deva-Latn-1997.imp +47 -0
- data/maps/elot-ell-Grek-Latn-743-1982-tl.imp +399 -0
- data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +397 -0
- data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +34 -0
- data/maps/elot-ell-Grek-Latn-743-2001-ts.imp +178 -0
- data/maps/ggg-kat-Geor-Latn-2002.imp +75 -0
- data/maps/gki-bel-Cyrl-Latn-1992.imp +44 -0
- data/maps/gki-bel-Cyrl-Latn-2000.imp +159 -0
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +179 -0
- data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.imp +132 -0
- data/maps/hk-yue-Hani-Latn-1888.imp +29201 -0
- data/maps/icao-bel-Cyrl-Latn-9303.imp +136 -0
- data/maps/icao-bul-Cyrl-Latn-9303.imp +127 -0
- data/maps/icao-fas-Arab-Latn-9303.imp +112 -0
- data/maps/icao-heb-Hebr-Latn-9303.imp +160 -0
- data/maps/icao-mkd-Cyrl-Latn-9303.imp +126 -0
- data/maps/icao-rus-Cyrl-Latn-9303.imp +126 -0
- data/maps/icao-srp-Cyrl-Latn-9303.imp +126 -0
- data/maps/icao-ukr-Cyrl-Latn-9303.imp +127 -0
- data/maps/iso-ara-Arab-Latn-233-1984.imp +301 -0
- data/maps/iso-asm-Beng-Latn-15919-2001.imp +73 -0
- data/maps/iso-ben-Beng-Latn-15919-2001.imp +171 -0
- data/maps/iso-ell-Grek-Latn-843-1997-t1.imp +365 -0
- data/maps/iso-ell-Grek-Latn-843-1997-t2.imp +43 -0
- data/maps/iso-guj-Gujr-Latn-15919-2001.imp +214 -0
- data/maps/iso-hin-Deva-Latn-15919-2001.imp +73 -0
- data/maps/iso-inc-Deva-Latn-15919-2001.imp +61 -0
- data/maps/iso-jpn-Hrkt-Latn-3602-1989.imp +59 -0
- data/maps/iso-kan-Kana-Latn-15919-2001.imp +212 -0
- data/maps/iso-kat-Geor-Latn-9984-1996.imp +103 -0
- data/maps/iso-kor-Hang-Latn-1996-method1.imp +140 -0
- data/maps/iso-kor-Hang-Latn-1996-method2.imp +132 -0
- data/maps/iso-mal-Mlym-Latn-15919-2001.imp +276 -0
- data/maps/iso-mar-Deva-Latn-15919-2001.imp +68 -0
- data/maps/iso-nep-Deva-Latn-15919-2001.imp +75 -0
- data/maps/iso-ori-Orya-Latn-15919-2001.imp +188 -0
- data/maps/iso-pan-Guru-Latn-15919-2001.imp +217 -0
- data/maps/iso-pli-Beng-Latn-15919-2001.imp +66 -0
- data/maps/iso-pli-Deva-Latn-15919-2001.imp +68 -0
- data/maps/iso-pli-Sinh-Latn-15919-2001.imp +211 -0
- data/maps/iso-pli-Thai-Latn-15919-2001.imp +47 -0
- data/maps/iso-pra-Deva-Latn-15919-2001.imp +60 -0
- data/maps/iso-prs-Arab-Latn-233-3-1999.imp +352 -0
- data/maps/iso-rus-Cyrl-Latn-9-1995.imp +279 -0
- data/maps/iso-san-Deva-Latn-15919-2001.imp +215 -0
- data/maps/iso-tam-Taml-Latn-15919-2001.imp +153 -0
- data/maps/iso-tel-Telu-Latn-15919-2001.imp +214 -0
- data/maps/iso-tha-Thai-Latn-11940-1998.imp +114 -0
- data/maps/kp-kor-Hang-Latn-2002.imp +540 -0
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +29005 -0
- data/maps/masm-mon-Cyrl-Latn-5217-2012.imp +136 -0
- data/maps/masm-mon-Latn-Cyrl-5217-2012.imp +162 -0
- data/maps/mext-jpn-Hrkt-Latn-1954.imp +403 -0
- data/maps/moct-kor-Hang-Latn-2000.imp +475 -0
- data/maps/mofa-jpn-Hrkt-Latn-1989.imp +484 -0
- data/maps/mv-div-Thaa-Latn-1987.imp +144 -0
- data/maps/mvd-bel-Cyrl-Latn-2008.imp +224 -0
- data/maps/mvd-bel-Cyrl-Latn-2010.imp +64 -0
- data/maps/mvd-rus-Cyrl-Latn-2008.imp +110 -0
- data/maps/mvd-rus-Cyrl-Latn-2010.imp +40 -0
- data/maps/odni-ara-Arab-Latn-2004.imp +106 -0
- data/maps/odni-ara-Arab-Latn-2015.imp +281 -0
- data/maps/odni-aze-Cyrl-Latn-2015.imp +158 -0
- data/maps/odni-bel-Cyrl-Latn-2015.imp +138 -0
- data/maps/odni-bul-Cyrl-Latn-2005.imp +90 -0
- data/maps/odni-bul-Cyrl-Latn-2015.imp +103 -0
- data/maps/odni-che-Cyrl-Latn-2015.imp +165 -0
- data/maps/odni-fas-Arab-Latn-2004.imp +268 -0
- data/maps/odni-fas-Arab-Latn-2015.imp +398 -0
- data/maps/odni-hin-Deva-Latn-2004.imp +180 -0
- data/maps/odni-hin-Deva-Latn-2015.imp +256 -0
- data/maps/odni-kat-Geor-Latn-2015.imp +76 -0
- data/maps/odni-kaz-Cyrl-Latn-2015.imp +164 -0
- data/maps/odni-kir-Cyrl-Latn-2015.imp +149 -0
- data/maps/odni-kor-Hang-Latn-2015.imp +307 -0
- data/maps/odni-mkd-Cyrl-Latn-2005.imp +28 -0
- data/maps/odni-mkd-Cyrl-Latn-2015.imp +124 -0
- data/maps/odni-prs-Arab-Latn-2004.imp +120 -0
- data/maps/odni-prs-Arab-Latn-2015.imp +225 -0
- data/maps/odni-pus-Arab-Latn-2011.imp +327 -0
- data/maps/odni-rus-Cyrl-Latn-2015.imp +79 -0
- data/maps/odni-srp-Cyrl-Latn-2005.imp +35 -0
- data/maps/odni-srp-Cyrl-Latn-2015.imp +130 -0
- data/maps/odni-tat-Cyrl-Latn-2015.imp +157 -0
- data/maps/odni-tgk-Cyrl-Latn-2015.imp +161 -0
- data/maps/odni-tuk-Cyrl-Latn-2015.imp +159 -0
- data/maps/odni-uig-Cyrl-Latn-2015.imp +151 -0
- data/maps/odni-ukr-Cyrl-Latn-2015.imp +136 -0
- data/maps/odni-urd-Arab-Latn-2015.imp +220 -0
- data/maps/odni-uzb-Cyrl-Latn-2015.imp +165 -0
- data/maps/sac-zho-Hans-Latn-1979.imp +20940 -0
- data/maps/sasm-mon-Mong-Latn-general-1978.imp +294 -0
- data/maps/sasm-mon-Mong-Latn-phonetic-1978.imp +261 -0
- data/maps/ses-ara-Arab-Latn-1930.imp +225 -0
- data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.imp +171 -0
- data/maps/ua-ukr-Cyrl-Latn-1996.imp +149 -0
- data/maps/ua-ukr-Cyrl-Latn-2007.imp +69 -0
- data/maps/ua-ukr-Cyrl-Latn-2010.imp +128 -0
- data/maps/un-amh-Ethi-Latn-2016.imp +483 -0
- data/maps/un-ara-Arab-Latn-1971.imp +137 -0
- data/maps/un-ara-Arab-Latn-1972.imp +155 -0
- data/maps/un-ara-Arab-Latn-2017.imp +375 -0
- data/maps/un-asm-Beng-Latn-1972.imp +188 -0
- data/maps/un-bel-Cyrl-Latn-2007.imp +78 -0
- data/maps/un-ben-Beng-Latn-2016.imp +516 -0
- data/maps/un-ell-Grek-Latn-1987-phonetic.imp +437 -0
- data/maps/un-ell-Grek-Latn-1987-tl.imp +27 -0
- data/maps/un-ell-Grek-Latn-1987-ts.imp +269 -0
- data/maps/un-guj-Gujr-Latn-1972.imp +196 -0
- data/maps/un-hin-Deva-Latn-2016.imp +356 -0
- data/maps/un-kan-Kana-Latn-2016.imp +214 -0
- data/maps/un-mal-Mlym-Latn-1972.imp +215 -0
- data/maps/un-mar-Deva-Latn-2016.imp +96 -0
- data/maps/un-mon-Mong-Latn-general-2013.imp +170 -0
- data/maps/un-mon-Mong-Latn-phonetic-2013.imp +170 -0
- data/maps/un-nep-Deva-Latn-1972.imp +295 -0
- data/maps/un-nep-Deva-Latn-2013.imp +62 -0
- data/maps/un-ori-Orya-Latn-1972.imp +208 -0
- data/maps/un-pan-Guru-Latn-1972.imp +321 -0
- data/maps/un-prs-Arab-Latn-1967.imp +214 -0
- data/maps/un-rus-Cyrl-Latn-1987.imp +96 -0
- data/maps/un-sin-Sinh-Latn-1972.imp +193 -0
- data/maps/un-tam-Taml-Latn-1972.imp +173 -0
- data/maps/un-tel-Telu-Latn-1972.imp +229 -0
- data/maps/un-ukr-Cyrl-Latn-1998.imp +58 -0
- data/maps/un-ukr-Cyrl-Latn-2012.imp +95 -0
- data/maps/un-urd-Arab-Latn-1972.imp +290 -0
- data/maps/var-amh-Ethi-Latn-eae-2003.imp +414 -0
- data/maps/var-gez-Ethi-Latn-eae-2003.imp +54 -0
- data/maps/var-hin-Deva-Latn-hunterian-1872.imp +212 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1886.imp +399 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1954.imp +382 -0
- data/maps/var-kor-Hang-Hang-jamo.imp +11196 -0
- data/maps/var-kor-Hang-Latn-mr-1939.imp +574 -0
- data/maps/var-kor-Kore-Hang-2013.imp +59764 -0
- data/maps/var-kor-Kore-Latn-mr-1939.imp +36 -0
- data/maps/var-mar-Deva-Latn-hunterian-1872.imp +39 -0
- data/maps/var-mon-Mong-Latn-1930.imp +101 -0
- data/maps/var-mon-Mong-Latn-lessing.imp +181 -0
- data/maps/var-mon-Mong-Latn-vpmc.imp +182 -0
- data/maps/var-pra-Deva-Latn-iast-1912.imp +36 -0
- data/maps/var-san-Deva-Latn-iast-1912.imp +147 -0
- data/maps/var-zho-Hani-Latn-wd-1979.imp +27549 -0
- metadata +335 -0
@@ -0,0 +1,101 @@
|
|
1
|
+
metadata {
|
2
|
+
authority_id: alalc
|
3
|
+
id: 1997
|
4
|
+
language: iso-639-2:aze
|
5
|
+
source_script: Cyrl
|
6
|
+
destination_script: Latn
|
7
|
+
name: ALA-LC Romanization Table -- Azerbaijani (1997)
|
8
|
+
url: https://transliteration.eki.ee/pdf/Azerbaijani.pdf
|
9
|
+
creation_date: 1997
|
10
|
+
description: |
|
11
|
+
ALA-LC Romanization Tables: Transliteration Schemes for Non-Roman Scripts. Randal K. Berry (ed.). Library of Congress, 1997.
|
12
|
+
|
13
|
+
notes:
|
14
|
+
- "Ј ј replaced Й й in 1959 (Roman: y; ISO 9: j; ALA-LC: ĭ)."
|
15
|
+
}
|
16
|
+
|
17
|
+
tests {
|
18
|
+
# from internet
|
19
|
+
test "Азәрбајҹан дили", "Azărbaı̐jan dili"
|
20
|
+
test "Бүтүн инсанлар ләјагәт вә һүгугларына ҝөрә азад вә бәрабәр доғулурлар.\nОнларын шүурлары вә виҹданлары вар вә бир-бирләринә мүнасибәтдә гардашлыг руһунда давранмалыдырлар.", "Bu̇tu̇n insanlar lăı̐agăt vă ḣu̇guglaryna ġȯră azad vă bărabăr doghulurlar.\nOnlaryn shu̇urlary vă vijdanlary var vă bir-birlărină mu̇nasibătdă gardashlyg ruḣunda davranmalydyrlar."
|
21
|
+
test "Азәрбајҹан! Азәрбајҹан!\nЕј гәһрәман өвладын шанлы Вәтәни!\nСәндән өтрү ҹан вермәјә ҹүмлә һазырыз!\nСәндән өтрү ган төкмәјә ҹүмлә гадириз!\nҮчрәнҝли бајрағынла мәсуд јаша!\nҮчрәнҝли бајрағынла мәсуд јаша!\nМинләрлә ҹан гурбан олду,\nСинән һәрбә мејдан олду!\nҺүгугундан кечән әсҝәр,\nҺәрә бир гәһрәман олду!\nСән оласан ҝүлүстан,\nСәнә һәр ан ҹан гурбан!\nСәнә мин бир мәһәббәт\nСинәмдә тутмуш мәкан!\nНамусуну һифз етмәјә,\nБајрағыны јүксәлтмәјә\nНамусуну һифз етмәјә,\nҸүмлә ҝәнҹләр мүштагдыр!\nШанлы Вәтән! Шанлы Вәтән!\nАзәрбајҹан! Азәрбајҹан!\nАзәрбајҹан! Азәрбајҹан!", "Azărbaı̐jan! Azărbaı̐jan!\nEı̐ găḣrăman ȯvladyn shanly Vătăni!\nSăndăn ȯtru̇ jan vermăı̐ă ju̇mlă ḣazyryz!\nSăndăn ȯtru̇ gan tȯkmăı̐ă ju̇mlă gadiriz!\nU̇chrănġli baı̐raghynla măsud ı̐asha!\nU̇chrănġli baı̐raghynla măsud ı̐asha!\nMinlărlă jan gurban oldu,\nSinăn ḣărbă meı̐dan oldu!\nḢu̇gugundan kechăn ăsġăr,\nḢără bir găḣrăman oldu!\nSăn olasan ġu̇lu̇stan,\nSănă ḣăr an jan gurban!\nSănă min bir măḣăbbăt\nSinămdă tutmush măkan!\nNamusunu ḣifz etmăı̐ă,\nBaı̐raghyny ı̐u̇ksăltmăı̐ă\nNamusunu ḣifz etmăı̐ă,\nJu̇mlă ġănjlăr mu̇shtagdyr!\nShanly Vătăn! Shanly Vătăn!\nAzărbaı̐jan! Azărbaı̐jan!\nAzărbaı̐jan! Azărbaı̐jan!"
|
22
|
+
}
|
23
|
+
|
24
|
+
stage {
|
25
|
+
|
26
|
+
# CHARACTERS
|
27
|
+
parallel {
|
28
|
+
sub "\u0410", "A" # А
|
29
|
+
sub "\u0411", "B" # Б
|
30
|
+
sub "\u0412", "V" # В
|
31
|
+
sub "\u0413", "G" # Г
|
32
|
+
sub "\u0492", "Gh" # Ғ
|
33
|
+
sub "\u0414", "D" # Д
|
34
|
+
sub "\u0415", "E" # Е
|
35
|
+
sub "\u04D8", "Ă" # Ә
|
36
|
+
sub "\u0416", "Zh" # Ж
|
37
|
+
sub "\u0417", "Z" # З
|
38
|
+
sub "\u0418", "I" # И
|
39
|
+
sub "\u042B", "Y" # Ы
|
40
|
+
sub "\u0408", "I̐" # Ј
|
41
|
+
sub "\u0419", "Y" # Й note[1]
|
42
|
+
sub "\u0419", "Y" # Й
|
43
|
+
sub "\u041A", "K" # К
|
44
|
+
sub "\u049C", "Ġ" # Ҝ
|
45
|
+
sub "\u041B", "L" # Л
|
46
|
+
sub "\u041C", "M" # М
|
47
|
+
sub "\u041D", "N" # Н
|
48
|
+
sub "\u041E", "O" # О
|
49
|
+
sub "\u04E8", "Ȯ" # Ө
|
50
|
+
sub "\u041F", "P" # П
|
51
|
+
sub "\u0420", "R" # Р
|
52
|
+
sub "\u0421", "S" # С
|
53
|
+
sub "\u0422", "T" # Т
|
54
|
+
sub "\u0423", "U" # У
|
55
|
+
sub "\u04AE", "U̇" # Ү
|
56
|
+
sub "\u0424", "F" # Ф
|
57
|
+
sub "\u0425", "Kh" # Х
|
58
|
+
sub "\u04BA", "Ḣ" # Һ
|
59
|
+
sub "\u0427", "Ch" # Ч
|
60
|
+
sub "\u04B8", "J" # Ҹ
|
61
|
+
sub "\u0428", "Sh" # Ш
|
62
|
+
|
63
|
+
sub "\u0430", "a" # а
|
64
|
+
sub "\u0431", "b" # б
|
65
|
+
sub "\u0432", "v" # в
|
66
|
+
sub "\u0433", "g" # г
|
67
|
+
sub "\u0493", "gh" # ғ
|
68
|
+
sub "\u0434", "d" # д
|
69
|
+
sub "\u0435", "e" # e
|
70
|
+
sub "\u04D9", "ă" # ә
|
71
|
+
sub "\u0436", "zh" # ж
|
72
|
+
sub "\u0437", "z" # з
|
73
|
+
sub "\u0438", "i" # и
|
74
|
+
sub "\u044B", "y" # ы
|
75
|
+
sub "\u0458", "ı̐" # ј
|
76
|
+
sub "\u0439", "y" # й note[1]
|
77
|
+
sub "\u043A", "k" # к
|
78
|
+
sub "\u049D", "ġ" # ҝ
|
79
|
+
sub "\u043B", "l" # л
|
80
|
+
sub "\u043C", "m" # м
|
81
|
+
sub "\u043D", "n" # н
|
82
|
+
sub "\u043E", "o" # о
|
83
|
+
sub "\u04E9", "ȯ" # ө
|
84
|
+
sub "\u043F", "p" # п
|
85
|
+
sub "\u0440", "r" # р
|
86
|
+
sub "\u0441", "s" # с
|
87
|
+
sub "\u0442", "t" # т
|
88
|
+
sub "\u0443", "u" # у
|
89
|
+
sub "\u04AF", "u̇" # ү
|
90
|
+
sub "\u0444", "f" # ф
|
91
|
+
sub "\u0445", "kh" # х
|
92
|
+
sub "\u04BB", "ḣ" # һ
|
93
|
+
sub "\u0447", "ch" # ч
|
94
|
+
sub "\u04B9", "j" # ҹ
|
95
|
+
sub "\u0448", "sh" # ш
|
96
|
+
|
97
|
+
sub "\u2019", "\u2019"
|
98
|
+
}
|
99
|
+
|
100
|
+
compose
|
101
|
+
}
|
@@ -0,0 +1,118 @@
|
|
1
|
+
metadata {
|
2
|
+
authority_id: alalc
|
3
|
+
id: 1997
|
4
|
+
language: iso-639-2:bel
|
5
|
+
source_script: Cyrl
|
6
|
+
destination_script: Latn
|
7
|
+
name: ALA-LC Romanization Table -- Byelorussian (1997)
|
8
|
+
url: http://catdir.loc.gov/catdir/cpso/romanization/beloruss.pdf
|
9
|
+
creation_date: 1997
|
10
|
+
|
11
|
+
notes:
|
12
|
+
- Ґ letter found in Old Belarusian and in modern publications in Tarashkevitsa orthography.
|
13
|
+
- Do not confuse with the digraph кг (also romanized as “kh”). Manual review may be needed when transcribing data in vernacular characters in order to distinguish х from кг.
|
14
|
+
- The apostrophe (´) is not transliterated.
|
15
|
+
- Soft sign (prime) is USMARC hexadecimal code A7 ~ U+02B9 Unicode character
|
16
|
+
}
|
17
|
+
|
18
|
+
tests {
|
19
|
+
# https://en.wikipedia.org/wiki/Romanization_of_Belarusian#Examples
|
20
|
+
# https://img.tyt.by/n/02/d/belorusskiy_translit.jpg - with issues
|
21
|
+
test "Беларусь", "Belarusʹ"
|
22
|
+
test "Магілёў", "Mahili͡oŭ"
|
23
|
+
test "Лукашэнка", "Lukashėnka"
|
24
|
+
test "сям´я", "si͡ami͡a"
|
25
|
+
test "Уручча", "Uruchcha"
|
26
|
+
test "Барысаўскі тракт", "Barysaŭski trakt"
|
27
|
+
test "Усход", "Uskhod"
|
28
|
+
test "Маскоўская", "Maskoŭskai͡a"
|
29
|
+
test "Парк Чалюскінцаў", "Park Chali͡uskintsaŭ"
|
30
|
+
test "Акадэмія навук", "Akadėmii͡a navuk"
|
31
|
+
test "Плошча Якуба Коласа", "Ploshcha I͡Akuba Kolasa"
|
32
|
+
test "Плошча Перамогі", "Ploshcha Peramohi"
|
33
|
+
test "Кастрычніцкая", "Kastrychnitskai͡a"
|
34
|
+
test "Плошча Леніна", "Ploshcha Lenina"
|
35
|
+
test "Інстытут Культуры", "Instytut Kulʹtury"
|
36
|
+
}
|
37
|
+
|
38
|
+
stage {
|
39
|
+
|
40
|
+
# CHARACTERS
|
41
|
+
parallel {
|
42
|
+
# Apostrophes
|
43
|
+
sub "\u00B4", "" # official english Apostrophe
|
44
|
+
sub "\u02BC", ""
|
45
|
+
sub "\u0027", "" # from Belarusian keyboard
|
46
|
+
|
47
|
+
# Characters
|
48
|
+
sub "\u0410", "A" # A
|
49
|
+
sub "\u0411", "B" # Б
|
50
|
+
sub "\u0412", "V" # B
|
51
|
+
sub "\u0413", "H" # Г
|
52
|
+
sub "\u0490", "G" # Ґ
|
53
|
+
sub "\u0414", "D" # Д
|
54
|
+
sub "\u0415", "E" # Е
|
55
|
+
sub "\u0401", "I͡O" # Ё : I͡O
|
56
|
+
sub "\u0416", "Z͡H" # Ж : Z͡H
|
57
|
+
sub "\u0417", "Z" # З
|
58
|
+
sub "\u0406", "I" # І
|
59
|
+
sub "\u0419", "Ĭ" # Й : Ĭ
|
60
|
+
sub "\u041A", "K" # К
|
61
|
+
sub "\u041B", "L" # Л
|
62
|
+
sub "\u041C", "M" # М
|
63
|
+
sub "\u041D", "N" # Н
|
64
|
+
sub "\u041E", "O" # О
|
65
|
+
sub "\u041F", "P" # П
|
66
|
+
sub "\u0420", "R" # Р
|
67
|
+
sub "\u0421", "S" # С
|
68
|
+
sub "\u0422", "T" # Т
|
69
|
+
sub "\u0423", "U" # У
|
70
|
+
sub "\u040E", "Ŭ" # Ў : Ŭ
|
71
|
+
sub "\u0424", "F" # Ф
|
72
|
+
sub "\u0425", "Kh" # Х
|
73
|
+
sub "\u0426", "Ts" # Ц
|
74
|
+
sub "\u0427", "Ch" # Ч
|
75
|
+
sub "\u0428", "Sh" # Ш
|
76
|
+
sub "\u042B", "Y" # Ы
|
77
|
+
sub "\u042C", "ʹ" # Ь : ʹ
|
78
|
+
sub "\u042D", "Ė" # Э : Ė
|
79
|
+
sub "\u042E", "I͡U" # Ю : I͡U
|
80
|
+
sub "\u042F", "I͡A" # Я : I͡A
|
81
|
+
|
82
|
+
sub "\u0430", "a" # а
|
83
|
+
sub "\u0431", "b" # б
|
84
|
+
sub "\u0432", "v" # в
|
85
|
+
sub "\u0433", "h" # г
|
86
|
+
sub "\u0491", "g" # ґ
|
87
|
+
sub "\u0434", "d" # д
|
88
|
+
sub "\u0435", "e" # е
|
89
|
+
sub "\u0451", "i͡o" # ё : i͡o
|
90
|
+
sub "\u0436", "z͡h" # ж : z͡h
|
91
|
+
sub "\u0437", "z" # з
|
92
|
+
sub "\u0456", "i" # і
|
93
|
+
sub "\u0439", "ĭ" # й : ĭ
|
94
|
+
sub "\u043A", "k" # к
|
95
|
+
sub "\u043B", "l" # л
|
96
|
+
sub "\u043C", "m" # м
|
97
|
+
sub "\u043D", "n" # н
|
98
|
+
sub "\u043E", "o" # о
|
99
|
+
sub "\u043F", "p" # п
|
100
|
+
sub "\u0440", "r" # р
|
101
|
+
sub "\u0441", "s" # с
|
102
|
+
sub "\u0442", "t" # т
|
103
|
+
sub "\u0443", "u" # у
|
104
|
+
sub "\u045E", "ŭ" # ў : ŭ
|
105
|
+
sub "\u0444", "f" # ф
|
106
|
+
sub "\u0445", "kh" # х
|
107
|
+
sub "\u0446", "ts" # ц
|
108
|
+
sub "\u0447", "ch" # ч
|
109
|
+
sub "\u0448", "sh" # ш
|
110
|
+
sub "\u044B", "y" # ы
|
111
|
+
sub "\u044C", "ʹ" # ь : ʹ
|
112
|
+
sub "\u044D", "ė" # э : ė
|
113
|
+
sub "\u044E", "i͡u" # ю : i͡u
|
114
|
+
sub "\u044F", "i͡a" # я : i͡a
|
115
|
+
}
|
116
|
+
|
117
|
+
}
|
118
|
+
|
@@ -0,0 +1,225 @@
|
|
1
|
+
metadata {
|
2
|
+
authority_id: alalc
|
3
|
+
id: 1997
|
4
|
+
language: iso-639-2:ben
|
5
|
+
source_script: Beng
|
6
|
+
destination_script: Latn
|
7
|
+
name: Bengali Romanization, 1997
|
8
|
+
url: http://catdir.loc.gov/catdir/cpso/romanization/bengali.pdf
|
9
|
+
creation_date: 1997
|
10
|
+
description: |
|
11
|
+
ALA-LC Romanization table for Bengali
|
12
|
+
|
13
|
+
notes:
|
14
|
+
|
15
|
+
- Only the vowel forms that appear at the beginning of a syllable are
|
16
|
+
listed; the forms used for vowels following a consonant can be found in
|
17
|
+
grammars; no distinction between the two is made in transliteration.
|
18
|
+
|
19
|
+
- |
|
20
|
+
The vowel a is implicit after all consonants and consonant clusters
|
21
|
+
and is supplied in transliteration, with the following exceptions:
|
22
|
+
|
23
|
+
a) when another vowel is indicated by its appropriate sign; and
|
24
|
+
b) when the absence of any vowel is indicated by the subscript symbol ( ্ )
|
25
|
+
called hasanta or birāma.
|
26
|
+
|
27
|
+
- ব is used both as a labial and as a semivowel. When it occurs as the
|
28
|
+
second or subsequent consonant of a consonant cluster, it is
|
29
|
+
transliterated va. When ব is doubled, it is transliterated bba.
|
30
|
+
|
31
|
+
- Candrabindu before guttural, palatal, cerebral, and dental occlusives
|
32
|
+
is transliterated n̐. Before labials, sibilants, semivowels, the
|
33
|
+
aspirate, vowels, and in final position it is transliterated m̐.
|
34
|
+
|
35
|
+
- When doubled, abagraha is transliterated by two apostrophes ( ’’ ).
|
36
|
+
}
|
37
|
+
|
38
|
+
tests {
|
39
|
+
test "আমার সোনার বাংলা, আমি তোমায় ভালোবাসি।\nচিরদিন তোমার আকাশ, তোমার বাতাস, আমার প্রাণে বাজায় বাঁশি॥\nও মা, ফাগুনে তোর আমের বনে ঘ্রাণে পাগল করে, মরি হায়, হায় রে—\nও মা, অঘ্রাণে তোর ভরা ক্ষেতে আমি কী দেখেছি মধুর হাসি॥\n\nকী শোভা, কী ছায়া গো, কী স্নেহ, কী মায়া গো—\nকী আঁচল বিছায়েছ বটের মূলে, নদীর কূলে কূলে।\nমা, তোর মুখের বাণী আমার কানে লাগে সুধার মতো,\nমরি হায়, হায় রে—\nমা, তোর বদনখানি মলিন হলে, ও মা, আমি নয়নজলে ভাসি॥", "āmāra sonāra bāṃlā, āmi tomāẏa bhālobāsi।\nciradina tomāra ākāśa, tomāra bātāsa, āmāra prāṇe bājāẏa bān̐śi॥\no mā, phāgune tora āmera bane ghrāṇe pāgala kare, mari hāẏa, hāẏa re—\no mā, aghrāṇe tora bharā kshete āmi kī dekhechi madhura hāsi॥\n\nkī śobhā, kī chāyaṛā go, kī sneha, kī māyaṛā go—\nkī ām̐cala bichāyaṛecha baṭera mūle, nadīra kūle kūle।\nmā, tora mukhera bāṇī āmāra kāne lāge sudhāra mato,\nmari hāẏa, hāẏa re—\nmā, tora badanakhāni malina hale, o mā, āmi naẏanajale bhāsi॥"
|
40
|
+
test "ট্রাম্প-বাইডেন মহারণ: জয় দাবি দুজনেরই", "ṭrāmpa-bāiḍena mahāraṇa: jaẏa dābi dujanerai"
|
41
|
+
test "রিপাবলিকান গভর্নর ডগ ডসি বলেছেন, ফলাফল নিয়ে এখনই কথা বলার সময় আসেনি।", "ripābalikāna gabharnara ḍaga ḍasi balechena, phalāphala niẏe ekhanai kathā balāra samaẏa āseni।"
|
42
|
+
test "অনেক আগে থেকেই ট্রাম্প ফ্লোরিডায় জিতে গেছেন বলে গণমাধ্যমগুলোতে তুলে ধরা হচ্ছে", "aneka āge thekei ṭrāmpa phloriḍāẏa jite gechena bale gaṇamādhyamagulote tule dharā hacche"
|
43
|
+
test "করোনায় আরও ২১ মৃত্যু, নতুন শনাক্ত ১৫১৭", "karonāẏa ārao 21 mṛtyu, natuna śanākta 1517"
|
44
|
+
test "শালিক পাখিকে পোষ মানানোর মতো কঠিন কাজ করা কিশোর রোহানের বাড়ি কুষ্টিয়া শহরের পিটিআই সড়কে।", "śālika pākhike posha mānānora mato kaṭhina kāja karā kiśora rohānera bāṛi kushṭiẏā śaharera piṭiāi saṛake।"
|
45
|
+
test "সুইং স্টেটের সর্বশেষ অবস্থা দেখে মনে হচ্ছে, দুজনের ভাগ্য দুলছে পেন্ডুলামে।", "suiṃ sṭeṭera sarbaśesha abasthā dekhe mane hacche, dujanera bhāgya dulache penḍulāme।"
|
46
|
+
test "২০১৬ সালের নির্বাচনে বহিরাগত হিসেবেই ডোনাল্ড ট্রাম্পের রাজনীতিতে আগমন", "2016 sālera nirbācane bahirāgata hisebei ḍonālḍa ṭrāmpera rājanītite āgamana"
|
47
|
+
test "কই সঙ্গে রাজনীতির পাদপ্রদীপ থেকে সম্পূর্ণ বাইরে থাকা তাঁর পরিবারও চলে আসে রাজনীতির আলোচনায়", "kai saṅge rājanītira pādapradīpa theke sampūrṇa bāire thākā tān̐ra paribārao cale āse rājanītira ālocanāẏa"
|
48
|
+
test "নির্বাচনী প্রচারের সময় প্রেসিডেন্ট ডোনাল্ড ট্রাম্পের পরিবারের সদস্যরা মাঠে নেমেছেন", "nirbācanī pracārera samaẏa presiḍenṭa ḍonālḍa ṭrāmpera paribārera sadasyarā māṭhe nemechena"
|
49
|
+
test "তাঁরা সমর্থকদের উদ্দেশ্যে বলেছেন, এ নির্বাচন শুধু প্রেসিডেন্ট ডোনাল্ড ট্রাম্পের প্রতি নয়", "tān̐rā samarthakadera uddeśye balechena, e nirbācana śudhu presiḍenṭa ḍonālḍa ṭrāmpera prati naẏa"
|
50
|
+
test "স্মার্টফোন কিনতে ৮ হাজার করে ঋণ পাবেন ৪১৫০১ শিক্ষার্থী", "smārṭaphona kinate 8 hājāra kare ṛṇa pābena 41501 śikshārthī"
|
51
|
+
test "বার্সা সমর্থকদের নিয়ে উদ্যাপনের কথা গিলতে হলো ভিদালকে", "bārsā samarthakadera niẏe udyāpanera kathā gilate halo bhidālake"
|
52
|
+
test "য়ে", "yaṛe"
|
53
|
+
}
|
54
|
+
|
55
|
+
aliases {
|
56
|
+
# A different name for this alias can be more fitting...
|
57
|
+
def_alias ben_special, any("\u09be\u09bf\u09c0\u09c1\u09c2\u09c3\u09c7\u09c8\u09cb\u09cc\u09cd")
|
58
|
+
}
|
59
|
+
|
60
|
+
stage {
|
61
|
+
# RULES
|
62
|
+
#rule II
|
63
|
+
sub "ক", "k", after: ben_special
|
64
|
+
sub "খ", "kh", after: ben_special
|
65
|
+
sub "গ", "g", after: ben_special
|
66
|
+
sub "ঘ", "gh", after: ben_special
|
67
|
+
sub "ঙ", "ṅ", after: ben_special
|
68
|
+
sub "চ", "c", after: ben_special
|
69
|
+
sub "ছ", "ch", after: ben_special
|
70
|
+
sub "জ", "j", after: ben_special
|
71
|
+
sub "ঝ", "jh", after: ben_special
|
72
|
+
sub "ঞ", "ñ", after: ben_special
|
73
|
+
sub "ট", "ṭ", after: ben_special
|
74
|
+
sub "ঠ", "ṭh", after: ben_special
|
75
|
+
sub "ড", "ḍ", after: ben_special
|
76
|
+
sub "ড়", "ṛ", after: ben_special
|
77
|
+
sub any("ড়"), "ṛ", after: ben_special # 2 combining characters, why we need any()? - weird
|
78
|
+
sub "ঢ", "ḍh", after: ben_special
|
79
|
+
sub "ঢ়", "ṛh", after: ben_special # 2 combining characters, was any()
|
80
|
+
sub "ণ", "ṇ", after: ben_special
|
81
|
+
sub "ত", "t", after: ben_special
|
82
|
+
sub "ৎ", "ṯ", after: ben_special
|
83
|
+
sub "থ", "th", after: ben_special
|
84
|
+
sub "দ", "d", after: ben_special
|
85
|
+
sub "ধ", "dh", after: ben_special
|
86
|
+
sub "ন", "n", after: ben_special
|
87
|
+
sub "প", "p", after: ben_special
|
88
|
+
sub "ফ", "ph", after: ben_special
|
89
|
+
sub "ব", "b", after: ben_special
|
90
|
+
sub "ভ", "bh", after: ben_special
|
91
|
+
sub "ম", "m", after: ben_special
|
92
|
+
sub "য", "y", after: ben_special
|
93
|
+
sub "য়", "ẏ", after: ben_special # 2 combining characters
|
94
|
+
sub "য়", "ẏ", after: ben_special # But this was any() in the previous version
|
95
|
+
sub "র", "r", after: ben_special
|
96
|
+
sub "ল", "l", after: ben_special
|
97
|
+
sub "শ", "ś", after: ben_special
|
98
|
+
sub "ষ", "sh", after: ben_special
|
99
|
+
sub "স", "s", after: ben_special
|
100
|
+
sub "হ", "h", after: ben_special
|
101
|
+
|
102
|
+
# Rule III
|
103
|
+
sub "ବ", "bba", after: "\u09AC"
|
104
|
+
# Rule V
|
105
|
+
sub "\u0981", "m̐", after: any("কখগঘঙচছজঝঞটঠডডঢঢণতৎথদধন")
|
106
|
+
sub "\u0981", "m̐", after: boundary
|
107
|
+
|
108
|
+
|
109
|
+
# CHARACTERS
|
110
|
+
parallel {
|
111
|
+
|
112
|
+
# Vowels and Diphthongs
|
113
|
+
|
114
|
+
sub "অ", "a"
|
115
|
+
sub "আ", "ā"
|
116
|
+
sub "ই", "i"
|
117
|
+
sub "ঈ", "ī"
|
118
|
+
sub "উ", "u"
|
119
|
+
sub "ঊ", "ū"
|
120
|
+
sub "এ", "e"
|
121
|
+
sub "ঐ", "ai"
|
122
|
+
sub "ও", "o"
|
123
|
+
sub "ঔ", "au"
|
124
|
+
sub "ঋ", "ṛ"
|
125
|
+
sub "ৠ", "ṝ"
|
126
|
+
sub "ঌ", "ḹ"
|
127
|
+
|
128
|
+
# Consonants
|
129
|
+
# Gutturals
|
130
|
+
sub "ক", "ka"
|
131
|
+
sub "খ", "kha"
|
132
|
+
sub "গ", "ga"
|
133
|
+
sub "ঘ", "gha"
|
134
|
+
sub "ঙ", "ṅa"
|
135
|
+
|
136
|
+
# Palatals
|
137
|
+
sub "চ", "ca"
|
138
|
+
sub "ছ", "cha"
|
139
|
+
sub "জ", "ja"
|
140
|
+
sub "ঝ", "jha"
|
141
|
+
sub "ঞ", "ña"
|
142
|
+
|
143
|
+
# Cerebrals
|
144
|
+
sub "ট", "ṭa"
|
145
|
+
sub "ঠ", "ṭha"
|
146
|
+
sub "ড", "ḍa"
|
147
|
+
sub "ড়", "ṛa"
|
148
|
+
sub "ড়", "ṛa"
|
149
|
+
sub "ঢ", "ḍha"
|
150
|
+
sub "ঢ়", "ṛha"
|
151
|
+
sub "ণ", "ṇa"
|
152
|
+
|
153
|
+
# Dentals
|
154
|
+
sub "ত", "ta"
|
155
|
+
sub "ৎ", "ṯa"
|
156
|
+
sub "থ", "tha"
|
157
|
+
sub "দ", "da"
|
158
|
+
sub "ধ", "dha"
|
159
|
+
sub "ন", "na"
|
160
|
+
|
161
|
+
# Labials
|
162
|
+
sub "প", "pa"
|
163
|
+
sub "ফ", "pha"
|
164
|
+
sub "ব", "ba" # see Note 3
|
165
|
+
sub "ভ", "bha"
|
166
|
+
sub "ম", "ma"
|
167
|
+
|
168
|
+
# Semivowels
|
169
|
+
sub "য", "ya"
|
170
|
+
sub "য়", "ẏa"
|
171
|
+
sub "য়", "ẏa"
|
172
|
+
sub "র", "ra"
|
173
|
+
sub "ল", "la"
|
174
|
+
|
175
|
+
# Sibilants
|
176
|
+
sub "শ", "śa"
|
177
|
+
sub "ষ", "sha"
|
178
|
+
sub "স", "sa"
|
179
|
+
|
180
|
+
# Aspirate
|
181
|
+
sub "হ", "ha"
|
182
|
+
|
183
|
+
# Anusvāra
|
184
|
+
sub "ং", "ṃ"
|
185
|
+
|
186
|
+
# Bisarga
|
187
|
+
sub "ঃ", "ḥ"
|
188
|
+
|
189
|
+
# Candrabindu (anunāsika)
|
190
|
+
sub "\u0981", "n̐"
|
191
|
+
|
192
|
+
# Abagraha (see Note 5)
|
193
|
+
sub "ঽ", "’" # (apostrophe)
|
194
|
+
|
195
|
+
|
196
|
+
# Medials # Needed for connecting consonants
|
197
|
+
|
198
|
+
sub "\u09be", "ā"
|
199
|
+
sub "\u09bf", "i"
|
200
|
+
sub "\u09c0", "ī"
|
201
|
+
sub "\u09c1", "u"
|
202
|
+
sub "\u09c2", "ū"
|
203
|
+
sub "\u09c3", "ṛ"
|
204
|
+
sub "\u09c7", "e"
|
205
|
+
sub "\u09c8", "ai"
|
206
|
+
sub "\u09cb", "o"
|
207
|
+
sub "\u09cc", "au"
|
208
|
+
sub "\u09cd", ""
|
209
|
+
|
210
|
+
# Numbers
|
211
|
+
|
212
|
+
sub "০", "0"
|
213
|
+
sub "১", "1"
|
214
|
+
sub "২", "2"
|
215
|
+
sub "৩", "3"
|
216
|
+
sub "৪", "4"
|
217
|
+
sub "৫", "5"
|
218
|
+
sub "৬", "6"
|
219
|
+
sub "৭", "7"
|
220
|
+
sub "৮", "8"
|
221
|
+
sub "৯", "9"
|
222
|
+
}
|
223
|
+
|
224
|
+
compose
|
225
|
+
}
|
@@ -0,0 +1,135 @@
|
|
1
|
+
metadata {
|
2
|
+
authority_id: alalc
|
3
|
+
id: 2017
|
4
|
+
language: iso-639-2:ben
|
5
|
+
source_script: Beng
|
6
|
+
destination_script: Latn
|
7
|
+
name: Bengali Romanization, 2017
|
8
|
+
url: https://www.loc.gov/catdir/cpso/romanization/bengali.pdf
|
9
|
+
creation_date: 2017
|
10
|
+
description: |
|
11
|
+
ALA-LC Romanization table for Bengali
|
12
|
+
|
13
|
+
notes:
|
14
|
+
|
15
|
+
- Only the vowel forms that appear at the beginning of a syllable are
|
16
|
+
listed; the forms used for vowels following a consonant can be found in
|
17
|
+
grammars; no distinction between the two is made in transliteration.
|
18
|
+
|
19
|
+
- |
|
20
|
+
The vowel a is implicit after all consonants and consonant clusters
|
21
|
+
and is supplied in transliteration, with the following exceptions:
|
22
|
+
|
23
|
+
a) when another vowel is indicated by its appropriate sign; and
|
24
|
+
b) when the absence of any vowel is indicated by the subscript symbol ( ্ )
|
25
|
+
called hasanta or birāma.
|
26
|
+
|
27
|
+
- ব is used both as a labial and as a semivowel. When it occurs as the
|
28
|
+
second or subsequent consonant of a consonant cluster, it is
|
29
|
+
transliterated va. When ব is doubled, it is transliterated bba.
|
30
|
+
|
31
|
+
- Candrabindu before guttural, palatal, cerebral, and dental occlusives
|
32
|
+
is transliterated n̐. Before labials, sibilants, semivowels, the
|
33
|
+
aspirate, vowels, and in final position it is transliterated m̐.
|
34
|
+
|
35
|
+
- When doubled, abagraha is transliterated by two apostrophes ( ’’ ).
|
36
|
+
}
|
37
|
+
|
38
|
+
tests {
|
39
|
+
test "র্ক", "rka"
|
40
|
+
test "গ্র", "gra"
|
41
|
+
test "ত্য", "tya"
|
42
|
+
}
|
43
|
+
|
44
|
+
dependency "un-ben-Beng-Latn-2016", as: benglatn
|
45
|
+
|
46
|
+
|
47
|
+
stage {
|
48
|
+
run map.benglatn.stage.main
|
49
|
+
|
50
|
+
# CHARACTERS
|
51
|
+
parallel {
|
52
|
+
|
53
|
+
# I. Vowels and Diphthongs (see Note 1)
|
54
|
+
|
55
|
+
sub "অ", "a"
|
56
|
+
sub "ৠ", "ṝ"
|
57
|
+
sub "আ", "ā"
|
58
|
+
sub "ঌ", "ḹ"
|
59
|
+
sub "ই", "i"
|
60
|
+
sub "এ", "e"
|
61
|
+
sub "ঈ", "ī"
|
62
|
+
sub "ঐ", "ai"
|
63
|
+
sub "উ", "u"
|
64
|
+
sub "ও", "o"
|
65
|
+
sub "ঊ", "ū"
|
66
|
+
sub "ঔ", "au"
|
67
|
+
sub "ঋ", "ṛ"
|
68
|
+
|
69
|
+
# II. Consonants (see Note 2)
|
70
|
+
# Gutturals
|
71
|
+
sub "ক", "ka"
|
72
|
+
sub "খ", "kha"
|
73
|
+
sub "গ", "ga"
|
74
|
+
sub "ঘ", "gha"
|
75
|
+
sub "ঙ", "ṅa"
|
76
|
+
|
77
|
+
# Palatals
|
78
|
+
sub "চ", "ca"
|
79
|
+
sub "ছ", "cha"
|
80
|
+
sub "জ", "ja"
|
81
|
+
sub "ঝ", "jha"
|
82
|
+
sub "ঞ", "ña"
|
83
|
+
|
84
|
+
# Cerebrals
|
85
|
+
sub "ট", "ṭa"
|
86
|
+
sub "ঠ", "ṭha"
|
87
|
+
sub "ড", "ḍa"
|
88
|
+
sub "ড়", "ṛa"
|
89
|
+
sub "ঢ", "ḍha"
|
90
|
+
sub "ঢ়", "ṛha"
|
91
|
+
sub "ণ", "ṇa"
|
92
|
+
|
93
|
+
# Dentals
|
94
|
+
sub "ত", "ta"
|
95
|
+
sub "ৎ", "t"
|
96
|
+
sub "থ", "tha"
|
97
|
+
sub "দ", "da"
|
98
|
+
sub "ধ", "dha"
|
99
|
+
sub "ন", "na"
|
100
|
+
|
101
|
+
# Labials
|
102
|
+
sub "প", "pa"
|
103
|
+
sub "ফ", "pha"
|
104
|
+
sub "ব", "ba" # see Note 3
|
105
|
+
sub "ভ", "bha"
|
106
|
+
sub "ম", "ma"
|
107
|
+
|
108
|
+
# Semivowels
|
109
|
+
sub "য", "ya"
|
110
|
+
sub "য়", "ẏa"
|
111
|
+
sub "র", "ra"
|
112
|
+
sub "ল", "la"
|
113
|
+
sub "ব", "ba" # see Note 3
|
114
|
+
|
115
|
+
# Sibilants
|
116
|
+
sub "শ", "śa"
|
117
|
+
sub "ষ", "sha"
|
118
|
+
sub "স", "sa"
|
119
|
+
|
120
|
+
# Aspirate
|
121
|
+
sub "হ", "ha"
|
122
|
+
|
123
|
+
# Anusvāra
|
124
|
+
sub "ং", "ṃ"
|
125
|
+
|
126
|
+
# Bisarga
|
127
|
+
sub "ঃ", "ḥ"
|
128
|
+
|
129
|
+
# Candrabindu (anunāsika) see note 4
|
130
|
+
sub "\u0981", "n̐" # ঁ : n̐, m̐
|
131
|
+
|
132
|
+
# Abagraha (see Note 5)
|
133
|
+
sub "\u09bd", "’" # ঽ Bengali abagraha, U+09BD (apostrophe)
|
134
|
+
}
|
135
|
+
}
|