interscript 0.1.3 → 0.1.9
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/README.adoc +10 -11
- data/aliases.json +1 -0
- data/lib/interscript.rb +62 -59
- data/lib/interscript/command.rb +3 -2
- data/lib/interscript/fs.rb +96 -0
- data/lib/interscript/mapping.rb +36 -17
- data/lib/interscript/opal.rb +196 -0
- data/lib/interscript/opal/entrypoint.rb +20 -0
- data/lib/interscript/opal/exports.rb +11 -0
- data/lib/interscript/opal/maps.js.erb +8 -0
- data/lib/interscript/version.rb +1 -1
- data/maps/acadsin-zho-Hani-Latn-2002.yaml +6 -2
- data/maps/alalc-amh-Ethi-Latn-1997.yaml +513 -0
- data/maps/alalc-amh-Ethi-Latn-2011.yaml +138 -0
- data/maps/alalc-ara-Arab-Latn-1997.yaml +1287 -0
- data/maps/alalc-asm-Deva-Latn-1997.yaml +259 -0
- data/maps/alalc-asm-Deva-Latn-2012.yaml +55 -0
- data/maps/alalc-aze-Arab-Latn-1997.yaml +376 -0
- data/maps/alalc-aze-Cyrl-Latn-1997.yaml +145 -0
- data/maps/{alalc-bel-cyrl-latn-1997.yaml → alalc-bel-Cyrl-Latn-1997.yaml} +7 -3
- data/maps/alalc-ben-Beng-Latn-1997.yaml +291 -0
- data/maps/alalc-ben-Beng-Latn-2017.yaml +1 -1
- data/maps/alalc-bul-Cyrl-Latn-1997.yaml +5 -1
- data/maps/alalc-div-Thaa-Latn-1997.yaml +211 -0
- data/maps/alalc-ell-Grek-Latn-1997.yaml +7 -4
- data/maps/alalc-ell-Grek-Latn-2010.yaml +3 -5
- data/maps/alalc-guj-Gujr-Latn-1997.yaml +266 -0
- data/maps/alalc-guj-Gujr-Latn-2011.yaml +64 -0
- data/maps/alalc-hin-Deva-Latn-1997.yaml +303 -0
- data/maps/alalc-hin-Deva-Latn-2011.yaml +65 -0
- data/maps/alalc-kan-Kana-Latn-1997.yaml +274 -0
- data/maps/alalc-kan-Kana-Latn-2011.yaml +63 -0
- data/maps/alalc-kat-Geok-Latn-1997.yaml +2 -3
- data/maps/alalc-kat-Geor-Latn-1997.yaml +5 -1
- data/maps/alalc-kor-Hang-Latn-1997.yaml +6 -2
- data/maps/alalc-mal-Mlym-Latn-1997.yaml +303 -0
- data/maps/alalc-mal-Mlym-Latn-2012.yaml +73 -0
- data/maps/alalc-mar-Deva-Latn-1997.yaml +189 -0
- data/maps/alalc-mar-Deva-Latn-2011.yaml +45 -0
- data/maps/{alalc-mkd-cyrl-latn-1997.yaml → alalc-mkd-Cyrl-Latn-1997.yaml} +1 -1
- data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +1 -1
- data/maps/alalc-mon-Cyrl-Latn-1997.yaml +220 -0
- data/maps/alalc-ori-Orya-Latn-1997.yaml +284 -0
- data/maps/alalc-ori-Orya-Latn-2011.yaml +67 -0
- data/maps/alalc-pan-Guru-Latn-1997.yaml +256 -0
- data/maps/alalc-pan-Guru-Latn-2011.yaml +78 -0
- data/maps/alalc-per-Arab-Latn-1997.yaml +375 -0
- data/maps/alalc-pli-Deva-Latn-2012.yaml +144 -0
- data/maps/alalc-pra-Deva-Latn-2012.yaml +47 -0
- data/maps/alalc-rus-Cyrl-Latn-1997.yaml +225 -0
- data/maps/alalc-rus-Cyrl-Latn-2012.yaml +162 -0
- data/maps/alalc-san-Deva-Latn-2012.yaml +241 -0
- data/maps/alalc-sin-Sinh-Latn-1997.yaml +292 -0
- data/maps/alalc-sin-Sinh-Latn-2011.yaml +71 -0
- data/maps/alalc-srp-Cyrl-Latn-1997.yaml +5 -1
- data/maps/{alalc-srp-cyrl-latn-2013.yaml → alalc-srp-Cyrl-Latn-2013.yaml} +1 -1
- data/maps/alalc-tam-Taml-Latn-1997.yaml +62 -0
- data/maps/alalc-tam-Taml-Latn-2011.yaml +58 -0
- data/maps/alalc-tel-Telu-Latn-1997.yaml +284 -0
- data/maps/alalc-tel-Telu-Latn-2011.yaml +64 -0
- data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +5 -1
- data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +1 -1
- data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +1 -1
- data/maps/az-aze-Cyrl-Latn-1939.yaml +105 -0
- data/maps/az-aze-Cyrl-Latn-1958.yaml +45 -0
- data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +1 -2
- data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +1 -1
- data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +1 -3
- data/maps/bgn-kor-Hang-Latn-1943.yaml +8 -4
- data/maps/bgn-kor-Kore-Latn-1943.yaml +4 -4
- data/maps/bgna-bul-Cyrl-Latn-2006.yaml +1 -1
- data/maps/bgna-bul-Cyrl-Latn-2009.yaml +1 -1
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +532 -0
- data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +598 -0
- data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +1 -1
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +111 -104
- data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +188 -0
- data/maps/bgnpcgn-bal-Arab-Latn-2008.yaml +329 -0
- data/maps/{bgnpcgn-bel-cyrl-latn-1979.yaml → bgnpcgn-bel-Cyrl-Latn-1979.yaml} +5 -1
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +14 -10
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +5 -1
- data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +184 -0
- data/maps/bgnpcgn-div-Thaa-Latn-1988.yaml +75 -0
- data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +8 -5
- data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +5 -2
- data/maps/bgnpcgn-far-Latn-Latn-1964.yaml +28 -0
- data/maps/{bgnpcgn-per-Arab-Latn-1956.yaml → bgnpcgn-fas-Arab-Latn-1956.yaml} +5 -2
- data/maps/bgnpcgn-isl-Latn-Latn-1964.yaml +37 -0
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +1 -1
- data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +5 -1
- data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +1 -2
- data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.yaml +247 -0
- data/maps/bgnpcgn-kir-Cyrl-Latn-1979.yaml +218 -0
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +18 -18
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +3 -3
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +3 -3
- data/maps/bgnpcgn-kur-Arab-Latn-2007.yaml +249 -0
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +5 -1
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +2 -2
- data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +223 -0
- data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +230 -0
- data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +338 -0
- data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +673 -0
- data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +459 -0
- data/maps/bgnpcgn-pus-Arab-Latn-1968.yaml +377 -0
- data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +168 -0
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +5 -1
- data/maps/bgnpcgn-srp-Cyrl-Latn-1962.yaml +73 -0
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +5 -1
- data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +220 -0
- data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +240 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +5 -2
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +3 -92
- data/maps/bgnpcgn-urd-Arab-Latn-2007.yaml +459 -0
- data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +127 -0
- data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +82 -0
- data/maps/{bgnpcgn-chn-Hans-Latn-1979.yaml → bgnpcgn-zho-Hans-Latn-1979.yaml} +1 -1
- data/maps/bis-asm-Beng-Latn-13194-1991.yaml +159 -0
- data/maps/bis-ben-Beng-Latn-13194-1991.yaml +156 -0
- data/maps/bis-dev-Deva-Latn-13194-1991.yaml +184 -0
- data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +181 -0
- data/maps/bis-kan-Kana-Latn-13194-1991.yaml +173 -0
- data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +176 -0
- data/maps/bis-ori-Orya-Latn-13194-1991.yaml +175 -0
- data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +175 -0
- data/maps/bis-tel-Telu-Latn-13194-1991.yaml +170 -0
- data/maps/bis-tml-Taml-Latn-13194-1991.yaml +155 -0
- data/maps/by-bel-Cyrl-Latn-1998.yaml +9 -5
- data/maps/by-bel-Cyrl-Latn-2007.yaml +4 -4
- data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +899 -0
- data/maps/din-hin-Deva-Latn-33904-2018.yaml +100 -0
- data/maps/din-kat-Geor-Latn-32707-2010.yaml +145 -0
- data/maps/din-mar-Deva-Latn-33904-2018.yaml +84 -0
- data/maps/din-nep-Deva-Latn-33904-2018.yaml +119 -0
- data/maps/din-pli-Deva-Latn-33904-2018.yaml +75 -0
- data/maps/din-pra-Deva-Latn-33904-2018.yaml +63 -0
- data/maps/din-san-Deva-Latn-33904-2018.yaml +338 -0
- data/maps/din-tam-Taml-Latn-33903-2016.yaml +213 -0
- data/maps/dos-nep-Deva-Latn-1997.yaml +47 -0
- data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +7 -8
- data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +6 -7
- data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +2 -3
- data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +2 -3
- data/maps/ggg-kat-Geor-Latn-2002.yaml +5 -2
- data/maps/{gki-bel-cyrl-latn-1992.yaml → gki-bel-Cyrl-Latn-1992.yaml} +2 -2
- data/maps/{gki-bel-cyrl-latn-2000.yaml → gki-bel-Cyrl-Latn-2000.yaml} +2 -2
- data/maps/{gost-rus-cyrl-latn-16876-71-1983.yaml → gost-rus-Cyrl-Latn-16876-71-1983.yaml} +8 -4
- data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +157 -0
- data/maps/hk-yue-Hani-Latn-1888.yaml +1 -1
- data/maps/icao-bel-Cyrl-Latn-9303.yaml +1 -6
- data/maps/icao-bul-Cyrl-Latn-9303.yaml +1 -5
- data/maps/{icao-per-Arab-Latn-9303.yaml → icao-fas-Arab-Latn-9303.yaml} +1 -2
- data/maps/icao-heb-Hebr-Latn-9303.yaml +1 -1
- data/maps/icao-mkd-Cyrl-Latn-9303.yaml +1 -1
- data/maps/icao-rus-Cyrl-Latn-9303.yaml +1 -2
- data/maps/icao-srp-Cyrl-Latn-9303.yaml +1 -1
- data/maps/icao-ukr-Cyrl-Latn-9303.yaml +1 -2
- data/maps/iso-ara-Arab-Latn-233-1984.yaml +323 -0
- data/maps/iso-asm-Beng-Latn-15919-2001.yaml +75 -0
- data/maps/iso-ben-Beng-Latn-15919-2001.yaml +175 -0
- data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +11 -8
- data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +8 -5
- data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +220 -0
- data/maps/iso-hin-Deva-Latn-15919-2001.yaml +87 -0
- data/maps/iso-inc-Deva-Latn-15919-2001.yaml +61 -0
- data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +10 -6
- data/maps/iso-kan-Kana-Latn-15919-2001.yaml +220 -0
- data/maps/iso-kat-Geor-Latn-9984-1996.yaml +145 -0
- data/maps/iso-kor-Hang-Latn-1996-method1.yaml +240 -0
- data/maps/iso-kor-Hang-Latn-1996-method2.yaml +226 -0
- data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +281 -0
- data/maps/iso-mar-Deva-Latn-15919-2001.yaml +75 -0
- data/maps/iso-nep-Deva-Latn-15919-2001.yaml +87 -0
- data/maps/iso-ori-Orya-Latn-15919-2001.yaml +193 -0
- data/maps/iso-pan-Guru-Latn-15919-2001.yaml +222 -0
- data/maps/iso-pli-Beng-Latn-15919-2001.yaml +73 -0
- data/maps/iso-pli-Deva-Latn-15919-2001.yaml +74 -0
- data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +219 -0
- data/maps/iso-pli-Thai-Latn-15919-2001.yaml +55 -0
- data/maps/iso-pra-Deva-Latn-15919-2001.yaml +59 -0
- data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +366 -0
- data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +3 -4
- data/maps/iso-san-Deva-Latn-15919-2001.yaml +220 -0
- data/maps/iso-tam-Taml-Latn-15919-2001.yaml +159 -0
- data/maps/iso-tel-Telu-Latn-15919-2001.yaml +220 -0
- data/maps/iso-tha-Thai-Latn-11940-1998.yaml +2 -2
- data/maps/kp-kor-Hang-Latn-2002.yaml +29 -21
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +3 -3
- data/maps/masm-mon-Cyrl-Latn-5217-2012.yaml +163 -0
- data/maps/masm-mon-Latn-Cyrl-5217-2012.yaml +200 -0
- data/maps/mext-jpn-Hrkt-Latn-1954.yaml +1 -1
- data/maps/moct-kor-Hang-Latn-2000.yaml +6 -2
- data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +1 -1
- data/maps/mv-div-Thaa-Latn-1987.yaml +200 -0
- data/maps/mvd-bel-Cyrl-Latn-2008.yaml +225 -0
- data/maps/mvd-bel-Cyrl-Latn-2010.yaml +63 -0
- data/maps/mvd-rus-Cyrl-Latn-2008.yaml +109 -0
- data/maps/mvd-rus-Cyrl-Latn-2010.yaml +37 -0
- data/maps/odni-ara-Arab-Latn-2004.yaml +137 -0
- data/maps/odni-ara-Arab-Latn-2015.yaml +315 -0
- data/maps/odni-aze-Cyrl-Latn-2015.yaml +144 -0
- data/maps/odni-bel-Cyrl-Latn-2015.yaml +148 -0
- data/maps/odni-bul-Cyrl-Latn-2005.yaml +90 -0
- data/maps/odni-bul-Cyrl-Latn-2015.yaml +96 -0
- data/maps/odni-che-Cyrl-Latn-2015.yaml +169 -0
- data/maps/odni-fas-Arab-Latn-2004.yaml +276 -0
- data/maps/odni-fas-Arab-Latn-2015.yaml +406 -0
- data/maps/odni-hin-Deva-Latn-2004.yaml +182 -0
- data/maps/odni-hin-Deva-Latn-2015.yaml +258 -0
- data/maps/odni-kat-Geor-Latn-2015.yaml +2 -3
- data/maps/odni-kaz-Cyrl-Latn-2015.yaml +148 -0
- data/maps/odni-kir-Cyrl-Latn-2015.yaml +136 -0
- data/maps/odni-kor-Hang-Latn-2015.yaml +375 -0
- data/maps/odni-mkd-Cyrl-Latn-2005.yaml +21 -0
- data/maps/odni-mkd-Cyrl-Latn-2015.yaml +122 -0
- data/maps/odni-prs-Arab-Latn-2004.yaml +123 -0
- data/maps/odni-prs-Arab-Latn-2015.yaml +228 -0
- data/maps/odni-rus-Cyrl-Latn-2015.yaml +77 -0
- data/maps/odni-srp-Cyrl-Latn-2005.yaml +36 -0
- data/maps/odni-srp-Cyrl-Latn-2015.yaml +129 -0
- data/maps/odni-tat-Cyrl-Latn-2015.yaml +142 -0
- data/maps/odni-tgk-Cyrl-Latn-2015.yaml +148 -0
- data/maps/odni-tuk-Cyrl-Latn-2015.yaml +170 -0
- data/maps/odni-uig-Cyrl-Latn-2015.yaml +138 -0
- data/maps/odni-ukr-Cyrl-Latn-2015.yaml +6 -2
- data/maps/odni-urd-Arab-Latn-2015.yaml +221 -0
- data/maps/odni-uzb-Cyrl-Latn-2015.yaml +166 -0
- data/maps/royin-tha-Thai-Latn-1939-generic.yaml +5 -5
- data/maps/royin-tha-Thai-Latn-1968.yaml +9 -5
- data/maps/royin-tha-Thai-Latn-1999-chained.yaml +5 -5
- data/maps/royin-tha-Thai-Latn-1999.yaml +8 -4
- data/maps/sac-zho-Hans-Latn-1979.yaml +5 -1
- data/maps/sasm-mon-Mong-Latn-general-1978.yaml +389 -0
- data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +354 -0
- data/maps/ses-ara-Arab-Latn-1930.yaml +283 -0
- data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +1 -1
- data/maps/ua-ukr-Cyrl-Latn-1996.yaml +6 -2
- data/maps/ua-ukr-Cyrl-Latn-2007.yaml +75 -0
- data/maps/ua-ukr-Cyrl-Latn-2010.yaml +192 -0
- data/maps/un-amh-Ethi-Latn-2016.yaml +602 -0
- data/maps/un-ara-Arab-Latn-1971.yaml +139 -0
- data/maps/un-ara-Arab-Latn-1972.yaml +159 -0
- data/maps/un-ara-Arab-Latn-2017.yaml +420 -0
- data/maps/un-asm-Beng-Latn-1972.yaml +223 -0
- data/maps/un-bel-Cyrl-Latn-2007.yaml +4 -4
- data/maps/un-ben-Beng-Latn-2016.yaml +1 -1
- data/maps/{un-ell-Grek-Latn-phonetic-1987.yaml → un-ell-Grek-Latn-1987-phonetic.yaml} +44 -44
- data/maps/un-ell-Grek-Latn-1987-tl.yaml +3 -4
- data/maps/un-ell-Grek-Latn-1987-ts.yaml +3 -4
- data/maps/un-guj-Gujr-Latn-1972.yaml +229 -0
- data/maps/un-hin-Deva-Latn-2016.yaml +316 -0
- data/maps/un-kan-Kana-Latn-2016.yaml +254 -0
- data/maps/un-mal-Mlym-Latn-1972.yaml +251 -0
- data/maps/un-mar-Deva-Latn-2016.yaml +102 -0
- data/maps/un-mon-Mong-Latn-general-2013.yaml +264 -0
- data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +264 -0
- data/maps/un-nep-Deva-Latn-1972.yaml +269 -0
- data/maps/un-nep-Deva-Latn-2013.yaml +74 -0
- data/maps/un-ori-Orya-Latn-1972.yaml +247 -0
- data/maps/un-pan-Guru-Latn-1972.yaml +402 -0
- data/maps/un-prs-Arab-Latn-1967.yaml +236 -0
- data/maps/un-rus-Cyrl-Latn-1987.yaml +2 -2
- data/maps/un-tam-Taml-Latn-1972.yaml +194 -0
- data/maps/un-tel-Telu-Latn-1972.yaml +270 -0
- data/maps/un-ukr-Cyrl-Latn-1998.yaml +53 -0
- data/maps/un-ukr-Cyrl-Latn-2012.yaml +162 -0
- data/maps/un-urd-Arab-Latn-1972.yaml +405 -0
- data/maps/var-amh-Ethi-Latn-eae-2003.yaml +466 -0
- data/maps/var-gez-Ethi-Latn-eae-2003.yaml +76 -0
- data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +221 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +1 -1
- data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +1 -1
- data/maps/{nil-kor-Hang-Hang-jamo.yaml → var-kor-Hang-Hang-jamo.yaml} +4 -4
- data/maps/var-kor-Hang-Latn-mr-1939.yaml +4 -4
- data/maps/var-kor-Kore-Hang-2013.yaml +2 -2
- data/maps/var-kor-Kore-Latn-mr-1939.yaml +2 -3
- data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +43 -0
- data/maps/var-mon-Mong-Latn-1930.yaml +102 -0
- data/maps/var-mon-Mong-Latn-lessing.yaml +272 -0
- data/maps/var-mon-Mong-Latn-vpmc.yaml +274 -0
- data/maps/var-pra-Deva-Latn-iast-1912.yaml +30 -0
- data/maps/var-san-Deva-Latn-iast-1912.yaml +149 -0
- data/maps/var-tha-Thai-Thai-phonemic.yaml +6 -6
- data/maps/var-tha-Thai-Zsym-ipa.yaml +13 -13
- data/maps/{var-zho-Hani-Latn-1979.yaml → var-zho-Hani-Latn-wd-1979.yaml} +13 -9
- data/spec/interscript/filenames_spec.rb +21 -0
- data/spec/interscript_spec.rb +16 -5
- metadata +275 -27
- data/bin/interscript +0 -41
- data/bin/rspec +0 -29
- data/bin/setup +0 -8
- data/maps/un-mon-Mong-Latn-2013.yaml +0 -93
- data/maps/un-ukr-cyrl-latn-1998.yaml +0 -30
|
@@ -0,0 +1,127 @@
|
|
|
1
|
+
---
|
|
2
|
+
authority_id: bgnpcgn
|
|
3
|
+
id: 1979
|
|
4
|
+
language: iso-639-2:uzb
|
|
5
|
+
source_script: Cyrl
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: BGN/PCGN Romanization System -- Uzbek Cyrillic (1979)
|
|
8
|
+
url: http://transliteration.eki.ee/pdf/Uzbek.pdf
|
|
9
|
+
creation_date: 1979
|
|
10
|
+
|
|
11
|
+
notes:
|
|
12
|
+
- The character Е (е) is romanized Ye (ye) at the beginning of a syllable, after a vowel, ъ or ь.
|
|
13
|
+
|
|
14
|
+
tests:
|
|
15
|
+
# https://ru.wikipedia.org/wiki/Узбекский_язык
|
|
16
|
+
- source: Ўзбек ёзуви
|
|
17
|
+
expected: Ŭzbek yozuwi
|
|
18
|
+
- source: Ўзбек тили
|
|
19
|
+
expected: Ŭzbek tili
|
|
20
|
+
- source: катта
|
|
21
|
+
expected: katta
|
|
22
|
+
- source: куп
|
|
23
|
+
expected: kup
|
|
24
|
+
- source: кальта
|
|
25
|
+
expected: kalʼta
|
|
26
|
+
- source: Бори элға яхшилик қилғилки, мундин яхши йўқ Ким, дегайлар даҳр аро қолди фалондин яхшилик
|
|
27
|
+
expected: Bori elgha yakhshilik qilghilki, mundin yakhshi yŭq Kim, degaylar dahr aro qoldi falondin yakhshilik
|
|
28
|
+
- source: Бахр ул-худо
|
|
29
|
+
expected: Bakhr ul-khudo
|
|
30
|
+
- source: Рисале-йи маариф-и Шейбани
|
|
31
|
+
expected: Risale-yi maarif-i Sheybani
|
|
32
|
+
- source: Карами Хакка нихоят йукдур
|
|
33
|
+
expected: Karami Khakka nikhoyat yukdur
|
|
34
|
+
- source: Йахши
|
|
35
|
+
expected: Yakhshi
|
|
36
|
+
- source: Тутук белгись
|
|
37
|
+
expected: Tutuk belgisʼ
|
|
38
|
+
- source: |
|
|
39
|
+
Барча одамлар эркин, қадр-қиммат ва ҳуқуқларда тенг бўлиб туғиладилар.
|
|
40
|
+
Улар ақл ва виждон соҳибидирлар ва бир-бирлари ила биродарларча муомала қилишлари зарур.
|
|
41
|
+
expected: |
|
|
42
|
+
Barcha odamlar erkin, qadr-qimmat wa huquqlarda teng bŭlib tughiladilar.
|
|
43
|
+
Ular aql wa wizhdon sohibidirlar wa bir-birlari ila birodarlarcha muomala qilishlari zarur.
|
|
44
|
+
- source: ПАПАПАЧУКА Респект!
|
|
45
|
+
expected: PAPAPACHUKA Respekt!
|
|
46
|
+
|
|
47
|
+
map:
|
|
48
|
+
rules:
|
|
49
|
+
# note[1]
|
|
50
|
+
- pattern: (?<=[АаЕеЁёИиОоУуЭэЮюЯяЪъЬь])\u0415
|
|
51
|
+
result: Ye
|
|
52
|
+
- pattern: (?<=[АаЕеЁёИиОоУуЭэЮюЯяЪъЬь])\u0435
|
|
53
|
+
result: ye
|
|
54
|
+
|
|
55
|
+
characters:
|
|
56
|
+
'\u0410': 'A' # А
|
|
57
|
+
'\u0411': 'B' # Б
|
|
58
|
+
'\u0412': 'W' # В
|
|
59
|
+
'\u0413': 'G' # Г
|
|
60
|
+
'\u0492': 'Gh' # Ғ
|
|
61
|
+
'\u0414': 'D' # Д
|
|
62
|
+
'\u0415': 'E' # Е
|
|
63
|
+
'\u0401': 'Yo' # Ё
|
|
64
|
+
'\u0416': 'Zh' # Ж
|
|
65
|
+
'\u0417': 'Z' # З
|
|
66
|
+
'\u0418': 'I' # И
|
|
67
|
+
'\u0419': 'Y' # Й
|
|
68
|
+
'\u041A': 'K' # К
|
|
69
|
+
'\u049A': 'Q' # Қ
|
|
70
|
+
'\u041B': 'L' # Л
|
|
71
|
+
'\u041C': 'M' # М
|
|
72
|
+
'\u041D': 'N' # Н
|
|
73
|
+
'\u041E': 'O' # О
|
|
74
|
+
'\u041F': 'P' # П
|
|
75
|
+
'\u0420': 'R' # Р
|
|
76
|
+
'\u0421': 'S' # С
|
|
77
|
+
'\u0422': 'T' # Т
|
|
78
|
+
'\u0423': 'U' # У
|
|
79
|
+
'\u040E': 'Ŭ' # Ў
|
|
80
|
+
'\u0424': 'F' # Ф
|
|
81
|
+
'\u0425': 'Kh' # Х
|
|
82
|
+
'\u04B2': 'H' # Ҳ
|
|
83
|
+
'\u0426': 'Ts' # Ц
|
|
84
|
+
'\u0427': 'Ch' # Ч
|
|
85
|
+
'\u0428': 'Sh' # Ш
|
|
86
|
+
'\u042a': "\u02BC" # Ъ
|
|
87
|
+
'\u042c': "\u02BC" # Ь
|
|
88
|
+
'\u042D': 'E' # Э
|
|
89
|
+
'\u042E': 'Yu' # Ю
|
|
90
|
+
'\u042F': 'Ya' # Я
|
|
91
|
+
|
|
92
|
+
'\u0430': 'a' # а
|
|
93
|
+
'\u0431': 'b' # б
|
|
94
|
+
'\u0432': 'w' # в
|
|
95
|
+
'\u0433': 'g' # г
|
|
96
|
+
'\u0493': 'gh' # ғ
|
|
97
|
+
'\u0434': 'd' # д
|
|
98
|
+
'\u0435': 'e' # e
|
|
99
|
+
'\u0451': 'yo' # ё
|
|
100
|
+
'\u0436': 'zh' # ж
|
|
101
|
+
'\u0437': 'z' # з
|
|
102
|
+
'\u0438': 'i' # и
|
|
103
|
+
'\u0439': 'y' # й
|
|
104
|
+
'\u043A': 'k' # к
|
|
105
|
+
'\u049B': 'q' # қ
|
|
106
|
+
'\u043B': 'l' # л
|
|
107
|
+
'\u043C': 'm' # м
|
|
108
|
+
'\u043D': 'n' # н
|
|
109
|
+
'\u043E': 'o' # о
|
|
110
|
+
'\u043F': 'p' # п
|
|
111
|
+
'\u0440': 'r' # р
|
|
112
|
+
'\u0441': 's' # с
|
|
113
|
+
'\u0442': 't' # т
|
|
114
|
+
'\u0443': 'u' # у
|
|
115
|
+
'\u045E': 'ŭ' # ў
|
|
116
|
+
'\u0444': 'f' # ф
|
|
117
|
+
'\u0445': 'kh' # х
|
|
118
|
+
'\u04B3': 'h' # ҳ
|
|
119
|
+
'\u0446': 'ts' # ц
|
|
120
|
+
'\u0447': 'ch' # ч
|
|
121
|
+
'\u0448': 'sh' # ш
|
|
122
|
+
'\u044a': "\u02BC" # ъ
|
|
123
|
+
'\u044c': "\u02BC" # ь
|
|
124
|
+
'\u044D': 'e' # э
|
|
125
|
+
'\u044F': 'ya' # я
|
|
126
|
+
'\u044E': 'yu' # ю
|
|
127
|
+
|
|
@@ -0,0 +1,82 @@
|
|
|
1
|
+
---
|
|
2
|
+
authority_id: bgnpcgn
|
|
3
|
+
id: 2000
|
|
4
|
+
language: iso-639-2:uzb
|
|
5
|
+
source_script: Cyrl
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: TABLE OF CORRESPONDENCES CYRILLIC - ROMAN BGN/PCGN 2000 Agreement
|
|
8
|
+
description: |
|
|
9
|
+
In 1995, the Uzbek government adopted the Roman alphabet to replace the existing Cyrillic alphabet.
|
|
10
|
+
The presentation below provides a table of correspondences between the former Cyrillic alphabet and the
|
|
11
|
+
current Roman alphabet. When Uzbek Roman-alphabet spellings are not available, this table can be used to
|
|
12
|
+
convert Uzbek Cyrillic spellings. This table of correspondences supersedes the BGN/PCGN 1979 romanization
|
|
13
|
+
system for Uzbek.
|
|
14
|
+
url: http://transliteration.eki.ee/pdf/Uzbek.pdf
|
|
15
|
+
creation_date: 2000
|
|
16
|
+
confirmation_date: 2017-11
|
|
17
|
+
|
|
18
|
+
notes:
|
|
19
|
+
- The letter sequence ye is used initially, after the vowel characters 1, 6, 7, 10, 16, 21, 29, 30, 31, and 32, and after characters 11 and 28.
|
|
20
|
+
- The Unicode encoding of the apostrophe appearing in rows 27 and 28 is U+2019. The inverted apostrophe appearing in rows 32 (o‘) and 34 (g‘) is U+2018.
|
|
21
|
+
- The Roman-script columns show only lowercase forms but, when applying the table, uppercase and lowercase Roman letters as appropriate should be used.
|
|
22
|
+
|
|
23
|
+
tests:
|
|
24
|
+
# https://ru.wikipedia.org/wiki/Узбекский_язык
|
|
25
|
+
- source: Ўзбек ёзуви
|
|
26
|
+
expected: O‘zbek yozuwi
|
|
27
|
+
- source: Ўзбек тили
|
|
28
|
+
expected: O‘zbek tili
|
|
29
|
+
- source: катта
|
|
30
|
+
expected: katta
|
|
31
|
+
- source: куп
|
|
32
|
+
expected: kup
|
|
33
|
+
- source: кальта
|
|
34
|
+
expected: kal’ta
|
|
35
|
+
- source: Бори элға яхшилик қилғилки, мундин яхши йўқ Ким, дегайлар даҳр аро қолди фалондин яхшилик
|
|
36
|
+
expected: Bori elg‘a yaxshilik qilg‘ilki, mundin yaxshi yo‘q Kim, degaylar dahr aro qoldi falondin yaxshilik
|
|
37
|
+
- source: Бахр ул-худо
|
|
38
|
+
expected: Baxr ul-xudo
|
|
39
|
+
- source: Рисале-йи маариф-и Шейбани
|
|
40
|
+
expected: Risale-yi maarif-i Sheybani
|
|
41
|
+
- source: Карами Хакка нихоят йукдур
|
|
42
|
+
expected: Karami Xakka nixoyat yukdur
|
|
43
|
+
- source: Йахши
|
|
44
|
+
expected: Yaxshi
|
|
45
|
+
- source: Тутук белгись
|
|
46
|
+
expected: Tutuk belgis’
|
|
47
|
+
- source: |
|
|
48
|
+
Барча одамлар эркин, қадр-қиммат ва ҳуқуқларда тенг бўлиб туғиладилар.
|
|
49
|
+
Улар ақл ва виждон соҳибидирлар ва бир-бирлари ила биродарларча муомала қилишлари зарур.
|
|
50
|
+
expected: |
|
|
51
|
+
Barcha odamlar erkin, qadr-qimmat wa huquqlarda teng bo‘lib tug‘iladilar.
|
|
52
|
+
Ular aql wa wijdon sohibidirlar wa bir-birlari ila birodarlarcha muomala qilishlari zarur.
|
|
53
|
+
- source: ПАПАПАЧУКА Респект!
|
|
54
|
+
expected: PAPAPACHUKA Respekt!
|
|
55
|
+
|
|
56
|
+
map:
|
|
57
|
+
inherit: bgnpcgn-uzb-Cyrl-Latn-1979
|
|
58
|
+
|
|
59
|
+
rules:
|
|
60
|
+
# note[1]
|
|
61
|
+
- pattern: (?<=[АаЕеЁёИиОоУуЭэЮюЯяЙйЬь])\u0415
|
|
62
|
+
result: Ye
|
|
63
|
+
- pattern: (?<=[АаЕеЁёИиОоУуЭэЮюЯяЙйЬь])\u0435
|
|
64
|
+
result: ye
|
|
65
|
+
|
|
66
|
+
characters:
|
|
67
|
+
'\u0412': 'V' # В
|
|
68
|
+
'\u0492': "G\u2018" # Ғ
|
|
69
|
+
'\u0416': 'J' # Ж
|
|
70
|
+
'\u040E': "O\u2018" # Ў
|
|
71
|
+
'\u0425': 'X' # Х
|
|
72
|
+
'\u042a': "\u2019" # Ъ note[2]
|
|
73
|
+
'\u042c': "\u2019" # Ь note[2]
|
|
74
|
+
|
|
75
|
+
'\u0432': 'w' # в
|
|
76
|
+
'\u0493': "g\u2018" # ғ
|
|
77
|
+
'\u0436': 'j' # ж
|
|
78
|
+
'\u045E': "o\u2018" # ў
|
|
79
|
+
'\u0445': 'x' # х
|
|
80
|
+
'\u044a': "\u2019" # ъ note[2]
|
|
81
|
+
'\u044c': "\u2019" # ь note[2]
|
|
82
|
+
|
|
@@ -0,0 +1,159 @@
|
|
|
1
|
+
---
|
|
2
|
+
authority_id: bis
|
|
3
|
+
id: 1991
|
|
4
|
+
language: iso-639-2:asm
|
|
5
|
+
source_script: Beng
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: Indian script code for information interchange - ISCII - Assamese Romanization
|
|
8
|
+
#url:
|
|
9
|
+
creation_date: 1991
|
|
10
|
+
description: |
|
|
11
|
+
IS 13194 (1991): Indian script code for information
|
|
12
|
+
interchange - ISCII [LITD 20: Indian Language Technologies
|
|
13
|
+
and Products]
|
|
14
|
+
|
|
15
|
+
notes:
|
|
16
|
+
- |
|
|
17
|
+
Exception: Anusvāra is transliterated by:
|
|
18
|
+
|
|
19
|
+
a) ṅ before gutturals,
|
|
20
|
+
b) ñ before palatals,
|
|
21
|
+
c) ṇ before cerebrals,
|
|
22
|
+
d) n before dentals, and
|
|
23
|
+
e) m before labials.
|
|
24
|
+
|
|
25
|
+
tests:
|
|
26
|
+
- source: "অসমীয়া কবিতা"
|
|
27
|
+
expected: "asmīẏā kbitā"
|
|
28
|
+
- source: "কবিৰ আজি জন্মদিন"
|
|
29
|
+
expected: "kbir āji jnmdin"
|
|
30
|
+
- source: "বেৰুটত এমাহৰ পাছতে পুনৰ ভয়ংকৰ অগ্নিকাণ্ড"
|
|
31
|
+
expected: "bēruṭt ēmāhr pāchtē punr bhẏṅkr agnikāṇḍ"
|
|
32
|
+
- source: "ভঙাৰ বিৰুদ্ধে আৱেদন দাখিল কংগনাৰ"
|
|
33
|
+
expected: "bhṅār biruddhē āvēdn dākhil kṅgnār"
|
|
34
|
+
- source: "আপুনি পঢ়ি ভাল পাব পৰা বাতৰি"
|
|
35
|
+
expected: "āpuni pd̂hi bhāl pāb prā bātri"
|
|
36
|
+
- source: "শ্ৰীৰামপুৰত গৰুভৰ্তি ট্ৰাক জব্দ, দুজনক আটক"
|
|
37
|
+
expected: "śrīrāmpurt grubhrti ṭrāk jbd, dujnk āṭk"
|
|
38
|
+
- source: "কেনে আছে প্ৰাক্তন"
|
|
39
|
+
expected: "kēnē āchē prāktn"
|
|
40
|
+
- source: "কমুম্বাইৰ মেয়ৰৰ দেহত কোভিড পজিটিভ"
|
|
41
|
+
expected: "kmumbāir mēẏrr dēht kŏbhiḍ pjiṭibh"
|
|
42
|
+
- source: "টুইটাৰযোগে খোদ সদৰী কৰে এই কথা"
|
|
43
|
+
expected: "ṭuiṭāryŏgē khŏd sdrī krē ēi kthā"
|
|
44
|
+
- source: "লখিমপুৰ জিলাৰ নাৰায়ণপুৰৰ বৰপথাৰত আজি প্ৰশান্তি ধাম নামেৰে এখন বৃদ্ধাশ্ৰমৰ শুভাৰম্ভ কৰা হয়"
|
|
45
|
+
expected: "lkhimpur jilār nārāẏṇpurr brpthārt āji prśānti dhām nāmērē ēkhn bṛddhāśrmr śubhārmbh krā hẏ"
|
|
46
|
+
|
|
47
|
+
map:
|
|
48
|
+
|
|
49
|
+
rules:
|
|
50
|
+
# note
|
|
51
|
+
- pattern: \u0982(?=[কখগঘঙ])
|
|
52
|
+
result: ṅ
|
|
53
|
+
- pattern: \u0982(?=[চছজঝঞ])
|
|
54
|
+
result: ñ
|
|
55
|
+
- pattern: \u0982(?=[টঠডড়ঢঢ়ণ])
|
|
56
|
+
result: ṇ
|
|
57
|
+
- pattern: \u0982(?=[তৎথদধন])
|
|
58
|
+
result: n
|
|
59
|
+
- pattern: \u0982(?=[পফবভম])
|
|
60
|
+
result: m
|
|
61
|
+
|
|
62
|
+
|
|
63
|
+
characters:
|
|
64
|
+
'অ': 'a'
|
|
65
|
+
'আ': 'ā'
|
|
66
|
+
'ই': 'i'
|
|
67
|
+
'ঈ': 'ī'
|
|
68
|
+
'উ': 'u'
|
|
69
|
+
'ঊ': 'ū'
|
|
70
|
+
'ৠ': 'ṛ'
|
|
71
|
+
'ঌ': 'ḻ'
|
|
72
|
+
'এ': 'ē'
|
|
73
|
+
'ঐ': 'ai'
|
|
74
|
+
'ও': 'ŏ'
|
|
75
|
+
'ঔ': 'au'
|
|
76
|
+
|
|
77
|
+
# Consonants
|
|
78
|
+
# Gutturals
|
|
79
|
+
'ক': 'k'
|
|
80
|
+
'খ': 'kh'
|
|
81
|
+
'গ': 'g'
|
|
82
|
+
'ঘ': 'gh'
|
|
83
|
+
'ঙ': 'ṅ'
|
|
84
|
+
|
|
85
|
+
# Palatals
|
|
86
|
+
'চ': 'c'
|
|
87
|
+
'ছ': 'ch'
|
|
88
|
+
'জ': 'j'
|
|
89
|
+
'ঝ': 'jh'
|
|
90
|
+
'ঞ': 'ñ'
|
|
91
|
+
|
|
92
|
+
# Cerebrals
|
|
93
|
+
'ট': 'ṭ'
|
|
94
|
+
'ঠ': 'ṭh'
|
|
95
|
+
'ড': 'ḍ'
|
|
96
|
+
'ড়': 'd̂'
|
|
97
|
+
'ঢ': 'ḍh'
|
|
98
|
+
'ঢ়': 'd̂h'
|
|
99
|
+
'ণ': 'ṇ'
|
|
100
|
+
|
|
101
|
+
# Dentals
|
|
102
|
+
'ত': 't'
|
|
103
|
+
'ৎ': 't'
|
|
104
|
+
'থ': 'th'
|
|
105
|
+
'দ': 'd'
|
|
106
|
+
'ধ': 'dh'
|
|
107
|
+
'ন': 'n'
|
|
108
|
+
|
|
109
|
+
# Labials
|
|
110
|
+
'প': 'p'
|
|
111
|
+
'ফ': 'ph'
|
|
112
|
+
'ব': 'b'
|
|
113
|
+
'ভ': 'bh'
|
|
114
|
+
'ম': 'm'
|
|
115
|
+
|
|
116
|
+
# Semivowels
|
|
117
|
+
'য': 'y'
|
|
118
|
+
'য়': 'ẏ'
|
|
119
|
+
'য়': 'ẏ'
|
|
120
|
+
'ৰ': 'r'
|
|
121
|
+
'ল': 'l'
|
|
122
|
+
'ৱ': 'v'
|
|
123
|
+
|
|
124
|
+
|
|
125
|
+
# Sibilants
|
|
126
|
+
'শ': 'ś'
|
|
127
|
+
'ষ': 'ṣ'
|
|
128
|
+
'স': 's'
|
|
129
|
+
|
|
130
|
+
|
|
131
|
+
# Aspirate
|
|
132
|
+
'হ': 'h'
|
|
133
|
+
|
|
134
|
+
# Chandrabindu
|
|
135
|
+
'ঁ': 'm'
|
|
136
|
+
|
|
137
|
+
# Bisarga
|
|
138
|
+
'ঃ ': 'ḥ'
|
|
139
|
+
|
|
140
|
+
# Anusvāra
|
|
141
|
+
'ং': 'ṃ'
|
|
142
|
+
|
|
143
|
+
# Medials # Needed for connecting consonants
|
|
144
|
+
|
|
145
|
+
'\u09be': 'ā'
|
|
146
|
+
'\u09bf': 'i'
|
|
147
|
+
'\u09c0': 'ī'
|
|
148
|
+
'\u09c1': 'u'
|
|
149
|
+
'\u09c2': 'ū'
|
|
150
|
+
'\u09c3': 'ṛ'
|
|
151
|
+
'\u09c7': 'ē'
|
|
152
|
+
'\u09c8': 'ai'
|
|
153
|
+
'\u09cb': 'ŏ'
|
|
154
|
+
'\u09cc': 'au'
|
|
155
|
+
'\u09CD': '' # Used for joining
|
|
156
|
+
'्': ''
|
|
157
|
+
'़': ''
|
|
158
|
+
'।': '.'
|
|
159
|
+
"": ''# Used for joining
|
|
@@ -0,0 +1,156 @@
|
|
|
1
|
+
---
|
|
2
|
+
authority_id: bis
|
|
3
|
+
id: 1991
|
|
4
|
+
language: iso-639-2:ben
|
|
5
|
+
source_script: Beng
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: Indian script code for information interchange - ISCII - Bengali Romanization
|
|
8
|
+
#url:
|
|
9
|
+
creation_date: 1991
|
|
10
|
+
description: |
|
|
11
|
+
IS 13194 (1991): Indian script code for information
|
|
12
|
+
interchange - ISCII [LITD 20: Indian Language Technologies
|
|
13
|
+
and Products]
|
|
14
|
+
|
|
15
|
+
notes:
|
|
16
|
+
- |
|
|
17
|
+
Exception: Anusvāra is transliterated by:
|
|
18
|
+
|
|
19
|
+
a) ṅ before gutturals,
|
|
20
|
+
b) ñ before palatals,
|
|
21
|
+
c) ṇ before cerebrals,
|
|
22
|
+
d) n before dentals, and
|
|
23
|
+
e) m before labials.
|
|
24
|
+
|
|
25
|
+
tests:
|
|
26
|
+
- source: "টিকা"
|
|
27
|
+
expected: "ṭikā"
|
|
28
|
+
- source: "শুরু"
|
|
29
|
+
expected: "śuru"
|
|
30
|
+
- source: "করোনাভাইরাসের উপসর্গ রয়েছে এমন ভ্রমণকারীদের শনাক্ত করতেই এ ব্যবস্থা নেওয়া হয়"
|
|
31
|
+
expected: "krŏnābhāirāsēr upsrg rẏēchē ēmn bhrmṇkārīdēr śnākt krtēi ē bybsthā nēŏẏā hẏ"
|
|
32
|
+
- source: "চীন এ ভাইরাসের সংক্রমণ ছড়িয়ে পড়ার বিষয়টি নিশ্চিত করার পর এ অঞ্চলের দেশগুলো নিজেদের বন্দরগুলোতে নজরদারি শুরু করে"
|
|
33
|
+
expected: "cīn ē bhāirāsēr sṅkrmṇ chd̂iẏē pd̂ār biṣẏṭi niścit krār pr ē añclēr dēśgulŏ nijēdēr bndrgulŏtē njrdāri śuru krē"
|
|
34
|
+
- source: "আপনার কি মনে হয়, দক্ষিণ এশিয়ার দেশগুলো সফলভাবে এ সুযোগের সদ্ব্যবহার করতে পেরেছে?"
|
|
35
|
+
expected: "āpnār ki mnē hẏ, dkṣiṇ ēśiẏār dēśgulŏ sphlbhābē ē suyŏgēr sdbybhār krtē pērēchē?"
|
|
36
|
+
- source: "এরপর এ ভাইরাসের সংক্রমণ দক্ষিণ এশিয়ায় ছড়িয়ে পড়ার আগে এ অঞ্চলের দেশগুলো চলতি বছরের শুরুর দিকে মহামারি মোকাবিলায় কয়েক মাস সময় পেয়েছিল"
|
|
37
|
+
expected: "ērpr ē bhāirāsēr sṅkrmṇ dkṣiṇ ēśiẏāẏ chd̂iẏē pd̂ār āgē ē añclēr dēśgulŏ clti bchrēr śurur dikē mhāmāri mŏkābilāẏ kẏēk mās smẏ pēẏēchil"
|
|
38
|
+
- source: "ন্যূনতম শেয়ার না থাকলে ছাড়তেই হবে পরিচালক পদ"
|
|
39
|
+
expected: "nyūntm śēẏār nā thāklē chād̂tēi hbē pricālk pd"
|
|
40
|
+
- source: "বিজন কুমার শীলের ‘ওয়ার্ক পারমিট’ পেতে অনিশ্চয়তা"
|
|
41
|
+
expected: "bijn kumār śīlēr ‘ŏẏārk pārmiṭ’ pētē aniścẏtā"
|
|
42
|
+
- source: "বাংলাদেশে হার্ড ইমিউনিটি তৈরি হওয়ার তথ্য–প্রমাণ মেলেনি"
|
|
43
|
+
expected: "bāṃlādēśē hārḍ imiuniṭi tairi hŏẏār tthy–prmāṇ mēlēni"
|
|
44
|
+
- source: "চীনে গত বছর করোনাভাইরাসের মহামারির সূত্রপাত হয়"
|
|
45
|
+
expected: "cīnē gt bchr krŏnābhāirāsēr mhāmārir sūtrpāt hẏ"
|
|
46
|
+
map:
|
|
47
|
+
|
|
48
|
+
rules:
|
|
49
|
+
# note
|
|
50
|
+
- pattern: \u0982(?=[কখগঘঙ])
|
|
51
|
+
result: ṅ
|
|
52
|
+
- pattern: \u0982(?=[চছজঝঞ])
|
|
53
|
+
result: ñ
|
|
54
|
+
- pattern: \u0982(?=[টঠডড়ঢঢ়ণ])
|
|
55
|
+
result: ṇ
|
|
56
|
+
- pattern: \u0982(?=[তৎথদধন])
|
|
57
|
+
result: n
|
|
58
|
+
- pattern: \u0982(?=[পফবভম])
|
|
59
|
+
result: m
|
|
60
|
+
|
|
61
|
+
|
|
62
|
+
characters:
|
|
63
|
+
'অ': 'a'
|
|
64
|
+
'আ': 'ā'
|
|
65
|
+
'ই': 'i'
|
|
66
|
+
'ঈ': 'ī'
|
|
67
|
+
'উ': 'u'
|
|
68
|
+
'ঊ': 'ū'
|
|
69
|
+
'ৠ': 'ṛ'
|
|
70
|
+
'ঌ': 'ḻ'
|
|
71
|
+
'এ': 'ē'
|
|
72
|
+
'ঐ': 'ai'
|
|
73
|
+
'ও': 'ŏ'
|
|
74
|
+
'ঔ': 'au'
|
|
75
|
+
|
|
76
|
+
# II. Consonants (see Note 2)
|
|
77
|
+
# Gutturals
|
|
78
|
+
'ক': 'k'
|
|
79
|
+
'খ': 'kh'
|
|
80
|
+
'গ': 'g'
|
|
81
|
+
'ঘ': 'gh'
|
|
82
|
+
'ঙ': 'ṅ'
|
|
83
|
+
|
|
84
|
+
# Palatals
|
|
85
|
+
'চ': 'c'
|
|
86
|
+
'ছ': 'ch'
|
|
87
|
+
'জ': 'j'
|
|
88
|
+
'ঝ': 'jh'
|
|
89
|
+
'ঞ': 'ñ'
|
|
90
|
+
|
|
91
|
+
# Cerebrals
|
|
92
|
+
'ট': 'ṭ'
|
|
93
|
+
'ঠ': 'ṭh'
|
|
94
|
+
'ড': 'ḍ'
|
|
95
|
+
'ড়': 'd̂'
|
|
96
|
+
'ঢ': 'ḍh'
|
|
97
|
+
'ঢ়': 'd̂h'
|
|
98
|
+
'ণ': 'ṇ'
|
|
99
|
+
|
|
100
|
+
# Dentals
|
|
101
|
+
'ত': 't'
|
|
102
|
+
'ৎ': 't'
|
|
103
|
+
'থ': 'th'
|
|
104
|
+
'দ': 'd'
|
|
105
|
+
'ধ': 'dh'
|
|
106
|
+
'ন': 'n'
|
|
107
|
+
|
|
108
|
+
# Labials
|
|
109
|
+
'প': 'p'
|
|
110
|
+
'ফ': 'ph'
|
|
111
|
+
'ব': 'b'
|
|
112
|
+
'ভ': 'bh'
|
|
113
|
+
'ম': 'm'
|
|
114
|
+
|
|
115
|
+
# Semivowels
|
|
116
|
+
'য': 'y'
|
|
117
|
+
'য়': 'ẏ'
|
|
118
|
+
'য়': 'ẏ'
|
|
119
|
+
'র': 'r'
|
|
120
|
+
'ল': 'l'
|
|
121
|
+
|
|
122
|
+
# Sibilants
|
|
123
|
+
'শ': 'ś'
|
|
124
|
+
'ষ': 'ṣ'
|
|
125
|
+
'স': 's'
|
|
126
|
+
|
|
127
|
+
|
|
128
|
+
# Aspirate
|
|
129
|
+
'হ': 'h'
|
|
130
|
+
|
|
131
|
+
# Chandrabindu
|
|
132
|
+
'ঁ': 'm'
|
|
133
|
+
|
|
134
|
+
# Bisarga
|
|
135
|
+
'ঃ ': 'ḥ'
|
|
136
|
+
|
|
137
|
+
# Anusvāra
|
|
138
|
+
'ং': 'ṃ'
|
|
139
|
+
|
|
140
|
+
# Medials # Needed for connecting consonants
|
|
141
|
+
|
|
142
|
+
'\u09be': 'ā'
|
|
143
|
+
'\u09bf': 'i'
|
|
144
|
+
'\u09c0': 'ī'
|
|
145
|
+
'\u09c1': 'u'
|
|
146
|
+
'\u09c2': 'ū'
|
|
147
|
+
'\u09c3': 'ṛ'
|
|
148
|
+
'\u09c7': 'ē'
|
|
149
|
+
'\u09c8': 'ai'
|
|
150
|
+
'\u09cb': 'ŏ'
|
|
151
|
+
'\u09cc': 'au'
|
|
152
|
+
'\u09CD': '' # Used for joining
|
|
153
|
+
'्': ''
|
|
154
|
+
'़': ''
|
|
155
|
+
'।': '.'
|
|
156
|
+
"": ''# Used for joining
|