interscript-maps 2.1.0 → 2.3.1
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/interscript-maps.gemspec +1 -1
- data/interscript-maps.yaml +330 -111
- data/maps/acadsin-zho-Hani-Latn-2002.imp +2 -2
- data/maps/alalc-amh-Ethi-Latn-1997.imp +18 -14
- data/maps/alalc-amh-Ethi-Latn-2011.imp +1 -1
- data/maps/alalc-ara-Arab-Latn-1997.imp +1 -1
- data/maps/alalc-asm-Deva-Latn-1997.imp +1 -1
- data/maps/alalc-asm-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-aze-Arab-Latn-1997.imp +1 -1
- data/maps/alalc-aze-Cyrl-Latn-1997.imp +1 -1
- data/maps/alalc-bel-Cyrl-Latn-1997.imp +4 -4
- data/maps/alalc-ben-Beng-Latn-1997.imp +1 -1
- data/maps/alalc-ben-Beng-Latn-2017.imp +1 -1
- data/maps/alalc-bul-Cyrl-Latn-1997.imp +1 -1
- data/maps/alalc-div-Thaa-Latn-1997.imp +1 -1
- data/maps/alalc-div-Thaa-Latn-2012.imp +74 -0
- data/maps/alalc-ell-Grek-Latn-1997.imp +1 -1
- data/maps/alalc-ell-Grek-Latn-2010.imp +1 -1
- data/maps/alalc-guj-Gujr-Latn-1997.imp +1 -1
- data/maps/alalc-guj-Gujr-Latn-2011.imp +1 -1
- data/maps/alalc-hin-Deva-Latn-1997.imp +1 -1
- data/maps/alalc-hin-Deva-Latn-2011.imp +1 -1
- data/maps/alalc-kan-Kana-Latn-1997.imp +1 -1
- data/maps/alalc-kan-Kana-Latn-2011.imp +1 -1
- data/maps/alalc-kat-Geok-Latn-1997.imp +3 -4
- data/maps/alalc-kat-Geok-Latn-2011.imp +31 -0
- data/maps/alalc-kat-Geor-Latn-1997.imp +12 -13
- data/maps/alalc-kat-Geor-Latn-2011.imp +52 -0
- data/maps/alalc-kor-Hang-Latn-1997.imp +1 -1
- data/maps/alalc-mal-Mlym-Latn-1997.imp +1 -1
- data/maps/alalc-mal-Mlym-Latn-2012.imp +1 -1
- data/maps/alalc-mar-Deva-Latn-1997.imp +1 -1
- data/maps/alalc-mar-Deva-Latn-2011.imp +1 -1
- data/maps/alalc-mkd-Cyrl-Latn-1997.imp +2 -2
- data/maps/alalc-mkd-Cyrl-Latn-2013.imp +2 -2
- data/maps/alalc-mon-Cyrl-Latn-1997.imp +3 -3
- data/maps/alalc-ori-Orya-Latn-1997.imp +1 -1
- data/maps/alalc-ori-Orya-Latn-2011.imp +1 -1
- data/maps/alalc-pan-Guru-Latn-1997.imp +1 -1
- data/maps/alalc-pan-Guru-Latn-2011.imp +1 -1
- data/maps/alalc-per-Arab-Latn-1997.imp +1 -1
- data/maps/alalc-pli-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-pra-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-rus-Cyrl-Latn-1997.imp +2 -2
- data/maps/alalc-rus-Cyrl-Latn-2012.imp +1 -1
- data/maps/alalc-san-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-sin-Sinh-Latn-1997.imp +1 -1
- data/maps/alalc-sin-Sinh-Latn-2011.imp +1 -1
- data/maps/alalc-srp-Cyrl-Latn-1997.imp +2 -2
- data/maps/alalc-srp-Cyrl-Latn-2013.imp +1 -1
- data/maps/alalc-tam-Taml-Latn-1997.imp +1 -1
- data/maps/alalc-tam-Taml-Latn-2011.imp +1 -1
- data/maps/alalc-tel-Telu-Latn-1997.imp +2 -2
- data/maps/alalc-tel-Telu-Latn-2011.imp +1 -1
- data/maps/alalc-tir-Ethi-Latn-1997.imp +429 -0
- data/maps/alalc-tir-Ethi-Latn-2011.imp +85 -0
- data/maps/alalc-ukr-Cyrl-Latn-1997.imp +1 -1
- data/maps/alalc-ukr-Cyrl-Latn-2011.imp +1 -1
- data/maps/apcbg-bul-Cyrl-Latn-1995.imp +7 -4
- data/maps/az-aze-Cyrl-Latn-1939.imp +1 -0
- data/maps/az-aze-Cyrl-Latn-1958.imp +1 -0
- data/maps/bas-rus-Cyrl-Latn-2017-bss.imp +1 -1
- data/maps/bas-rus-Cyrl-Latn-2017-oss.imp +1 -1
- data/maps/bgn-jpn-Hrkt-Latn-1962.imp +5 -5
- data/maps/bgn-kor-Hang-Latn-1943.imp +1 -1
- data/maps/bgn-kor-Kore-Latn-1943.imp +1 -1
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +11 -11
- data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +1 -1
- data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +2 -2
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +2 -2
- data/maps/bgnpcgn-bak-Cyrl-Latn-2007.imp +1 -1
- data/maps/bgnpcgn-bel-Cyrl-Latn-1979.imp +4 -1
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +10 -4
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +1 -1
- data/maps/bgnpcgn-che-Cyrl-Latn-2008.imp +2 -1
- data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +1 -1
- data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +4 -4
- data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +1 -1
- data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +1 -1
- data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +1 -1
- data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +4 -3
- data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +1 -1
- data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +1 -1
- data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +2 -2
- data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +1 -1
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +1 -1
- data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +8 -8
- data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +2 -2
- data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +4 -4
- data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +3 -3
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +1 -1
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +5 -5
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +5 -5
- data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +1 -1
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +2 -2
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +1 -1
- data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +3 -3
- data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +4 -4
- data/maps/bgnpcgn-per-Arab-Latn-1958.imp +19 -19
- data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +15 -15
- data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +15 -15
- data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +16 -16
- data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +2 -2
- data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +5 -5
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +1 -1
- data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +1 -1
- data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +5 -3
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +1 -1
- data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +1 -1
- data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +1 -1
- data/maps/bgnpcgn-tir-Ethi-Latn-2007.imp +511 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +1 -1
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +1 -1
- data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +15 -15
- data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +3 -3
- data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +1 -1
- data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +1 -1
- data/maps/bis-asm-Beng-Latn-13194-1991.imp +1 -1
- data/maps/bis-ben-Beng-Latn-13194-1991.imp +1 -1
- data/maps/bis-dev-Deva-Latn-13194-1991.imp +1 -1
- data/maps/bis-guj-Gujr-Latn-13194-1991.imp +1 -1
- data/maps/bis-kan-Kana-Latn-13194-1991.imp +1 -1
- data/maps/bis-mlm-Mlym-Latn-13194-1991.imp +1 -1
- data/maps/bis-ori-Orya-Latn-13194-1991.imp +1 -1
- data/maps/bis-pnj-Guru-Latn-13194-1991.imp +1 -1
- data/maps/bis-tel-Telu-Latn-13194-1991.imp +1 -1
- data/maps/bis-tml-Taml-Latn-13194-1991.imp +1 -1
- data/maps/by-bel-Cyrl-Latn-2007.imp +7 -5
- data/maps/din-hin-Deva-Latn-33904-2018.imp +1 -1
- data/maps/din-kat-Geor-Latn-32707-2010.imp +12 -12
- data/maps/din-mar-Deva-Latn-33904-2018.imp +1 -1
- data/maps/din-nep-Deva-Latn-33904-2018.imp +1 -1
- data/maps/din-pli-Deva-Latn-33904-2018.imp +1 -1
- data/maps/din-pra-Deva-Latn-33904-2018.imp +1 -1
- data/maps/din-san-Deva-Latn-33904-2018.imp +1 -1
- data/maps/dos-nep-Deva-Latn-1997.imp +2 -2
- data/maps/elot-ell-Grek-Latn-743-1982-tl.imp +1 -2
- data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +1 -1
- data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +1 -1
- data/maps/elot-ell-Grek-Latn-743-2001-ts.imp +1 -1
- data/maps/ggg-kat-Geor-Latn-2002.imp +3 -3
- data/maps/gki-bel-Cyrl-Latn-2000.imp +1 -1
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +1 -1
- data/maps/iso-ara-Arab-Latn-233-1984.imp +15 -15
- data/maps/iso-ara-Arab-Latn-233-2-1993.imp +1 -1
- data/maps/iso-asm-Beng-Latn-15919-2001.imp +1 -1
- data/maps/iso-ben-Beng-Latn-15919-2001.imp +1 -1
- data/maps/iso-ell-Grek-Latn-843-1997-t1.imp +1 -1
- data/maps/iso-ell-Grek-Latn-843-1997-t2.imp +1 -1
- data/maps/iso-guj-Gujr-Latn-15919-2001.imp +1 -1
- data/maps/iso-hin-Deva-Latn-15919-2001.imp +1 -1
- data/maps/iso-inc-Deva-Latn-15919-2001.imp +1 -1
- data/maps/iso-jpn-Hrkt-Latn-3602-1989.imp +1 -1
- data/maps/iso-kan-Kana-Latn-15919-2001.imp +1 -1
- data/maps/iso-kat-Geor-Latn-9984-1996.imp +12 -12
- data/maps/iso-kor-Hang-Latn-1996-method1.imp +1 -1
- data/maps/iso-kor-Hang-Latn-1996-method2.imp +1 -1
- data/maps/iso-mal-Mlym-Latn-15919-2001.imp +2 -2
- data/maps/iso-mar-Deva-Latn-15919-2001.imp +1 -1
- data/maps/iso-nep-Deva-Latn-15919-2001.imp +1 -1
- data/maps/iso-ori-Orya-Latn-15919-2001.imp +1 -1
- data/maps/iso-pan-Guru-Latn-15919-2001.imp +1 -1
- data/maps/iso-pli-Beng-Latn-15919-2001.imp +1 -1
- data/maps/iso-pli-Deva-Latn-15919-2001.imp +1 -1
- data/maps/iso-pli-Sinh-Latn-15919-2001.imp +1 -1
- data/maps/iso-pli-Thai-Latn-15919-2001.imp +1 -1
- data/maps/iso-pra-Deva-Latn-15919-2001.imp +1 -1
- data/maps/iso-prs-Arab-Latn-233-3-1999.imp +16 -16
- data/maps/iso-rus-Cyrl-Latn-9-1995.imp +1 -1
- data/maps/iso-san-Deva-Latn-15919-2001.imp +1 -1
- data/maps/iso-tam-Taml-Latn-15919-2001.imp +1 -1
- data/maps/iso-tel-Telu-Latn-15919-2001.imp +1 -1
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +5 -5
- data/maps/mext-jpn-Hrkt-Latn-1954.imp +2 -1
- data/maps/moct-kor-Hang-Latn-2000.imp +1 -1
- data/maps/mofa-jpn-Hrkt-Latn-1989.imp +1 -1
- data/maps/mv-div-Thaa-Latn-1987.imp +1 -1
- data/maps/mvd-bel-Cyrl-Latn-2008.imp +5 -5
- data/maps/mvd-bel-Cyrl-Latn-2010.imp +2 -5
- data/maps/mvd-rus-Cyrl-Latn-2008.imp +4 -3
- data/maps/mvd-rus-Cyrl-Latn-2010.imp +2 -5
- data/maps/odni-ara-Arab-Latn-2004.imp +1 -2
- data/maps/odni-ara-Arab-Latn-2015.imp +2 -2
- data/maps/odni-aze-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-bel-Cyrl-Latn-2015.imp +2 -4
- data/maps/odni-bul-Cyrl-Latn-2005.imp +2 -2
- data/maps/odni-bul-Cyrl-Latn-2015.imp +1 -3
- data/maps/odni-che-Cyrl-Latn-2015.imp +1 -2
- data/maps/odni-fas-Arab-Latn-2004.imp +14 -15
- data/maps/odni-fas-Arab-Latn-2015.imp +17 -17
- data/maps/odni-hin-Deva-Latn-2004.imp +20 -21
- data/maps/odni-hin-Deva-Latn-2015.imp +26 -27
- data/maps/odni-kat-Geor-Latn-2015.imp +3 -5
- data/maps/odni-kaz-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-kir-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-kor-Hang-Latn-2015.imp +2 -2
- data/maps/odni-mkd-Cyrl-Latn-2005.imp +1 -1
- data/maps/odni-mkd-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-prs-Arab-Latn-2004.imp +0 -1
- data/maps/odni-prs-Arab-Latn-2015.imp +2 -2
- data/maps/odni-pus-Arab-Latn-2011.imp +1 -2
- data/maps/odni-rus-Cyrl-Latn-2015.imp +1 -3
- data/maps/odni-srp-Cyrl-Latn-2005.imp +1 -2
- data/maps/odni-srp-Cyrl-Latn-2015.imp +7 -9
- data/maps/odni-tat-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-tgk-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-tuk-Cyrl-Latn-2015.imp +1 -2
- data/maps/odni-uig-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-ukr-Cyrl-Latn-2015.imp +2 -4
- data/maps/odni-urd-Arab-Latn-2015.imp +21 -22
- data/maps/odni-uzb-Cyrl-Latn-2015.imp +1 -3
- data/maps/ses-ara-Arab-Latn-1930.imp +17 -60
- data/maps/un-amh-Ethi-Latn-2016.imp +1 -1
- data/maps/un-ara-Arab-Latn-1971.imp +6 -6
- data/maps/un-ara-Arab-Latn-1972.imp +5 -5
- data/maps/un-ara-Arab-Latn-2017.imp +16 -16
- data/maps/un-asm-Beng-Latn-1972.imp +1 -1
- data/maps/un-bel-Cyrl-Latn-2007.imp +2 -2
- data/maps/un-ben-Beng-Latn-2016.imp +1 -1
- data/maps/un-bul-Cyrl-Latn-1977.imp +197 -0
- data/maps/un-ell-Grek-Latn-1987-phonetic.imp +5 -1
- data/maps/un-ell-Grek-Latn-1987-tl.imp +1 -1
- data/maps/un-ell-Grek-Latn-1987-ts.imp +2 -2
- data/maps/un-guj-Gujr-Latn-1972.imp +1 -1
- data/maps/un-hin-Deva-Latn-2016.imp +2 -2
- data/maps/un-kan-Kana-Latn-2016.imp +2 -2
- data/maps/un-mal-Mlym-Latn-1972.imp +1 -1
- data/maps/un-mar-Deva-Latn-2016.imp +2 -2
- data/maps/un-mkd-Cyrl-Latn-1977.imp +119 -0
- data/maps/un-mon-Mong-Latn-general-2013.imp +1 -1
- data/maps/un-mon-Mong-Latn-phonetic-2013.imp +1 -1
- data/maps/un-nep-Deva-Latn-1972.imp +2 -2
- data/maps/un-nep-Deva-Latn-2013.imp +2 -2
- data/maps/un-ori-Orya-Latn-1972.imp +2 -2
- data/maps/un-pan-Guru-Latn-1972.imp +1 -1
- data/maps/un-prs-Arab-Latn-1967.imp +15 -15
- data/maps/un-rus-Cyrl-Latn-1987.imp +2 -2
- data/maps/un-sin-Sinh-Latn-1972.imp +16 -4
- data/maps/un-srp-Cyrl-Latn-1997.imp +47 -0
- data/maps/un-tam-Taml-Latn-1972.imp +1 -1
- data/maps/un-tel-Telu-Latn-1972.imp +1 -1
- data/maps/un-ukr-Cyrl-Latn-1998.imp +1 -1
- data/maps/un-ukr-Cyrl-Latn-2012.imp +1 -1
- data/maps/un-urd-Arab-Latn-1972.imp +16 -16
- data/maps/var-amh-Ethi-Latn-eae-2003.imp +48 -43
- data/maps/var-ara-Arab-Arab-rababa.imp +25 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1886.imp +1 -1
- data/maps/var-jpn-Hrkt-Latn-hepburn-1954.imp +1 -1
- data/maps/var-kor-Hang-Latn-mr-1939.imp +1 -1
- data/maps/var-kor-Kore-Latn-mr-1939.imp +1 -1
- data/maps/var-mar-Deva-Latn-hunterian-1872.imp +0 -1
- data/maps/var-mon-Mong-Latn-1930.imp +1 -1
- data/maps/var-mon-Mong-Latn-lessing.imp +2 -2
- data/maps/var-mon-Mong-Latn-vpmc.imp +2 -2
- data/maps/var-pra-Deva-Latn-iast-1912.imp +1 -1
- data/maps/var-san-Deva-Latn-iast-1912.imp +1 -1
- metadata +11 -1
@@ -5,7 +5,7 @@ metadata {
|
|
5
5
|
# prs stands for Dari (https://iso639-3.sil.org/code/prs&_ga=GA1.2.2054538372.1574092823)
|
6
6
|
source_script: Arab
|
7
7
|
destination_script: Latn
|
8
|
-
name:
|
8
|
+
name: National Romanization System for Afghanistan -- Yaghoubi (2007)
|
9
9
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/693661/ROMANIZATION_FOR_AFGHANISTAN.pdf
|
10
10
|
creation_date: 2007
|
11
11
|
confirmation_date: 2017-11
|
@@ -379,20 +379,20 @@ stage {
|
|
379
379
|
|
380
380
|
|
381
381
|
# Sun letters
|
382
|
-
sub boundary + "\u0627\u0644\u062a", "at̄ t̄" # الت
|
383
|
-
sub boundary + "\u0627\u0644\u062b", "as̄ s̄" # الث
|
384
|
-
sub boundary + "\u0627\u0644\u062f", "aḏ ḏ" # الد
|
385
|
-
sub boundary + "\u0627\u0644\u0630", "az̄ z̄" # الذ
|
386
|
-
sub boundary + "\u0627\u0644\u0631", "aṟ ṟ" # الر
|
387
|
-
sub boundary + "\u0627\u0644\u0632", "az z" # الز
|
388
|
-
sub boundary + "\u0627\u0644\u0633", "as s" # الس
|
389
|
-
sub boundary + "\u0627\u0644\u0634", "aš š" # الش
|
390
|
-
sub boundary + "\u0627\u0644\u0635", "as̱ s̱" # الص
|
391
|
-
sub boundary + "\u0627\u0644\u0636", "ad͟z d͟z" # الض
|
392
|
-
sub boundary + "\u0627\u0644\u0637", "aṯ ṯ" # الط
|
393
|
-
sub boundary + "\u0627\u0644\u0638", "aẕ ẕ" # الظ
|
394
|
-
sub boundary + "\u0627\u0644\u0644", "al l" # الل
|
395
|
-
sub boundary + "\u0627\u0644\u0646", "an n" # الن
|
382
|
+
sub boundary + "\u0627\u0644\u062a" + maybe("\u0651"), "at̄ t̄" # الت
|
383
|
+
sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), "as̄ s̄" # الث
|
384
|
+
sub boundary + "\u0627\u0644\u062f" + maybe("\u0651"), "aḏ ḏ" # الد
|
385
|
+
sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), "az̄ z̄" # الذ
|
386
|
+
sub boundary + "\u0627\u0644\u0631" + maybe("\u0651"), "aṟ ṟ" # الر
|
387
|
+
sub boundary + "\u0627\u0644\u0632" + maybe("\u0651"), "az z" # الز
|
388
|
+
sub boundary + "\u0627\u0644\u0633" + maybe("\u0651"), "as s" # الس
|
389
|
+
sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "aš š" # الش
|
390
|
+
sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "as̱ s̱" # الص
|
391
|
+
sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "ad͟z d͟z" # الض
|
392
|
+
sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "aṯ ṯ" # الط
|
393
|
+
sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), "aẕ ẕ" # الظ
|
394
|
+
sub boundary + "\u0627\u0644\u0644" + maybe("\u0651"), "al l" # الل
|
395
|
+
sub boundary + "\u0627\u0644\u0646" + maybe("\u0651"), "an n" # الن
|
396
396
|
|
397
397
|
# consonant characters
|
398
398
|
|
@@ -1,10 +1,10 @@
|
|
1
1
|
metadata {
|
2
2
|
authority_id: bgnpcgn
|
3
|
-
id:
|
3
|
+
id: 1968
|
4
4
|
language: iso-639-3:prs
|
5
5
|
source_script: Arab
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Pashto (1968)
|
8
8
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/693760/ROMANIZATION_OF_PASHTO.pdf
|
9
9
|
creation_date: 1968
|
10
10
|
confirmation_date: 2017-11
|
@@ -248,20 +248,20 @@ stage {
|
|
248
248
|
sub "\u0659", "ê"
|
249
249
|
|
250
250
|
# Sun letters
|
251
|
-
sub boundary + "\u0627\u0644\u062a", "ut t" # الت
|
252
|
-
sub boundary + "\u0627\u0644\u062b", "us̄ s̄" # الث
|
253
|
-
sub boundary + "\u0627\u0644\u062f", "ud d" # الد
|
254
|
-
sub boundary + "\u0627\u0644\u0630", "uz̄ z̄" # الذ
|
255
|
-
sub boundary + "\u0627\u0644\u0631", "ur r" # الر
|
256
|
-
sub boundary + "\u0627\u0644\u0632", "uz z" # الز
|
257
|
-
sub boundary + "\u0627\u0644\u0633", "us s" # الس
|
258
|
-
sub boundary + "\u0627\u0644\u0634", "ush sh" # الش
|
259
|
-
sub boundary + "\u0627\u0644\u0635", "uş ş" # الص
|
260
|
-
sub boundary + "\u0627\u0644\u0636", "uẕ ẕ" # الض
|
261
|
-
sub boundary + "\u0627\u0644\u0637", "uţ ţ" # الط
|
262
|
-
sub boundary + "\u0627\u0644\u0638", "uz̧ z̧" # الظ
|
263
|
-
sub boundary + "\u0627\u0644\u0644", "ul l" # الل
|
264
|
-
sub boundary + "\u0627\u0644\u0646", "un n" # الن
|
251
|
+
sub boundary + "\u0627\u0644\u062a" + maybe("\u0651"), "ut t" # الت
|
252
|
+
sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), "us̄ s̄" # الث
|
253
|
+
sub boundary + "\u0627\u0644\u062f" + maybe("\u0651"), "ud d" # الد
|
254
|
+
sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), "uz̄ z̄" # الذ
|
255
|
+
sub boundary + "\u0627\u0644\u0631" + maybe("\u0651"), "ur r" # الر
|
256
|
+
sub boundary + "\u0627\u0644\u0632" + maybe("\u0651"), "uz z" # الز
|
257
|
+
sub boundary + "\u0627\u0644\u0633" + maybe("\u0651"), "us s" # الس
|
258
|
+
sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "ush sh" # الش
|
259
|
+
sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "uş ş" # الص
|
260
|
+
sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "uẕ ẕ" # الض
|
261
|
+
sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "uţ ţ" # الط
|
262
|
+
sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), "uz̧ z̧" # الظ
|
263
|
+
sub boundary + "\u0627\u0644\u0644" + maybe("\u0651"), "ul l" # الل
|
264
|
+
sub boundary + "\u0627\u0644\u0646" + maybe("\u0651"), "un n" # الن
|
265
265
|
|
266
266
|
sub "\u0626", "êy" # ئ
|
267
267
|
}
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:ron
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Table of Correspondences for Moldovan (Cyrillic-Roman) (2002 Agreement)
|
8
8
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/816780/TABLE_OF_CORRESPONDENCES_FOR_MOLDOVAN.pdf
|
9
9
|
creation_date: 2002
|
10
10
|
confirmation_date: 2019
|
@@ -14,7 +14,7 @@ metadata {
|
|
14
14
|
and the current Roman alphabet. When Moldovan Roman-alphabet spellings are not available, this table
|
15
15
|
can be used to convert Moldovan Cyrillic spellings. It should be noted that Moldovan is little used as a
|
16
16
|
language label now, and is usually considered as Romanian.
|
17
|
-
|
17
|
+
|
18
18
|
notes:
|
19
19
|
- | # 1
|
20
20
|
This Roman-script form is used before e, i and iu.
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:rue
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Rusyn (2016)
|
8
8
|
url: https://geonames.nga.mil/gns/html/Romanization/ROMANIZATION%20OF%20RUSYN.pdf
|
9
9
|
creation_date: 2016
|
10
10
|
confirmation_date: 2017
|
@@ -14,17 +14,17 @@ metadata {
|
|
14
14
|
The Rusyn alphabet is almost identical to the Ukrainian alphabet, but contains three characters not
|
15
15
|
present in the Ukrainian alphabet: ё, ы, and ъ. These letters are also absent from the alphabet used by
|
16
16
|
Pannonian Rusyn. This table applies to both dialects of Rusyn.
|
17
|
-
|
17
|
+
|
18
18
|
notes:
|
19
19
|
- |
|
20
20
|
The letters ё, ы, and ъ are present in the orthography of the Carpatho‐Rusyn variant of the Rusyn
|
21
21
|
language. This variant is predominant among Rusyn speakers in Ukraine, Poland, Slovakia, Hungary, and
|
22
22
|
Romania. The letters are absent from the orthography of Pannonian Rusyn, which is predominant in
|
23
23
|
Serbia and Croatia.
|
24
|
-
|
24
|
+
|
25
25
|
- |
|
26
26
|
Unicode for Latin‐script characters: Ž/ž (017D, 017E); Č/č (010C, 010D); Š/š (0160, 0161); ’ (0027).
|
27
|
-
|
27
|
+
|
28
28
|
- |
|
29
29
|
The Romanization columns show only lowercase forms but, when romanizing, uppercase and
|
30
30
|
lowercase Roman letters as appropriate should be used.
|
@@ -91,7 +91,7 @@ stage {
|
|
91
91
|
sub "Я", "Ya" # Я
|
92
92
|
sub "Ь", "'" # Ь => '
|
93
93
|
sub "Ъ", "'" # Ъ => '
|
94
|
-
|
94
|
+
|
95
95
|
sub "а", "a" # а
|
96
96
|
sub "б", "b" # б
|
97
97
|
sub "в", "v" # в
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:rus
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Russian (1947)
|
8
8
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/807920/ROMANIZATION_OF_RUSSIAN.pdf
|
9
9
|
creation_date: 1947
|
10
10
|
confirmation_date: 2019-06
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:sme
|
5
5
|
source_script: Latn
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Roman-Script Spelling Convention of Northern Sami (North Lappish) (1984 Agreement)
|
8
8
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/693794/ROMAN-SCRIPT_SPELLING_CONVENTIONS.pdf
|
9
9
|
creation_date: 1984
|
10
10
|
|
@@ -4,15 +4,17 @@ metadata {
|
|
4
4
|
language: iso-639-2:srp
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Transliteration of Serbian Cyrillic
|
8
8
|
creation_date: 1962
|
9
9
|
confirmation_date: 1962
|
10
10
|
description: |
|
11
11
|
Serbo-Croatian, the official national language of Yugoslavia, is a single literary language.
|
12
|
+
|
12
13
|
In Serbian areas it is written in the cyrillic (Serbian) alphabet, while in Croatian areas it is
|
13
14
|
written in the roman (Croatian) alphabet.
|
14
|
-
|
15
|
-
|
15
|
+
|
16
|
+
Both the BGN and PCGN use the standard Croatian equivalents for formalizing the Serbian cyrillic
|
17
|
+
alphabet whenever romanized names are not available.
|
16
18
|
|
17
19
|
notes:
|
18
20
|
- The digraph dj(Dj) will occasionally be found as the Croatian equivalent of ђ(Ђ),
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:srp
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Table of Correspondences for Serbian (Cyrillic-Roman) (2005 Agreement)
|
8
8
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/816783/TABLE_OF_CORRESPONDENCES_FOR_SERBIAN.pdf
|
9
9
|
creation_date: 2005
|
10
10
|
confirmation_date: 2019-06
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:tat
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Table of Correspondences for Tatar (Cyrillic-Roman) (2007 Agreement)
|
8
8
|
url: https://geonames.nga.mil/gns/html/Romanization/TABLE%20OF%20CORRESPONDENCES%20FOR%20TATAR.pdf
|
9
9
|
creation_date: 2007
|
10
10
|
confirmation_date: 2017-11
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:tgk
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Tajik (1994)
|
8
8
|
url: https://geonames.nga.mil/gns/html/Romanization/ROMANIZATION%20OF%20TAJIK.pdf
|
9
9
|
creation_date: 1994
|
10
10
|
confirmation_date: 2017-11
|
@@ -0,0 +1,511 @@
|
|
1
|
+
metadata {
|
2
|
+
authority_id: bgnpcgn
|
3
|
+
id: 2007
|
4
|
+
language: iso-639-2:tir
|
5
|
+
source_script: Ethi
|
6
|
+
destination_script: Latn
|
7
|
+
name: Romanization of Tigrinya (2007)
|
8
|
+
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/693783/ROMANIZATION_OF_TIGRINYA.pdf
|
9
|
+
creation_date: 2007
|
10
|
+
description: |
|
11
|
+
The BGN/PCGN system for Tigrinya is designed for use in romanizing
|
12
|
+
geographical names written in Tigrinya (Ge’ez) characters. The Roman letters
|
13
|
+
and letter combinations shown as equivalents to the Tigrinya characters
|
14
|
+
reflect modern Tigrinya pronunciation, while taking into account some
|
15
|
+
conscious archaisms based on Ge’ez and liturgical practices.
|
16
|
+
|
17
|
+
notes:
|
18
|
+
- |
|
19
|
+
Where consonant character sequences give rise to the romanizations
|
20
|
+
k-h, n-y, z-h and s-h, a hyphen may be added between them to differentiate
|
21
|
+
those romanizations from the digraphs kh, ny, zh and sh.
|
22
|
+
|
23
|
+
- |
|
24
|
+
Where possible, consonant gemination should be reflected. Though not
|
25
|
+
evident from the Ge’ez script, this may be ascertained from a reference
|
26
|
+
source, such as the Tigrinya-English dictionary, Thomas Leiper Kane,
|
27
|
+
Dunwoody Press, Springfield, VA, 2000.
|
28
|
+
|
29
|
+
- |
|
30
|
+
An inventory of letter-diacritic combinations, with their Unicode
|
31
|
+
encoding, in addition to the unmodified letters of the basic Roman script
|
32
|
+
is:
|
33
|
+
All apostrophes appearing in romanization are U+2019, except as they
|
34
|
+
appear in row 21, which are U+2018.
|
35
|
+
Ĭ (U+012C) ĭ (U+012D)
|
36
|
+
Ḥ (U+0048+0323) ḥ (U+0068+0323)
|
37
|
+
|
38
|
+
- |
|
39
|
+
The Romanization column shows only lowercase forms but, when
|
40
|
+
romanizing, uppercase and lowercase Roman letters as appropriate should be
|
41
|
+
used.
|
42
|
+
|
43
|
+
- |
|
44
|
+
Table footnote 1. The 6th-order characters should be romanized either with
|
45
|
+
or without the letter ĭ, depending on pronunciation.
|
46
|
+
|
47
|
+
- |
|
48
|
+
Table footnote 2. Forms of the consonant character ሠ are understood to be
|
49
|
+
becoming obsolete in Tigrinya.
|
50
|
+
|
51
|
+
- |
|
52
|
+
Table footnote 3. The vowel characters in row 17 should be romanized with
|
53
|
+
the apostrophe unless appearing as a word-initial.
|
54
|
+
|
55
|
+
- |
|
56
|
+
Table footnote 4. Forms of the character አ are understood to be falling into
|
57
|
+
disuse in Tigrinya.
|
58
|
+
}
|
59
|
+
|
60
|
+
tests {
|
61
|
+
test "የዜግነት ክብር በ ኢትዮጵያችን ጸንቶ", "yeziegĭnetĭ kĭbĭrĭ be ’itĭyop’ĭyachĭnĭ ts’enĭto"
|
62
|
+
test "ታየ ሕዝባዊነት ዳር እስከዳር በርቶ", "taye ḥĭzĭbawinetĭ darĭ ’ĭsĭkedarĭ berĭto"
|
63
|
+
test "ለሰላም ለፍትህ ለሕዝቦች ነጻነት", "leselamĭ lefĭtĭhĭ leḥĭzĭbochĭ nets’anetĭ"
|
64
|
+
test "በእኩልነት በፍቅር ቆመናል ባንድነት", "be’ĭkulĭnetĭ befĭk’ĭrĭ k’omenalĭ banĭdĭnetĭ"
|
65
|
+
test "መሠረተ ፅኑ ሰብዕናን ያልሻርን", "meserete ts’ĭnu sebĭ‘ĭnanĭ yalĭsharĭnĭ"
|
66
|
+
test "ሕዝቦች ነን ለሥራ በሥራ የኖርን", "ḥĭzĭbochĭ nenĭ lesĭra besĭra yenorĭnĭ"
|
67
|
+
test "ድንቅ የባህል መድረክ ያኩሪ ቅርስ ባለቤት", "dĭnĭk’ĭ yebahĭlĭ medĭrekĭ yakuri k’ĭrĭsĭ balebietĭ"
|
68
|
+
test "የተፈጥሮ ጸጋ የጀግና ሕዝብ እናት", "yetefet’ĭro ts’ega yejegĭna ḥĭzĭbĭ ’ĭnatĭ"
|
69
|
+
test "እንጠብቅሻለን አለብን አደራ", "’ĭnĭt’ebĭk’ĭshalenĭ ’elebĭnĭ ’edera"
|
70
|
+
test "ኢትዮጵያችን ኑሪ እኛም ባንቺ እንኩራ", "’itĭyop’ĭyachĭnĭ nuri ’ĭnyamĭ banĭchi ’ĭnĭkura"
|
71
|
+
test "ቋንቋ የድምጽ, የምልክት ወይም የምስል ቅንብር ሆኖ", "k’wanĭk’wa yedĭmĭts’ĭ, yemĭlĭkĭtĭ weyĭmĭ yemĭsĭlĭ k’ĭnĭbĭrĭ hono"
|
72
|
+
test "ለማሰብ ወይም የታሰበን ሃሳብ ለሌላ ለማስተላለፍ የሚረዳ መሳሪያ ነው", "lemasebĭ weyĭmĭ yetasebenĭ hasabĭ leliela lemasĭtelalefĭ yemireda mesariya newĭ"
|
73
|
+
test "በአጭሩ ቋንቋ የምልክቶች ስርዓትና እኒህን ምልክቶች ለማቀናበር", "be’ech’ĭru k’wanĭk’wa yemĭlĭkĭtochĭ sĭrĭ‘atĭna ’ĭnihĭnĭ mĭlĭkĭtochĭ lemak’enaberĭ"
|
74
|
+
test "የሚያስፈልጉ ህጎች ጥንቅር ነው. ቋንቋወችን ለመፈረጅ እንዲሁም", "yemiyasĭfelĭgu hĭgochĭ t’ĭnĭk’ĭrĭ newĭ. k’wanĭk’wawechĭnĭ lemeferejĭ ’ĭnĭdihumĭ"
|
75
|
+
test "ለምክፈል የሚያስችሉ መስፈርቶችን ለማስቀመጥ ባለው ችግር", "lemĭkĭfelĭ yemiyasĭchĭlu mesĭferĭtochĭnĭ lemasĭk’emet’ĭ balewĭ chĭgĭrĭ"
|
76
|
+
test "ምክንያት በአሁኑ ሰዓት በርግጠኝነት ስንት ቋንቋ በዓለም ላይ", "mĭkĭnĭyatĭ be’ehunu se‘atĭ berĭgĭt’enyĭnetĭ sĭnĭtĭ k’wanĭk’wa be‘alemĭ layĭ"
|
77
|
+
test "እንዳለ ማወቅ አስቸጋሪ ነው", "’ĭnĭdale mawek’ĭ ’esĭchegari newĭ"
|
78
|
+
test "አሰላ", "’esela"
|
79
|
+
test "አሶሳ", "’esosa"
|
80
|
+
test "አንኮበር", "’enĭkoberĭ"
|
81
|
+
test "አክሱም", "’ekĭsumĭ"
|
82
|
+
test "አዋሳ", "’ewasa"
|
83
|
+
test "አዲስ ዘመን (ከተማ)", "’edisĭ zemenĭ (ketema)"
|
84
|
+
test "አዲግራት", "’edigĭratĭ"
|
85
|
+
test "አዳማ", "’edama"
|
86
|
+
test "ደምበጫ", "demĭbech’a"
|
87
|
+
test "ደርባ", "derĭba"
|
88
|
+
test "ደብረ ማርቆስ", "debĭre marĭk’osĭ"
|
89
|
+
test "ደብረ ብርሃን", "debĭre bĭrĭhanĭ"
|
90
|
+
test "ደብረ ታቦር (ከተማ)", "debĭre taborĭ (ketema)"
|
91
|
+
test "ደብረ ዘይት", "debĭre zeyĭtĭ"
|
92
|
+
test "ደገሃቡር", "degehaburĭ"
|
93
|
+
test "ወልቂጤ", "welĭk’it’ie"
|
94
|
+
test "ወልወል", "welĭwelĭ"
|
95
|
+
test "ወልደያ", "welĭdeya"
|
96
|
+
test "ናይሎ ሳህራን", "nayĭlo sahĭranĭ"
|
97
|
+
test "አኙዋክኛ", "’enyuwakĭnya"
|
98
|
+
test "ኡዱክኛ", "’udukĭnya"
|
99
|
+
test "ኦፓኛ", "’opanya"
|
100
|
+
test "ጉምዝኛ", "gumĭzĭnya"
|
101
|
+
test "አፋርኛ", "’efarĭnya"
|
102
|
+
test "አላባኛ", "’elabanya"
|
103
|
+
test "አርቦርኛ", "’erĭborĭnya"
|
104
|
+
test "ባይሶኛ", "bayĭsonya"
|
105
|
+
test "ቡሳኛ", "busanya"
|
106
|
+
test "ሁለተኛ ጥፋት ከገበያ ማንቀላፋት", "huletenya t’ĭfatĭ kegebeya manĭk’elafatĭ"
|
107
|
+
test "ሁሉም ከልኩ አያልፍም", "hulumĭ kelĭku ’eyalĭfĭmĭ"
|
108
|
+
test "አልሞት ባይ ተጋዳይ", "’elĭmotĭ bayĭ tegadayĭ"
|
109
|
+
test "ውርድ ከራሴ", "wĭrĭdĭ kerasie"
|
110
|
+
test "ፀጉር መሰንጠቅ", "ts’egurĭ mesenĭt’ek’ĭ"
|
111
|
+
test "ግንትር ፀሐይ", "gĭnĭtĭrĭ ts’eḥeyĭ"
|
112
|
+
test "በሬ ወለደ", "berie welede"
|
113
|
+
test "ራስ ሳይጠና ጉተና", "rasĭ sayĭt’ena gutena"
|
114
|
+
test "ለሆዴ ጠግቤ በልብሴ አንግቤ", "lehodie t’egĭbie belĭbĭsie ’enĭgĭbie"
|
115
|
+
test "ለልጅ ከሳቁለት ለውሻ ከሮጡለት", "lelĭjĭ kesak’uletĭ lewĭsha kerot’uletĭ"
|
116
|
+
test "መልካም ባል መጥፎ ሴት ይገራል", "melĭkamĭ balĭ met’ĭfo sietĭ yĭgeralĭ"
|
117
|
+
test "ሆድና ግንባር አይሸሸግም", "hodĭna gĭnĭbarĭ ’eyĭsheshegĭmĭ"
|
118
|
+
test "ቀሊል አማት ሲሶ በትር አላት", "k’elilĭ ’ematĭ siso betĭrĭ ’elatĭ"
|
119
|
+
test "ጨው ለራስህ ብለህ ጣፍጥ አለበለዚያ ድንጋይ ነው ብለው ይወረውሩሀል", "ch’ewĭ lerasĭhĭ bĭlehĭ t’afĭt’ĭ ’elebeleziya dĭnĭgayĭ newĭ bĭlewĭ yĭwerewĭruhelĭ"
|
120
|
+
test "ጀምሮ ይጨርሳል አልሞ ይተኩሳል", "jemĭro yĭch’erĭsalĭ ’elĭmo yĭtekusalĭ"
|
121
|
+
}
|
122
|
+
|
123
|
+
stage {
|
124
|
+
|
125
|
+
# CHARACTERS
|
126
|
+
parallel {
|
127
|
+
sub "\u1200", "he" # ሀ
|
128
|
+
sub "\u1201", "hu" # ሁ
|
129
|
+
sub "\u1202", "hi" # ሂ
|
130
|
+
sub "\u1203", "ha" # ሃ
|
131
|
+
sub "\u1204", "hie" # ሄ
|
132
|
+
sub "\u1205", any(["hĭ", "h"]) # ህ
|
133
|
+
sub "\u1206", "ho" # ሆ
|
134
|
+
|
135
|
+
sub "\u1208", "le" # ለ
|
136
|
+
sub "\u1209", "lu" # ሉ
|
137
|
+
sub "\u120A", "li" # ሊ
|
138
|
+
sub "\u120B", "la" # ላ
|
139
|
+
sub "\u120C", "lie" # ሌ
|
140
|
+
sub "\u120D", any(["lĭ", "l"]) # ል
|
141
|
+
sub "\u120E", "lo" # ሎ
|
142
|
+
|
143
|
+
sub "\u1210", "ḥe" # ሐ
|
144
|
+
sub "\u1211", "ḥu" # ሑ
|
145
|
+
sub "\u1212", "ḥi" # ሒ
|
146
|
+
sub "\u1213", "ḥa" # ሓ
|
147
|
+
sub "\u1214", "ḥie" # ሔ
|
148
|
+
sub "\u1215", any(["ḥĭ", "ḥ"]) # ሕ
|
149
|
+
sub "\u1216", "ḥo" # ሖ
|
150
|
+
|
151
|
+
sub "\u1218", "me" # መ
|
152
|
+
sub "\u1219", "mu" # ሙ
|
153
|
+
sub "\u121A", "mi" # ሚ
|
154
|
+
sub "\u121B", "ma" # ማ
|
155
|
+
sub "\u121C", "mie" # ሜ
|
156
|
+
sub "\u121D", any(["mĭ", "m"]) # ም
|
157
|
+
sub "\u121E", "mo" # ሞ
|
158
|
+
|
159
|
+
# TODO: NOTE 2:
|
160
|
+
# Where possible, consonant gemination should be reflected. Though not
|
161
|
+
# evident from the Ge’ez script, this may be ascertained from a reference
|
162
|
+
# source, such as the Tigrinya-English dictionary, Thomas Leiper Kane,
|
163
|
+
# Dunwoody Press, Springfield, VA, 2000.
|
164
|
+
sub "\u1220", "se" # ሠ
|
165
|
+
sub "\u1221", "su" # ሡ
|
166
|
+
sub "\u1222", "si" # ሢ
|
167
|
+
sub "\u1223", "sa" # ሣ
|
168
|
+
sub "\u1224", "sie" # ሤ
|
169
|
+
sub "\u1225", any(["sĭ", "s"]) # ሥ
|
170
|
+
sub "\u1226", "so" # ሦ
|
171
|
+
|
172
|
+
sub "\u1228", "re" # ረ
|
173
|
+
sub "\u1229", "ru" # ሩ
|
174
|
+
sub "\u122A", "ri" # ሪ
|
175
|
+
sub "\u122B", "ra" # ራ
|
176
|
+
sub "\u122C", "rie" # ሬ
|
177
|
+
sub "\u122D", any(["rĭ", "r"]) # ር
|
178
|
+
sub "\u122E", "ro" # ሮ
|
179
|
+
|
180
|
+
sub "\u1230", "se" # ሰ
|
181
|
+
sub "\u1231", "su" # ሱ
|
182
|
+
sub "\u1232", "si" # ሲ
|
183
|
+
sub "\u1233", "sa" # ሳ
|
184
|
+
sub "\u1234", "sie" # ሴ
|
185
|
+
sub "\u1235", any(["sĭ", "s"]) # ስ
|
186
|
+
sub "\u1236", "so" # ሶ
|
187
|
+
|
188
|
+
sub "\u1238", "she" # ሸ
|
189
|
+
sub "\u1239", "shu" # ሹ
|
190
|
+
sub "\u123A", "shi" # ሺ
|
191
|
+
sub "\u123B", "sha" # ሻ
|
192
|
+
sub "\u123C", "shie" # ሼ
|
193
|
+
sub "\u123D", any(["shĭ", "sh"]) # ሽ
|
194
|
+
sub "\u123E", "sho" # ሾ
|
195
|
+
|
196
|
+
sub "\u1240", "k’e" # ቀ
|
197
|
+
sub "\u1241", "k’u" # ቁ
|
198
|
+
sub "\u1242", "k’i" # ቂ
|
199
|
+
sub "\u1243", "k’a" # ቃ
|
200
|
+
sub "\u1244", "k’ie" # ቄ
|
201
|
+
sub "\u1245", any(["k’ĭ", "k’"]) # ቅ
|
202
|
+
sub "\u1246", "k’o" # ቆ
|
203
|
+
|
204
|
+
sub "\u1250", "kh’e" # ቐ
|
205
|
+
sub "\u1251", "kh’u" # ቑ
|
206
|
+
sub "\u1252", "kh’i" # ቒ
|
207
|
+
sub "\u1253", "kh’a" # ቓ
|
208
|
+
sub "\u1254", "kh’ie" # ቔ
|
209
|
+
sub "\u1255", any(["kh’ĭ", "kh’"]) # ቕ
|
210
|
+
sub "\u1256", "kh’o" # ቖ
|
211
|
+
|
212
|
+
sub "\u1260", "be" # በ
|
213
|
+
sub "\u1261", "bu" # ቡ
|
214
|
+
sub "\u1262", "bi" # ቢ
|
215
|
+
sub "\u1263", "ba" # ባ
|
216
|
+
sub "\u1264", "bie" # ቤ
|
217
|
+
sub "\u1265", any(["bĭ", "b"]) # ብ
|
218
|
+
sub "\u1266", "bo" # ቦ
|
219
|
+
|
220
|
+
sub "\u1270", "te" # ተ
|
221
|
+
sub "\u1271", "tu" # ቱ
|
222
|
+
sub "\u1272", "ti" # ቲ
|
223
|
+
sub "\u1273", "ta" # ታ
|
224
|
+
sub "\u1274", "tie" # ቴ
|
225
|
+
sub "\u1275", any(["tĭ", "t"]) # ት
|
226
|
+
sub "\u1276", "to" # ቶ
|
227
|
+
|
228
|
+
sub "\u1278", "che" # ቸ
|
229
|
+
sub "\u1279", "chu" # ቹ
|
230
|
+
sub "\u127A", "chi" # ቺ
|
231
|
+
sub "\u127B", "cha" # ቻ
|
232
|
+
sub "\u127C", "chie" # ቼ
|
233
|
+
sub "\u127D", any(["chĭ", "ch"]) # ች
|
234
|
+
sub "\u127E", "cho" # ቾ
|
235
|
+
|
236
|
+
sub "\u1280", "ḥe" # ኀ
|
237
|
+
sub "\u1281", "ḥu" # ኁ
|
238
|
+
sub "\u1282", "ḥi" # ኂ
|
239
|
+
sub "\u1283", "ḥa" # ኃ
|
240
|
+
sub "\u1284", "ḥie" # ኄ
|
241
|
+
sub "\u1285", any(["ḥĭ", "ḥ"]) # ኅ
|
242
|
+
sub "\u1286", "ḥo" # ኆ
|
243
|
+
|
244
|
+
sub "\u1290", "ne" # ነ
|
245
|
+
sub "\u1291", "nu" # ኑ
|
246
|
+
sub "\u1292", "ni" # ኒ
|
247
|
+
sub "\u1293", "na" # ና
|
248
|
+
sub "\u1294", "nie" # ኔ
|
249
|
+
sub "\u1295", any(["nĭ", "n"]) # ን
|
250
|
+
sub "\u1296", "no" # ኖ
|
251
|
+
|
252
|
+
sub "\u1298", "nye" # ኘ
|
253
|
+
sub "\u1299", "nyu" # ኙ
|
254
|
+
sub "\u129A", "nyi" # ኚ
|
255
|
+
sub "\u129B", "nya" # ኛ
|
256
|
+
sub "\u129C", "nyie" # ኜ
|
257
|
+
sub "\u129D", any(["nyĭ", "ny"]) # ኝ
|
258
|
+
sub "\u129E", "nyo" # ኞ
|
259
|
+
|
260
|
+
# NOTE 3 The vowel characters in row 17 should be romanized with the
|
261
|
+
# apostrophe unless appearing as a word-initial.
|
262
|
+
# NOTE 4 Forms of the character አ are understood to be falling into disuse
|
263
|
+
# in Tigrinya.
|
264
|
+
sub "\u12A0", "’e" # አ
|
265
|
+
sub "\u12A1", "’u" # ኡ
|
266
|
+
sub "\u12A2", "’i" # ኢ
|
267
|
+
sub "\u12A3", "’a" # ኣ
|
268
|
+
sub "\u12A4", "’ie" # ኤ
|
269
|
+
sub "\u12A5", any(["’ĭ", "ĭ"]) # እ
|
270
|
+
sub "\u12A6", "’o" # ኦ
|
271
|
+
|
272
|
+
sub "\u12A8", "ke" # ከ
|
273
|
+
sub "\u12A9", "ku" # ኩ
|
274
|
+
sub "\u12AA", "ki" # ኪ
|
275
|
+
sub "\u12AB", "ka" # ካ
|
276
|
+
sub "\u12AC", "kie" # ኬ
|
277
|
+
sub "\u12AD", any(["kĭ", "k"]) # ክ
|
278
|
+
sub "\u12AE", "ko" # ኮ
|
279
|
+
|
280
|
+
sub "\u12B8", "khe" # ኸ
|
281
|
+
sub "\u12B9", "khu" # ኹ
|
282
|
+
sub "\u12BA", "khi" # ኺ
|
283
|
+
sub "\u12BB", "kha" # ኻ
|
284
|
+
sub "\u12BC", "khie" # ኼ
|
285
|
+
sub "\u12BD", any(["khĭ", "kh"]) # ኽ
|
286
|
+
sub "\u12BE", "kho" # ኾ
|
287
|
+
|
288
|
+
sub "\u12C8", "we" # ወ
|
289
|
+
sub "\u12C9", "wu" # ዉ
|
290
|
+
sub "\u12CA", "wi" # ዊ
|
291
|
+
sub "\u12CB", "wa" # ዋ
|
292
|
+
sub "\u12CC", "wie" # ዌ
|
293
|
+
sub "\u12CD", any(["wĭ", "w"]) # ው
|
294
|
+
sub "\u12CE", "wo" # ዎ
|
295
|
+
|
296
|
+
sub "\u12D0", "‘e" # ዐ
|
297
|
+
sub "\u12D1", "‘u" # ዑ
|
298
|
+
sub "\u12D2", "‘i" # ዒ
|
299
|
+
sub "\u12D3", "‘a" # ዓ
|
300
|
+
sub "\u12D4", "‘ie" # ዔ
|
301
|
+
sub "\u12D5", any(["‘ĭ", "‘"]) # ዕ
|
302
|
+
sub "\u12D6", "‘o" # ዖ
|
303
|
+
|
304
|
+
sub "\u12D8", "ze" # ዘ
|
305
|
+
sub "\u12D9", "zu" # ዙ
|
306
|
+
sub "\u12DA", "zi" # ዚ
|
307
|
+
sub "\u12DB", "za" # ዛ
|
308
|
+
sub "\u12DC", "zie" # ዜ
|
309
|
+
sub "\u12DD", any(["zĭ", "z"]) # ዝ
|
310
|
+
sub "\u12DE", "zo" # ዞ
|
311
|
+
|
312
|
+
sub "\u12E0", "zhe" # ዠ
|
313
|
+
sub "\u12E1", "zhu" # ዡ
|
314
|
+
sub "\u12E2", "zhi" # ዢ
|
315
|
+
sub "\u12E3", "zha" # ዣ
|
316
|
+
sub "\u12E4", "zhie" # ዤ
|
317
|
+
sub "\u12E5", any(["zhĭ", "zh"]) # ዥ
|
318
|
+
sub "\u12E6", "zho" # ዦ
|
319
|
+
|
320
|
+
sub "\u12E8", "ye" # የ
|
321
|
+
sub "\u12E9", "yu" # ዩ
|
322
|
+
sub "\u12EA", "yi" # ዪ
|
323
|
+
sub "\u12EB", "ya" # ያ
|
324
|
+
sub "\u12EC", "yie" # ዬ
|
325
|
+
sub "\u12ED", any(["yĭ", "y"]) # ይ
|
326
|
+
sub "\u12EE", "yo" # ዮ
|
327
|
+
|
328
|
+
sub "\u12F0", "de" # ደ
|
329
|
+
sub "\u12F1", "du" # ዱ
|
330
|
+
sub "\u12F2", "di" # ዲ
|
331
|
+
sub "\u12F3", "da" # ዳ
|
332
|
+
sub "\u12F4", "die" # ዴ
|
333
|
+
sub "\u12F5", any(["dĭ", "d"]) # ድ
|
334
|
+
sub "\u12F6", "do" # ዶ
|
335
|
+
|
336
|
+
sub "\u1300", "je" # ጀ
|
337
|
+
sub "\u1301", "ju" # ጁ
|
338
|
+
sub "\u1302", "ji" # ጂ
|
339
|
+
sub "\u1303", "ja" # ጃ
|
340
|
+
sub "\u1304", "jie" # ጄ
|
341
|
+
sub "\u1305", any(["jĭ", "j"]) # ጅ
|
342
|
+
sub "\u1306", "jo" # ጆ
|
343
|
+
|
344
|
+
sub "\u1308", "ge" # ገ
|
345
|
+
sub "\u1309", "gu" # ጉ
|
346
|
+
sub "\u130A", "gi" # ጊ
|
347
|
+
sub "\u130B", "ga" # ጋ
|
348
|
+
sub "\u130C", "gie" # ጌ
|
349
|
+
sub "\u130D", any(["gĭ", "g"]) # ግ
|
350
|
+
sub "\u130E", "go" # ጎ
|
351
|
+
|
352
|
+
sub "\u1320", "t’e" # ጠ
|
353
|
+
sub "\u1321", "t’u" # ጡ
|
354
|
+
sub "\u1322", "t’i" # ጢ
|
355
|
+
sub "\u1323", "t’a" # ጣ
|
356
|
+
sub "\u1324", "t’ie" # ጤ
|
357
|
+
sub "\u1325", any(["t’ĭ", "t’"]) # ጥ
|
358
|
+
sub "\u1326", "t’o" # ጦ
|
359
|
+
|
360
|
+
sub "\u1328", "ch’e" # ጨ
|
361
|
+
sub "\u1329", "ch’u" # ጩ
|
362
|
+
sub "\u132A", "ch’i" # ጪ
|
363
|
+
sub "\u132B", "ch’a" # ጫ
|
364
|
+
sub "\u132C", "ch’ie" # ጬ
|
365
|
+
sub "\u132D", any(["ch’ĭ", "ch’"]) # ጭ
|
366
|
+
sub "\u132E", "ch’o" # ጮ
|
367
|
+
|
368
|
+
sub "\u1330", "p’e" # ጰ
|
369
|
+
sub "\u1331", "p’u" # ጱ
|
370
|
+
sub "\u1332", "p’i" # ጲ
|
371
|
+
sub "\u1333", "p’a" # ጳ
|
372
|
+
sub "\u1334", "p’ie" # ጴ
|
373
|
+
sub "\u1335", any(["p’ĭ", "p’"]) # ጵ
|
374
|
+
sub "\u1336", "p’o" # ጶ
|
375
|
+
|
376
|
+
sub "\u1338", "ts’e" # ጸ
|
377
|
+
sub "\u1339", "ts’u" # ጹ
|
378
|
+
sub "\u133A", "ts’i" # ጺ
|
379
|
+
sub "\u133B", "ts’a" # ጻ
|
380
|
+
sub "\u133C", "ts’ie" # ጼ
|
381
|
+
sub "\u133D", any(["ts’ĭ", "ts’"]) # ጽ
|
382
|
+
sub "\u133E", "ts’o" # ጾ
|
383
|
+
|
384
|
+
sub "\u1340", "ts’e" # ፀ
|
385
|
+
sub "\u1341", "ts’u" # ፁ
|
386
|
+
sub "\u1342", "ts’i" # ፂ
|
387
|
+
sub "\u1343", "ts’a" # ፃ
|
388
|
+
sub "\u1344", "ts’ie" # ፄ
|
389
|
+
sub "\u1345", any(["ts’ĭ", "ts’"]) # ፅ
|
390
|
+
sub "\u1346", "ts’o" # ፆ
|
391
|
+
|
392
|
+
sub "\u1348", "fe" # ፈ
|
393
|
+
sub "\u1349", "fu" # ፉ
|
394
|
+
sub "\u134A", "fi" # ፊ
|
395
|
+
sub "\u134B", "fa" # ፋ
|
396
|
+
sub "\u134C", "fie" # ፌ
|
397
|
+
sub "\u134D", any(["fĭ", "f"]) # ፍ
|
398
|
+
sub "\u134E", "fo" # ፎ
|
399
|
+
|
400
|
+
sub "\u1350", "pe" # ፐ
|
401
|
+
sub "\u1351", "pu" # ፑ
|
402
|
+
sub "\u1352", "pi" # ፒ
|
403
|
+
sub "\u1353", "pa" # ፓ
|
404
|
+
sub "\u1354", "pie" # ፔ
|
405
|
+
sub "\u1355", any(["pĭ", "p"]) # ፕ
|
406
|
+
sub "\u1356", "po" # ፖ
|
407
|
+
|
408
|
+
sub "\u1268", "ve" # ቨ
|
409
|
+
sub "\u1269", "vu" # ቩ
|
410
|
+
sub "\u126A", "vi" # ቪ
|
411
|
+
sub "\u126B", "va" # ቫ
|
412
|
+
sub "\u126C", "vie" # ቬ
|
413
|
+
sub "\u126D", any(["vĭ", "v"]) # ቭ
|
414
|
+
sub "\u126E", "vo" # ቮ
|
415
|
+
|
416
|
+
# Combinations with W (Labialized Consonants)
|
417
|
+
|
418
|
+
sub "\u1248", "k’we" # ቈ
|
419
|
+
sub "\u124a", "k’wi" # ቊ
|
420
|
+
sub "\u124b", "k’wa" # ቋ
|
421
|
+
sub "\u124c", "k’wie" # ቌ
|
422
|
+
sub "\u124d", any(["k’wĭ", "k’w"]) # ቍ
|
423
|
+
|
424
|
+
sub "\u1288", "ḥwe" # ኈ
|
425
|
+
sub "\u128a", "ḥwi" # ኊ
|
426
|
+
sub "\u128b", "ḥwa" # ኋ
|
427
|
+
sub "\u128c", "ḥwie" # ኌ
|
428
|
+
sub "\u128d", any(["ḥwĭ", "ḥw"]) # ኍ
|
429
|
+
|
430
|
+
sub "\u12b0", "kwe" # ኰ
|
431
|
+
sub "\u12b2", "kwi" # ኲ
|
432
|
+
sub "\u12b3", "kwa" # ኳ
|
433
|
+
sub "\u12b4", "kwie" # ኴ
|
434
|
+
sub "\u12b5", any(["kwĭ", "kw"]) # ኵ
|
435
|
+
|
436
|
+
sub "\u1310", "gwe" # ጐ
|
437
|
+
sub "\u1312", "gwi" # ጒ
|
438
|
+
sub "\u1313", "gwa" # ጓ
|
439
|
+
sub "\u1314", "gwie" # ጔ
|
440
|
+
sub "\u1315", any(["gwĭ", "gw"]) # ጕ
|
441
|
+
|
442
|
+
sub "\u12c0", "khwe" # ዀ
|
443
|
+
sub "\u12c2", "khwi" # ዂ
|
444
|
+
sub "\u12c3", "khwa" # ዃ
|
445
|
+
sub "\u12c4", "khwie" # ዄ
|
446
|
+
sub "\u12c5", any(["khwĭ", "khw"]) # ዅ
|
447
|
+
|
448
|
+
# Labialized kh’ series (U+1258–U+125D): carries the "w" like the other labialized rows, so it stays distinct from the plain kh’ series (U+1250–U+1255).
sub "\u1258", "kh’we" # ቘ
|
449
|
+
sub "\u125a", "kh’wi" # ቚ
|
450
|
+
sub "\u125b", "kh’wa" # ቛ
|
451
|
+
sub "\u125c", "kh’wie" # ቜ
|
452
|
+
sub "\u125d", any(["kh’wĭ", "kh’w"]) # ቝ
|
453
|
+
|
454
|
+
sub "\u120f", "lwa" # ሏ
|
455
|
+
sub "\u121f", "mwa" # ሟ
|
456
|
+
sub "\u122f", "rwa" # ሯ
|
457
|
+
sub "\u1237", "swa" # ሷ
|
458
|
+
sub "\u123f", "shwa" # ሿ
|
459
|
+
sub "\u1267", "bwa" # ቧ
|
460
|
+
sub "\u1277", "twa" # ቷ
|
461
|
+
sub "\u127f", "chwa" # ቿ
|
462
|
+
|
463
|
+
sub "\u1297", "nwa" # ኗ
|
464
|
+
sub "\u129f", "nywa" # ኟ
|
465
|
+
sub "\u12df", "zwa" # ዟ
|
466
|
+
sub "\u12e7", "zhwa" # ዧ
|
467
|
+
sub "\u12f7", "dwa" # ዷ
|
468
|
+
sub "\u1307", "jwa" # ጇ
|
469
|
+
sub "\u1327", "t’wa" # ጧ
|
470
|
+
sub "\u132f", "ch’wa" # ጯ
|
471
|
+
sub "\u133f", "ts’wa" # ጿ
|
472
|
+
sub "\u134f", "fwa" # ፏ
|
473
|
+
|
474
|
+
# Numerals
|
475
|
+
|
476
|
+
sub "\u1369", "1" # ፩
|
477
|
+
sub "\u136A", "2" # ፪
|
478
|
+
sub "\u136B", "3" # ፫
|
479
|
+
sub "\u136C", "4" # ፬
|
480
|
+
sub "\u136D", "5" # ፭
|
481
|
+
sub "\u136E", "6" # ፮
|
482
|
+
sub "\u136F", "7" # ፯
|
483
|
+
sub "\u1370", "8" # ፰
|
484
|
+
sub "\u1371", "9" # ፱
|
485
|
+
sub "\u1372", "10" # ፲
|
486
|
+
sub "\u1372\u1369", "11" # ፲፩
|
487
|
+
sub "\u1373", "20" # ፳
|
488
|
+
sub "\u1373\u1369", "21" # ፳፩
|
489
|
+
sub "\u1374", "30" # ፴
|
490
|
+
sub "\u1375", "40" # ፵
|
491
|
+
sub "\u1376", "50" # ፶
|
492
|
+
sub "\u1377", "60" # ፷
sub "\u1378", "70" # ፸ (U+1378 ETHIOPIC NUMBER SEVENTY; previously missing between 60 and 80)
|
493
|
+
sub "\u1379", "80" # ፹
|
494
|
+
sub "\u137A", "90" # ፺
|
495
|
+
sub "\u137B", "100" # ፻
|
496
|
+
|
497
|
+
# These two rules are not defined in the system.
|
498
|
+
# sub "\u1372\u137B", "1000" # ፲፻
|
499
|
+
# sub "\u137B\u137B", "10000" # ፻፻
|
500
|
+
|
501
|
+
# Punctuation
|
502
|
+
|
503
|
+
sub "፡", " " # Word Break (space)
|
504
|
+
sub "፣", "," # Comma
|
505
|
+
sub "፤", ";" # Semicolon
|
506
|
+
sub "።", "." # Period
|
507
|
+
|
508
|
+
}
|
509
|
+
|
510
|
+
}
|
511
|
+
|