interscript-maps 2.1.0 → 2.3.1
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/interscript-maps.gemspec +1 -1
- data/interscript-maps.yaml +330 -111
- data/maps/acadsin-zho-Hani-Latn-2002.imp +2 -2
- data/maps/alalc-amh-Ethi-Latn-1997.imp +18 -14
- data/maps/alalc-amh-Ethi-Latn-2011.imp +1 -1
- data/maps/alalc-ara-Arab-Latn-1997.imp +1 -1
- data/maps/alalc-asm-Deva-Latn-1997.imp +1 -1
- data/maps/alalc-asm-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-aze-Arab-Latn-1997.imp +1 -1
- data/maps/alalc-aze-Cyrl-Latn-1997.imp +1 -1
- data/maps/alalc-bel-Cyrl-Latn-1997.imp +4 -4
- data/maps/alalc-ben-Beng-Latn-1997.imp +1 -1
- data/maps/alalc-ben-Beng-Latn-2017.imp +1 -1
- data/maps/alalc-bul-Cyrl-Latn-1997.imp +1 -1
- data/maps/alalc-div-Thaa-Latn-1997.imp +1 -1
- data/maps/alalc-div-Thaa-Latn-2012.imp +74 -0
- data/maps/alalc-ell-Grek-Latn-1997.imp +1 -1
- data/maps/alalc-ell-Grek-Latn-2010.imp +1 -1
- data/maps/alalc-guj-Gujr-Latn-1997.imp +1 -1
- data/maps/alalc-guj-Gujr-Latn-2011.imp +1 -1
- data/maps/alalc-hin-Deva-Latn-1997.imp +1 -1
- data/maps/alalc-hin-Deva-Latn-2011.imp +1 -1
- data/maps/alalc-kan-Kana-Latn-1997.imp +1 -1
- data/maps/alalc-kan-Kana-Latn-2011.imp +1 -1
- data/maps/alalc-kat-Geok-Latn-1997.imp +3 -4
- data/maps/alalc-kat-Geok-Latn-2011.imp +31 -0
- data/maps/alalc-kat-Geor-Latn-1997.imp +12 -13
- data/maps/alalc-kat-Geor-Latn-2011.imp +52 -0
- data/maps/alalc-kor-Hang-Latn-1997.imp +1 -1
- data/maps/alalc-mal-Mlym-Latn-1997.imp +1 -1
- data/maps/alalc-mal-Mlym-Latn-2012.imp +1 -1
- data/maps/alalc-mar-Deva-Latn-1997.imp +1 -1
- data/maps/alalc-mar-Deva-Latn-2011.imp +1 -1
- data/maps/alalc-mkd-Cyrl-Latn-1997.imp +2 -2
- data/maps/alalc-mkd-Cyrl-Latn-2013.imp +2 -2
- data/maps/alalc-mon-Cyrl-Latn-1997.imp +3 -3
- data/maps/alalc-ori-Orya-Latn-1997.imp +1 -1
- data/maps/alalc-ori-Orya-Latn-2011.imp +1 -1
- data/maps/alalc-pan-Guru-Latn-1997.imp +1 -1
- data/maps/alalc-pan-Guru-Latn-2011.imp +1 -1
- data/maps/alalc-per-Arab-Latn-1997.imp +1 -1
- data/maps/alalc-pli-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-pra-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-rus-Cyrl-Latn-1997.imp +2 -2
- data/maps/alalc-rus-Cyrl-Latn-2012.imp +1 -1
- data/maps/alalc-san-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-sin-Sinh-Latn-1997.imp +1 -1
- data/maps/alalc-sin-Sinh-Latn-2011.imp +1 -1
- data/maps/alalc-srp-Cyrl-Latn-1997.imp +2 -2
- data/maps/alalc-srp-Cyrl-Latn-2013.imp +1 -1
- data/maps/alalc-tam-Taml-Latn-1997.imp +1 -1
- data/maps/alalc-tam-Taml-Latn-2011.imp +1 -1
- data/maps/alalc-tel-Telu-Latn-1997.imp +2 -2
- data/maps/alalc-tel-Telu-Latn-2011.imp +1 -1
- data/maps/alalc-tir-Ethi-Latn-1997.imp +429 -0
- data/maps/alalc-tir-Ethi-Latn-2011.imp +85 -0
- data/maps/alalc-ukr-Cyrl-Latn-1997.imp +1 -1
- data/maps/alalc-ukr-Cyrl-Latn-2011.imp +1 -1
- data/maps/apcbg-bul-Cyrl-Latn-1995.imp +7 -4
- data/maps/az-aze-Cyrl-Latn-1939.imp +1 -0
- data/maps/az-aze-Cyrl-Latn-1958.imp +1 -0
- data/maps/bas-rus-Cyrl-Latn-2017-bss.imp +1 -1
- data/maps/bas-rus-Cyrl-Latn-2017-oss.imp +1 -1
- data/maps/bgn-jpn-Hrkt-Latn-1962.imp +5 -5
- data/maps/bgn-kor-Hang-Latn-1943.imp +1 -1
- data/maps/bgn-kor-Kore-Latn-1943.imp +1 -1
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +11 -11
- data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +1 -1
- data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +2 -2
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +2 -2
- data/maps/bgnpcgn-bak-Cyrl-Latn-2007.imp +1 -1
- data/maps/bgnpcgn-bel-Cyrl-Latn-1979.imp +4 -1
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +10 -4
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +1 -1
- data/maps/bgnpcgn-che-Cyrl-Latn-2008.imp +2 -1
- data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +1 -1
- data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +4 -4
- data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +1 -1
- data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +1 -1
- data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +1 -1
- data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +4 -3
- data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +1 -1
- data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +1 -1
- data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +2 -2
- data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +1 -1
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +1 -1
- data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +8 -8
- data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +2 -2
- data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +4 -4
- data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +3 -3
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +1 -1
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +5 -5
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +5 -5
- data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +1 -1
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +2 -2
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +1 -1
- data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +3 -3
- data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +4 -4
- data/maps/bgnpcgn-per-Arab-Latn-1958.imp +19 -19
- data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +15 -15
- data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +15 -15
- data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +16 -16
- data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +2 -2
- data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +5 -5
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +1 -1
- data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +1 -1
- data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +5 -3
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +1 -1
- data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +1 -1
- data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +1 -1
- data/maps/bgnpcgn-tir-Ethi-Latn-2007.imp +511 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +1 -1
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +1 -1
- data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +15 -15
- data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +3 -3
- data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +1 -1
- data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +1 -1
- data/maps/bis-asm-Beng-Latn-13194-1991.imp +1 -1
- data/maps/bis-ben-Beng-Latn-13194-1991.imp +1 -1
- data/maps/bis-dev-Deva-Latn-13194-1991.imp +1 -1
- data/maps/bis-guj-Gujr-Latn-13194-1991.imp +1 -1
- data/maps/bis-kan-Kana-Latn-13194-1991.imp +1 -1
- data/maps/bis-mlm-Mlym-Latn-13194-1991.imp +1 -1
- data/maps/bis-ori-Orya-Latn-13194-1991.imp +1 -1
- data/maps/bis-pnj-Guru-Latn-13194-1991.imp +1 -1
- data/maps/bis-tel-Telu-Latn-13194-1991.imp +1 -1
- data/maps/bis-tml-Taml-Latn-13194-1991.imp +1 -1
- data/maps/by-bel-Cyrl-Latn-2007.imp +7 -5
- data/maps/din-hin-Deva-Latn-33904-2018.imp +1 -1
- data/maps/din-kat-Geor-Latn-32707-2010.imp +12 -12
- data/maps/din-mar-Deva-Latn-33904-2018.imp +1 -1
- data/maps/din-nep-Deva-Latn-33904-2018.imp +1 -1
- data/maps/din-pli-Deva-Latn-33904-2018.imp +1 -1
- data/maps/din-pra-Deva-Latn-33904-2018.imp +1 -1
- data/maps/din-san-Deva-Latn-33904-2018.imp +1 -1
- data/maps/dos-nep-Deva-Latn-1997.imp +2 -2
- data/maps/elot-ell-Grek-Latn-743-1982-tl.imp +1 -2
- data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +1 -1
- data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +1 -1
- data/maps/elot-ell-Grek-Latn-743-2001-ts.imp +1 -1
- data/maps/ggg-kat-Geor-Latn-2002.imp +3 -3
- data/maps/gki-bel-Cyrl-Latn-2000.imp +1 -1
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +1 -1
- data/maps/iso-ara-Arab-Latn-233-1984.imp +15 -15
- data/maps/iso-ara-Arab-Latn-233-2-1993.imp +1 -1
- data/maps/iso-asm-Beng-Latn-15919-2001.imp +1 -1
- data/maps/iso-ben-Beng-Latn-15919-2001.imp +1 -1
- data/maps/iso-ell-Grek-Latn-843-1997-t1.imp +1 -1
- data/maps/iso-ell-Grek-Latn-843-1997-t2.imp +1 -1
- data/maps/iso-guj-Gujr-Latn-15919-2001.imp +1 -1
- data/maps/iso-hin-Deva-Latn-15919-2001.imp +1 -1
- data/maps/iso-inc-Deva-Latn-15919-2001.imp +1 -1
- data/maps/iso-jpn-Hrkt-Latn-3602-1989.imp +1 -1
- data/maps/iso-kan-Kana-Latn-15919-2001.imp +1 -1
- data/maps/iso-kat-Geor-Latn-9984-1996.imp +12 -12
- data/maps/iso-kor-Hang-Latn-1996-method1.imp +1 -1
- data/maps/iso-kor-Hang-Latn-1996-method2.imp +1 -1
- data/maps/iso-mal-Mlym-Latn-15919-2001.imp +2 -2
- data/maps/iso-mar-Deva-Latn-15919-2001.imp +1 -1
- data/maps/iso-nep-Deva-Latn-15919-2001.imp +1 -1
- data/maps/iso-ori-Orya-Latn-15919-2001.imp +1 -1
- data/maps/iso-pan-Guru-Latn-15919-2001.imp +1 -1
- data/maps/iso-pli-Beng-Latn-15919-2001.imp +1 -1
- data/maps/iso-pli-Deva-Latn-15919-2001.imp +1 -1
- data/maps/iso-pli-Sinh-Latn-15919-2001.imp +1 -1
- data/maps/iso-pli-Thai-Latn-15919-2001.imp +1 -1
- data/maps/iso-pra-Deva-Latn-15919-2001.imp +1 -1
- data/maps/iso-prs-Arab-Latn-233-3-1999.imp +16 -16
- data/maps/iso-rus-Cyrl-Latn-9-1995.imp +1 -1
- data/maps/iso-san-Deva-Latn-15919-2001.imp +1 -1
- data/maps/iso-tam-Taml-Latn-15919-2001.imp +1 -1
- data/maps/iso-tel-Telu-Latn-15919-2001.imp +1 -1
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +5 -5
- data/maps/mext-jpn-Hrkt-Latn-1954.imp +2 -1
- data/maps/moct-kor-Hang-Latn-2000.imp +1 -1
- data/maps/mofa-jpn-Hrkt-Latn-1989.imp +1 -1
- data/maps/mv-div-Thaa-Latn-1987.imp +1 -1
- data/maps/mvd-bel-Cyrl-Latn-2008.imp +5 -5
- data/maps/mvd-bel-Cyrl-Latn-2010.imp +2 -5
- data/maps/mvd-rus-Cyrl-Latn-2008.imp +4 -3
- data/maps/mvd-rus-Cyrl-Latn-2010.imp +2 -5
- data/maps/odni-ara-Arab-Latn-2004.imp +1 -2
- data/maps/odni-ara-Arab-Latn-2015.imp +2 -2
- data/maps/odni-aze-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-bel-Cyrl-Latn-2015.imp +2 -4
- data/maps/odni-bul-Cyrl-Latn-2005.imp +2 -2
- data/maps/odni-bul-Cyrl-Latn-2015.imp +1 -3
- data/maps/odni-che-Cyrl-Latn-2015.imp +1 -2
- data/maps/odni-fas-Arab-Latn-2004.imp +14 -15
- data/maps/odni-fas-Arab-Latn-2015.imp +17 -17
- data/maps/odni-hin-Deva-Latn-2004.imp +20 -21
- data/maps/odni-hin-Deva-Latn-2015.imp +26 -27
- data/maps/odni-kat-Geor-Latn-2015.imp +3 -5
- data/maps/odni-kaz-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-kir-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-kor-Hang-Latn-2015.imp +2 -2
- data/maps/odni-mkd-Cyrl-Latn-2005.imp +1 -1
- data/maps/odni-mkd-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-prs-Arab-Latn-2004.imp +0 -1
- data/maps/odni-prs-Arab-Latn-2015.imp +2 -2
- data/maps/odni-pus-Arab-Latn-2011.imp +1 -2
- data/maps/odni-rus-Cyrl-Latn-2015.imp +1 -3
- data/maps/odni-srp-Cyrl-Latn-2005.imp +1 -2
- data/maps/odni-srp-Cyrl-Latn-2015.imp +7 -9
- data/maps/odni-tat-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-tgk-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-tuk-Cyrl-Latn-2015.imp +1 -2
- data/maps/odni-uig-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-ukr-Cyrl-Latn-2015.imp +2 -4
- data/maps/odni-urd-Arab-Latn-2015.imp +21 -22
- data/maps/odni-uzb-Cyrl-Latn-2015.imp +1 -3
- data/maps/ses-ara-Arab-Latn-1930.imp +17 -60
- data/maps/un-amh-Ethi-Latn-2016.imp +1 -1
- data/maps/un-ara-Arab-Latn-1971.imp +6 -6
- data/maps/un-ara-Arab-Latn-1972.imp +5 -5
- data/maps/un-ara-Arab-Latn-2017.imp +16 -16
- data/maps/un-asm-Beng-Latn-1972.imp +1 -1
- data/maps/un-bel-Cyrl-Latn-2007.imp +2 -2
- data/maps/un-ben-Beng-Latn-2016.imp +1 -1
- data/maps/un-bul-Cyrl-Latn-1977.imp +197 -0
- data/maps/un-ell-Grek-Latn-1987-phonetic.imp +5 -1
- data/maps/un-ell-Grek-Latn-1987-tl.imp +1 -1
- data/maps/un-ell-Grek-Latn-1987-ts.imp +2 -2
- data/maps/un-guj-Gujr-Latn-1972.imp +1 -1
- data/maps/un-hin-Deva-Latn-2016.imp +2 -2
- data/maps/un-kan-Kana-Latn-2016.imp +2 -2
- data/maps/un-mal-Mlym-Latn-1972.imp +1 -1
- data/maps/un-mar-Deva-Latn-2016.imp +2 -2
- data/maps/un-mkd-Cyrl-Latn-1977.imp +119 -0
- data/maps/un-mon-Mong-Latn-general-2013.imp +1 -1
- data/maps/un-mon-Mong-Latn-phonetic-2013.imp +1 -1
- data/maps/un-nep-Deva-Latn-1972.imp +2 -2
- data/maps/un-nep-Deva-Latn-2013.imp +2 -2
- data/maps/un-ori-Orya-Latn-1972.imp +2 -2
- data/maps/un-pan-Guru-Latn-1972.imp +1 -1
- data/maps/un-prs-Arab-Latn-1967.imp +15 -15
- data/maps/un-rus-Cyrl-Latn-1987.imp +2 -2
- data/maps/un-sin-Sinh-Latn-1972.imp +16 -4
- data/maps/un-srp-Cyrl-Latn-1997.imp +47 -0
- data/maps/un-tam-Taml-Latn-1972.imp +1 -1
- data/maps/un-tel-Telu-Latn-1972.imp +1 -1
- data/maps/un-ukr-Cyrl-Latn-1998.imp +1 -1
- data/maps/un-ukr-Cyrl-Latn-2012.imp +1 -1
- data/maps/un-urd-Arab-Latn-1972.imp +16 -16
- data/maps/var-amh-Ethi-Latn-eae-2003.imp +48 -43
- data/maps/var-ara-Arab-Arab-rababa.imp +25 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1886.imp +1 -1
- data/maps/var-jpn-Hrkt-Latn-hepburn-1954.imp +1 -1
- data/maps/var-kor-Hang-Latn-mr-1939.imp +1 -1
- data/maps/var-kor-Kore-Latn-mr-1939.imp +1 -1
- data/maps/var-mar-Deva-Latn-hunterian-1872.imp +0 -1
- data/maps/var-mon-Mong-Latn-1930.imp +1 -1
- data/maps/var-mon-Mong-Latn-lessing.imp +2 -2
- data/maps/var-mon-Mong-Latn-vpmc.imp +2 -2
- data/maps/var-pra-Deva-Latn-iast-1912.imp +1 -1
- data/maps/var-san-Deva-Latn-iast-1912.imp +1 -1
- metadata +11 -1
@@ -4,12 +4,16 @@ metadata {
|
|
4
4
|
language: iso-639-2:ell
|
5
5
|
source_script: Grek
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Greek 1.0 (Phonetic transcription)
|
8
8
|
url: http://www.eki.ee/wgrs/rom1_el.htm
|
9
9
|
creation_date: 1987
|
10
10
|
description: |
|
11
11
|
UNGEGN Romanization table for Greek: Phonetic transcription
|
12
12
|
|
13
|
+
UNGEGN Greek v1.0, Fifth United Nations Conference on the Standardization of
|
14
|
+
Geographical Names. Writing Systems and Guides to Pronunciation Romanization
|
15
|
+
> Conversion of the Greek alphabet into Latin characters. Paper submitted by
|
16
|
+
Greece and Cyprus.
|
13
17
|
|
14
18
|
notes:
|
15
19
|
- Also included in ISO 843:1997, Annex B, Column 5, and ELOT 743:1982, column 5.
|
@@ -1,10 +1,10 @@
|
|
1
1
|
metadata {
|
2
2
|
authority_id: un
|
3
|
-
id: 1987-
|
3
|
+
id: 1987-ts
|
4
4
|
language: iso-639-2:ell
|
5
5
|
source_script: Grek
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Greek -- UNGEGN 4.0 (transcription)
|
8
8
|
url: http://www.eki.ee/wgrs/rom1_el.htm
|
9
9
|
creation_date: 1987
|
10
10
|
description: |
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:guj
|
5
5
|
source_script: Gujr
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Gujarati -- UNGEGN 4.0
|
8
8
|
url: https://www.eki.ee/wgrs/rom1_gu.htm
|
9
9
|
creation_date: 1972
|
10
10
|
confirmation_date: 2016
|
@@ -1,10 +1,10 @@
|
|
1
1
|
metadata {
|
2
|
-
authority_id:
|
2
|
+
authority_id: un
|
3
3
|
id: 2016
|
4
4
|
language: iso-639-2:hin
|
5
5
|
source_script: Deva
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Hindi -- UNGEGN 4.0
|
8
8
|
url: https://www.eki.ee/wgrs/rom1_hi.pdf
|
9
9
|
creation_date: 1972
|
10
10
|
confirmation_date: 2016
|
@@ -1,10 +1,10 @@
|
|
1
1
|
metadata {
|
2
|
-
authority_id:
|
2
|
+
authority_id: un
|
3
3
|
id: 2016
|
4
4
|
language: iso-639-2:kan
|
5
5
|
source_script: Kana
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Kannada -- UNGEGN 4.0
|
8
8
|
url: https://www.eki.ee/wgrs/rom1_kn.pdf
|
9
9
|
creation_date: 1972
|
10
10
|
confirmation_date: 2016
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:mal
|
5
5
|
source_script: Mlym
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Malayalam -- UNGEGN 4.0
|
8
8
|
url: https://www.eki.ee/wgrs/rom1_ml.htm
|
9
9
|
creation_date: 1972
|
10
10
|
confirmation_date: 2016
|
@@ -1,10 +1,10 @@
|
|
1
1
|
metadata {
|
2
|
-
authority_id:
|
2
|
+
authority_id: un
|
3
3
|
id: 2016
|
4
4
|
language: iso-639-2:hin
|
5
5
|
source_script: Deva
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Marathi -- UNGEGN 4.0
|
8
8
|
url: https://www.eki.ee/wgrs/rom1_mr.pdf
|
9
9
|
creation_date: 1972
|
10
10
|
confirmation_date: 2016
|
@@ -0,0 +1,119 @@
|
|
1
|
+
metadata {
|
2
|
+
authority_id: id
|
3
|
+
id: 1977
|
4
|
+
language: iso-639-2:mkd
|
5
|
+
source_script: Cyrl
|
6
|
+
destination_script: Latn
|
7
|
+
name: Romanization of Macedonian geographical names (1977)
|
8
|
+
url: https://www.eki.ee/wgrs/v2_2/rom1_mk.htm
|
9
|
+
creation_date: 1977
|
10
|
+
description: |
|
11
|
+
The United Nations recommended system was approved in 1977 (III/11), based on the romanization of the Serbo-Croatian and Macedonian Cyrillic alphabets that had long been employed in official gazetteers and maps of Yugoslavia. The table was published as an annex to the resolution (Third United Nations Conference on the Standardization of Geographical Names. Athens, 17 August - 7 September 1977. Vol. I. Report of the Conference, pp. 29, 31).
|
12
|
+
The system is used in The former Yugoslav Republic of Macedonia (see e.g. Report of The former Yugoslav Republic of Macedonia. Seventh United Nations Conference on the Standardization of Geographical Names. New York, 13-22 January 1998. Document E/CONF.91/CRP.23) and in international cartographic products.
|
13
|
+
The Cyrillic alphabet is used. The romanization table is unambiguous and can be applied automatically. The system is on the whole reversible with the exception of the characters ѓ and ќ. These are romanized as g and k, respectively, before е and и. But also г and к are occasionally used before е and и, so, for example, the name Makedonija is reconstituted as Македонија, not Маќедонија in the Cyrillic source script.
|
14
|
+
}
|
15
|
+
|
16
|
+
tests {
|
17
|
+
test "Маќедонија", "Makedonija"
|
18
|
+
test "Општина Ердут", "Opština Erdut"
|
19
|
+
test "Општина Двор", "Opština Dvor"
|
20
|
+
test "ЛУЃЕ луѓе", "LUGE luge"
|
21
|
+
test "ЅВЕЗДА ѕвезда Ѕвезда", "DZVEZDA dzvezda Dzvezda"
|
22
|
+
test "ЌАРУВАЊЕ ќарување", "ĆARUVANJE ćaruvanje"
|
23
|
+
}
|
24
|
+
|
25
|
+
dependency "posix", import: true
|
26
|
+
|
27
|
+
stage {
|
28
|
+
sub "Ѓ", "G", after: any("ЕИеи")
|
29
|
+
sub "ѓ", "g", after: any("ЕИеи")
|
30
|
+
sub "Ќ", "K", after: any("ЕИеи")
|
31
|
+
sub "ќ", "k", after: any("ЕИеи")
|
32
|
+
|
33
|
+
# CHARACTERS
|
34
|
+
parallel {
|
35
|
+
sub "А", "A"
|
36
|
+
sub "Б", "B"
|
37
|
+
sub "В", "V"
|
38
|
+
sub "Г", "G"
|
39
|
+
sub "Д", "D"
|
40
|
+
sub "Ѓ", "Đ" # Đ
|
41
|
+
sub "Е", "E"
|
42
|
+
sub "Ж", "Ž" # Ž
|
43
|
+
sub "З", "Z"
|
44
|
+
sub "Ѕ", "Dz"
|
45
|
+
sub "И", "I"
|
46
|
+
sub "Ј", "J"
|
47
|
+
sub "К", "K"
|
48
|
+
sub "Л", "L"
|
49
|
+
sub "Љ", "Lj"
|
50
|
+
sub "М", "M"
|
51
|
+
sub "Н", "N"
|
52
|
+
sub "Њ", "Nj"
|
53
|
+
sub "О", "O"
|
54
|
+
sub "П", "P"
|
55
|
+
sub "Р", "R"
|
56
|
+
sub "С", "S"
|
57
|
+
sub "Т", "T"
|
58
|
+
sub "Ќ", "Ć" # Ć
|
59
|
+
sub "У", "U"
|
60
|
+
sub "Ф", "F"
|
61
|
+
sub "Х", "H"
|
62
|
+
sub "Ц", "C"
|
63
|
+
sub "Ч", "Č" # Č
|
64
|
+
sub "Џ", "Dž" # Dž
|
65
|
+
sub "Ш", "Š" # Š
|
66
|
+
sub "а", "a"
|
67
|
+
sub "б", "b"
|
68
|
+
sub "в", "v"
|
69
|
+
sub "г", "g"
|
70
|
+
sub "д", "d"
|
71
|
+
sub "ѓ", "đ" # đ
|
72
|
+
sub "е", "e"
|
73
|
+
sub "ж", "ž" # ž
|
74
|
+
sub "з", "z"
|
75
|
+
sub "ѕ", "dz"
|
76
|
+
sub "и", "i"
|
77
|
+
sub "ј", "j"
|
78
|
+
sub "к", "k"
|
79
|
+
sub "л", "l"
|
80
|
+
sub "љ", "lj"
|
81
|
+
sub "м", "m"
|
82
|
+
sub "н", "n"
|
83
|
+
sub "њ", "nj"
|
84
|
+
sub "о", "o"
|
85
|
+
sub "п", "p"
|
86
|
+
sub "р", "r"
|
87
|
+
sub "с", "s"
|
88
|
+
sub "т", "t"
|
89
|
+
sub "ќ", "ć" # ć
|
90
|
+
sub "у", "u"
|
91
|
+
sub "ф", "f"
|
92
|
+
sub "х", "h"
|
93
|
+
sub "ц", "c"
|
94
|
+
sub "ч", "č" # č
|
95
|
+
sub "џ", "dž" # dž
|
96
|
+
sub "ш", "š" # š
|
97
|
+
}
|
98
|
+
|
99
|
+
# POSTRULES
|
100
|
+
# rewritten by hand to work properly
|
101
|
+
# DZ
|
102
|
+
sub capture(maybe(upper)) + "Dz" + capture(upper), ref(1) + "DZ" + ref(2)
|
103
|
+
sub capture(upper) + "Dz" + capture(maybe(upper)), ref(1) + "DZ" + ref(2)
|
104
|
+
|
105
|
+
#LJ
|
106
|
+
sub capture(upper) + "Lj" + capture(maybe(upper)), ref(1) + "LJ" + ref(2)
|
107
|
+
sub capture(maybe(upper)) + "Lj" + capture(upper), ref(1) + "LJ" + ref(2)
|
108
|
+
|
109
|
+
#NJ
|
110
|
+
sub capture(upper) + "Nj" + capture(maybe(upper)), ref(1) + "NJ" + ref(2)
|
111
|
+
sub capture(maybe(upper)) + "Nj" + capture(upper), ref(1) + "NJ" + ref(2)
|
112
|
+
|
113
|
+
#DŽ
|
114
|
+
sub capture(upper) + "Dž" + capture(maybe(upper)), ref(1) + "DŽ" + ref(2)
|
115
|
+
sub capture(maybe(upper)) + "Dž" + capture(upper), ref(1) + "DŽ" + ref(2)
|
116
|
+
|
117
|
+
compose
|
118
|
+
}
|
119
|
+
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:mon
|
5
5
|
source_script: Mong
|
6
6
|
destination_script: Latn
|
7
|
-
name: Mongolian
|
7
|
+
name: Romanization of Mongolian in China -- UNGEGN 4.0
|
8
8
|
url: http://www.eki.ee/wgrs/rom1_mnc.htm
|
9
9
|
creation_date: 2013-09
|
10
10
|
description: |
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:mon
|
5
5
|
source_script: Mong
|
6
6
|
destination_script: Latn
|
7
|
-
name: Mongolian
|
7
|
+
name: Romanization of Mongolian in China -- UNGEGN 4.0 (phonetic)
|
8
8
|
url: http://www.eki.ee/wgrs/rom1_mnc.htm
|
9
9
|
creation_date: 2013-09
|
10
10
|
description: |
|
@@ -1,10 +1,10 @@
|
|
1
1
|
metadata {
|
2
|
-
authority_id:
|
2
|
+
authority_id: un
|
3
3
|
id: 1972
|
4
4
|
language: iso-639-2:nep
|
5
5
|
source_script: Deva
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Nepali (1972)
|
8
8
|
url: https://www.eki.ee/wgrs/v3_0/rom1_ne.pdf
|
9
9
|
creation_date: 1972
|
10
10
|
confirmation_date: 2010
|
@@ -1,10 +1,10 @@
|
|
1
1
|
metadata {
|
2
|
-
authority_id:
|
2
|
+
authority_id: un
|
3
3
|
id: 2013
|
4
4
|
language: iso-639-2:nep
|
5
5
|
source_script: Deva
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Nepali (2013)
|
8
8
|
url: https://www.eki.ee/wgrs/v3_0/rom1_ne.pdf
|
9
9
|
creation_date: 1972
|
10
10
|
confirmation_date: 2013
|
@@ -1,10 +1,10 @@
|
|
1
1
|
metadata {
|
2
|
-
authority_id:
|
2
|
+
authority_id: un
|
3
3
|
id: 1972
|
4
4
|
language: iso-639-2:ori
|
5
5
|
source_script: Orya
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Oriya (1972)
|
8
8
|
url: http://www.eki.ee/wgrs/v2_2/rom1_or.pdf
|
9
9
|
creation_date: 1972
|
10
10
|
confirmation_date: 2003
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:pan
|
5
5
|
source_script: Guru
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Panjabi -- UNGEGN 4.0 (1972)
|
8
8
|
url: https://www.eki.ee/wgrs/rom1_pa.htm
|
9
9
|
creation_date: 1972
|
10
10
|
confirmation_date: 2016
|
@@ -5,7 +5,7 @@ metadata {
|
|
5
5
|
# prs stands for Dari (https://iso639-3.sil.org/code/prs&_ga=GA1.2.2054538372.1574092823)
|
6
6
|
source_script: Arab
|
7
7
|
destination_script: Latn
|
8
|
-
name: Persian
|
8
|
+
name: Romanization of Persian (1967)
|
9
9
|
url: http://www.eki.ee/wgrs/v2_2/rom1_fa.htm
|
10
10
|
creation_date: 1967
|
11
11
|
confirmation_date: 01-2003
|
@@ -130,20 +130,20 @@ stage {
|
|
130
130
|
|
131
131
|
# NOTE 1
|
132
132
|
# Sun letters
|
133
|
-
sub boundary + "\u0627\u0644\u062a", "ot t" # الت
|
134
|
-
sub boundary + "\u0627\u0644\u062b", "os̄ s̄" # الث
|
135
|
-
sub boundary + "\u0627\u0644\u062f", "od d" # الد
|
136
|
-
sub boundary + "\u0627\u0644\u0630", "oz̄ z̄" # الذ
|
137
|
-
sub boundary + "\u0627\u0644\u0631", "or r" # الر
|
138
|
-
sub boundary + "\u0627\u0644\u0632", "oz z" # الز
|
139
|
-
sub boundary + "\u0627\u0644\u0633", "os s" # الس
|
140
|
-
sub boundary + "\u0627\u0644\u0634", "osh sh" # الش
|
141
|
-
sub boundary + "\u0627\u0644\u0635", "oş ş" # الص
|
142
|
-
sub boundary + "\u0627\u0644\u0636", "oẕ ẕ" # الض
|
143
|
-
sub boundary + "\u0627\u0644\u0637", "oţ ţ" # الط
|
144
|
-
sub boundary + "\u0627\u0644\u0638", "oz̧ z̧" # الظ
|
145
|
-
sub boundary + "\u0627\u0644\u0644", "ol l" # الل
|
146
|
-
sub boundary + "\u0627\u0644\u0646", "on n" # الن
|
133
|
+
sub boundary + "\u0627\u0644\u062a" + maybe("\u0651"), "ot t" # الت
|
134
|
+
sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), "os̄ s̄" # الث
|
135
|
+
sub boundary + "\u0627\u0644\u062f" + maybe("\u0651"), "od d" # الد
|
136
|
+
sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), "oz̄ z̄" # الذ
|
137
|
+
sub boundary + "\u0627\u0644\u0631" + maybe("\u0651"), "or r" # الر
|
138
|
+
sub boundary + "\u0627\u0644\u0632" + maybe("\u0651"), "oz z" # الز
|
139
|
+
sub boundary + "\u0627\u0644\u0633" + maybe("\u0651"), "os s" # الس
|
140
|
+
sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "osh sh" # الش
|
141
|
+
sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "oş ş" # الص
|
142
|
+
sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "oẕ ẕ" # الض
|
143
|
+
sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "oţ ţ" # الط
|
144
|
+
sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), "oz̧ z̧" # الظ
|
145
|
+
sub boundary + "\u0627\u0644\u0644" + maybe("\u0651"), "ol l" # الل
|
146
|
+
sub boundary + "\u0627\u0644\u0646" + maybe("\u0651"), "on n" # الن
|
147
147
|
|
148
148
|
sub "\u0650\u064a\u0651", "īy" # ـِيَّ
|
149
149
|
sub "\u0650\u064a", "iy", after: any("\u064e\u064f") # ـِي kasra followed by ي
|
@@ -1,10 +1,10 @@
|
|
1
1
|
metadata {
|
2
|
-
authority_id:
|
2
|
+
authority_id: un
|
3
3
|
id: 1987
|
4
4
|
language: iso-639-2:rus
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Russian (1987)
|
8
8
|
url: http://www.eki.ee/wgrs/rom1_ru.htm
|
9
9
|
creation_date: 1987
|
10
10
|
confirmation_date: 2016
|
@@ -4,7 +4,8 @@ metadata {
|
|
4
4
|
language: iso-639-2:sin
|
5
5
|
source_script: Sinh
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Sinhalese -- UNGEGN 4.0 (1972)
|
8
|
+
source: "Second United Nations Conference on the Standardization of Geographical Names. London, 10–31 May 1972. Vol. II. Technical papers, pp. 151–152."
|
8
9
|
url: https://www.eki.ee/wgrs/rom1_ml.htm
|
9
10
|
creation_date: 1972
|
10
11
|
confirmation_date: 2016
|
@@ -18,7 +19,6 @@ metadata {
|
|
18
19
|
Vowels and diphthongs are marked in two ways: as independent characters (used syllable-initially) and in an
|
19
20
|
abbreviated form, to denote vowels after consonants.
|
20
21
|
|
21
|
-
|
22
22
|
notes:
|
23
23
|
- |
|
24
24
|
The character ඇ was romanized as a͝i and the character ඈ as ai in Sharma's table, but there was no romanization for the character ඓ which,
|
@@ -37,13 +37,13 @@ metadata {
|
|
37
37
|
|
38
38
|
tests {
|
39
39
|
test "ශී්ර ලංකාවේ කී්රඩාව ඉතිහාසයේ ඉහළම තැනකට ගේන්න කටයුතු කරනවා", "shīra laṁkāve kīraḍāva itihāsaye ihaḷama tæ̆nakaṭa genna kaṭayutu karanavā"
|
40
|
-
test "කොච්චිකඬේ මෝයකට අසල නෑමට ගිය තරුණයෝ ෩ක් මරුට - මිතුරාගේ උපන් දිනය සැමරීමට ඇවිත්", "
|
40
|
+
test "කොච්චිකඬේ මෝයකට අසල නෑමට ගිය තරුණයෝ ෩ක් මරුට - මිතුරාගේ උපන් දිනය සැමරීමට ඇවිත්", "kŏchchikaṇḍae moyakaṭa asala næmaṭa giya taruṇayo 3k maruṭa - miturāge upan dinaya sæ̆marīmaṭa æ̆vit"
|
41
41
|
test "ලෝක ළමා දිනයදා සිසුන් පිරිසක් කසිප්පු බීලා", "loka ḷamā dinayadā sisun pirisak kasippu bīlā"
|
42
42
|
test "කෝටි 16ක හෙරොයින් සමග දන්කොටුවේදී 7ක් දැලේ", "koṭi 16ka hĕrŏyin samaga dankŏṭuvedī 7k dæ̆le"
|
43
43
|
test "මිනුවන්ගොඩ පීසීආර් දෙදහසක් සිදුකරයි", "minuvangŏḍa pīsīār dĕdahasak sidukarayi"
|
44
44
|
test "පාස්කු ප්රහාරය වගේම පාස්කු ප්රෝඩාව ගැනත් සොයන්න කොමිසමක් පත්කළ යුතුයි - විපක්ෂ නායක සජිත් පේ්රමදාස", "pāsku parahāraya vagema pāsku proḍāva gæ̆nat sŏyanna kŏmisamak patkaḷa yutuyi - vipakṣha nāyaka sajit peramadāsa"
|
45
45
|
test "ට්රම්ප්ගේ සෞඛ්යය තීරණාත්මකයි - ට්විටර් හරහා ජනතාව අමතයි", "ṭarampge saukhyaya tīraṇātmakayi - ṭviṭar harahā janatāva amatayi"
|
46
|
-
test "පාස්කු දා ප්රහාරය පිළිබඳ පරීක්ෂණවලින් කිසිවකුට අසාධාරණයක් වීමට ඉඩ දෙන්නේ නෑ - අගමැති", "pāsku dā parahāraya
|
46
|
+
test "පාස්කු දා ප්රහාරය පිළිබඳ පරීක්ෂණවලින් කිසිවකුට අසාධාරණයක් වීමට ඉඩ දෙන්නේ නෑ - අගමැති", "pāsku dā parahāraya piḷibanda parīkṣhaṇavalin kisivakuṭa asādhāraṇayak vīmaṭa iḍa dĕnne næ - agamæ̆ti"
|
47
47
|
test "දිල්ලි කැපිටල්ස් සහ කෝලිගේ බැංගලෝර් තෙවැනි ජය ලබයි", "dilli kæ̆piṭals saha kolige bæ̆ṁgalor tĕvæ̆ni jaya labayi"
|
48
48
|
test "ශ්රී ලාංකික සම්භවයක් සහිත ප්රංශයේ පවුලක 5 ක් ඝාතනය කරලා", "sharī lāṁkika sambhavayak sahita paraṁshaye pavulaka 5 k ghātanaya karalā"
|
49
49
|
test "පැතිකුදය ඉක්මනින් සුව කරන ප්රතිකාර", "pæ̆tikudaya ikmanin suva karana paratikāra"
|
@@ -171,6 +171,18 @@ stage {
|
|
171
171
|
sub "ෆ", "fa"
|
172
172
|
sub "ළ", "ḷa"
|
173
173
|
|
174
|
+
# Prenasalized sounds
|
175
|
+
sub "ඟ", "ṅga"
|
176
|
+
sub "ඦ", "ñja"
|
177
|
+
sub "ඬ", "ṇḍa"
|
178
|
+
sub "ඳ", "nda"
|
179
|
+
sub "ඹ", "mba"
|
180
|
+
|
181
|
+
# Other ligatures
|
182
|
+
sub "ක්", "k"
|
183
|
+
sub "ඥ", "jña"
|
184
|
+
sub "න්", "n"
|
185
|
+
|
174
186
|
# numbers
|
175
187
|
sub "\u0DE6", "0"
|
176
188
|
sub "\u0DE7", "1"
|
@@ -0,0 +1,47 @@
|
|
1
|
+
metadata {
|
2
|
+
authority_id: un
|
3
|
+
id: 1997
|
4
|
+
language: iso-639-2:srp
|
5
|
+
source_script: Cyrl
|
6
|
+
destination_script: Latn
|
7
|
+
name: Romanization of Serbo-Croatian (1972)
|
8
|
+
url: http://www.eki.ee/wgrs/rom1_sr.htm
|
9
|
+
creation_date: 1997
|
10
|
+
description: |
|
11
|
+
The United Nations recommended system was approved in 1977 (III/11), based on the Roman equivalent of the Serbo-Croatian Cyrillic alphabet that had long been employed in official gazetteers and maps of Yugoslavia. The table was published as an annex to the resolution. The term relating to the language (Serbian instead of Serbo-Croatian) was modified in 2002 (resolution VIII/14).
|
12
|
+
The system is used in Serbia, Montenegro, and Bosnia and Herzegovina. It is also used in international cartographic products.
|
13
|
+
Serbian uses the Cyrillic script that is alphabetic. The romanization table is unambiguous and can be applied automatically. The system is reversible.
|
14
|
+
}
|
15
|
+
|
16
|
+
tests {
|
17
|
+
test "Шупља Стена", "Šuplja Stena"
|
18
|
+
test "Чукарица", "Čukarica"
|
19
|
+
test "Црна Трава", "Crna Trava"
|
20
|
+
test "Херцег Нови", "Herceg Novi"
|
21
|
+
test "Улцињ", "Ulcinj"
|
22
|
+
test "Ужице", "Užice"
|
23
|
+
test "Тресаначка Река", "Tresanačka Reka"
|
24
|
+
test "Сјеница", "Sjenica"
|
25
|
+
test "Рожаје", "Rožaje"
|
26
|
+
test "Пљевља", "Pljevlja"
|
27
|
+
test "Оџаци", "Odžaci"
|
28
|
+
test "Никшић", "Nikšić"
|
29
|
+
test "Медвеђа", "Medveđa"
|
30
|
+
test "Лозница", "Loznica"
|
31
|
+
test "Књажевац", "Knjaževac"
|
32
|
+
test "Зрењанин", "Zrenjanin"
|
33
|
+
test "Житорађа", "Žitorađa"
|
34
|
+
test "Ервеник", "Ervenik"
|
35
|
+
test "Доње Љупче", "Donje Ljupče"
|
36
|
+
test "Гусиње", "Gusinje"
|
37
|
+
test "ГУСИЊЕ", "GUSINJE"
|
38
|
+
test "Врњачка Бања", "Vrnjačka Banja"
|
39
|
+
test "Бијело Поље", "Bijelo Polje"
|
40
|
+
test "Алибунар", "Alibunar"
|
41
|
+
}
|
42
|
+
|
43
|
+
dependency "alalc-srp-Cyrl-Latn-2013", as: srpalatn
|
44
|
+
|
45
|
+
stage {
|
46
|
+
run map.srpalatn.stage.main
|
47
|
+
}
|