interscript-maps 2.2.0 → 2.2.1
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/interscript-maps.gemspec +1 -1
- data/interscript-maps.yaml +300 -111
- data/maps/acadsin-zho-Hani-Latn-2002.imp +2 -2
- data/maps/alalc-amh-Ethi-Latn-1997.imp +18 -14
- data/maps/alalc-amh-Ethi-Latn-2011.imp +1 -1
- data/maps/alalc-ara-Arab-Latn-1997.imp +1 -1
- data/maps/alalc-asm-Deva-Latn-1997.imp +1 -1
- data/maps/alalc-asm-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-aze-Arab-Latn-1997.imp +1 -1
- data/maps/alalc-aze-Cyrl-Latn-1997.imp +1 -1
- data/maps/alalc-bel-Cyrl-Latn-1997.imp +4 -4
- data/maps/alalc-ben-Beng-Latn-1997.imp +1 -1
- data/maps/alalc-ben-Beng-Latn-2017.imp +1 -1
- data/maps/alalc-bul-Cyrl-Latn-1997.imp +1 -1
- data/maps/alalc-div-Thaa-Latn-1997.imp +1 -1
- data/maps/alalc-ell-Grek-Latn-1997.imp +1 -1
- data/maps/alalc-ell-Grek-Latn-2010.imp +1 -1
- data/maps/alalc-guj-Gujr-Latn-1997.imp +1 -1
- data/maps/alalc-guj-Gujr-Latn-2011.imp +1 -1
- data/maps/alalc-hin-Deva-Latn-1997.imp +1 -1
- data/maps/alalc-hin-Deva-Latn-2011.imp +1 -1
- data/maps/alalc-kan-Kana-Latn-1997.imp +1 -1
- data/maps/alalc-kan-Kana-Latn-2011.imp +1 -1
- data/maps/alalc-kat-Geok-Latn-1997.imp +3 -3
- data/maps/alalc-kat-Geor-Latn-1997.imp +12 -12
- data/maps/alalc-kor-Hang-Latn-1997.imp +1 -1
- data/maps/alalc-mal-Mlym-Latn-1997.imp +1 -1
- data/maps/alalc-mar-Deva-Latn-1997.imp +1 -1
- data/maps/alalc-mar-Deva-Latn-2011.imp +1 -1
- data/maps/alalc-mkd-Cyrl-Latn-1997.imp +2 -2
- data/maps/alalc-mkd-Cyrl-Latn-2013.imp +2 -2
- data/maps/alalc-mon-Cyrl-Latn-1997.imp +3 -3
- data/maps/alalc-ori-Orya-Latn-1997.imp +1 -1
- data/maps/alalc-ori-Orya-Latn-2011.imp +1 -1
- data/maps/alalc-pan-Guru-Latn-1997.imp +1 -1
- data/maps/alalc-pan-Guru-Latn-2011.imp +1 -1
- data/maps/alalc-per-Arab-Latn-1997.imp +1 -1
- data/maps/alalc-pli-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-pra-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-rus-Cyrl-Latn-1997.imp +2 -2
- data/maps/alalc-rus-Cyrl-Latn-2012.imp +1 -1
- data/maps/alalc-san-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-sin-Sinh-Latn-1997.imp +1 -1
- data/maps/alalc-sin-Sinh-Latn-2011.imp +1 -1
- data/maps/alalc-srp-Cyrl-Latn-1997.imp +2 -2
- data/maps/alalc-srp-Cyrl-Latn-2013.imp +1 -1
- data/maps/alalc-tam-Taml-Latn-1997.imp +1 -1
- data/maps/alalc-tam-Taml-Latn-2011.imp +1 -1
- data/maps/alalc-tel-Telu-Latn-1997.imp +2 -2
- data/maps/alalc-tel-Telu-Latn-2011.imp +1 -1
- data/maps/alalc-tir-Ethi-Latn-1997.imp +429 -0
- data/maps/alalc-tir-Ethi-Latn-2011.imp +85 -0
- data/maps/alalc-ukr-Cyrl-Latn-1997.imp +1 -1
- data/maps/alalc-ukr-Cyrl-Latn-2011.imp +1 -1
- data/maps/apcbg-bul-Cyrl-Latn-1995.imp +7 -4
- data/maps/az-aze-Cyrl-Latn-1939.imp +1 -0
- data/maps/az-aze-Cyrl-Latn-1958.imp +1 -0
- data/maps/bgn-jpn-Hrkt-Latn-1962.imp +5 -5
- data/maps/bgn-kor-Hang-Latn-1943.imp +1 -1
- data/maps/bgn-kor-Kore-Latn-1943.imp +1 -1
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +11 -11
- data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +1 -1
- data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +2 -2
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +2 -2
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +10 -4
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +1 -1
- data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +1 -1
- data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +4 -4
- data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +1 -1
- data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +1 -1
- data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +1 -1
- data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +4 -3
- data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +1 -1
- data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +1 -1
- data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +2 -2
- data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +1 -1
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +1 -1
- data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +8 -8
- data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +2 -2
- data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +4 -4
- data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +3 -3
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +1 -1
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +4 -4
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +4 -3
- data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +1 -1
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +2 -2
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +1 -1
- data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +3 -3
- data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +4 -4
- data/maps/bgnpcgn-per-Arab-Latn-1958.imp +19 -19
- data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +15 -15
- data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +15 -15
- data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +16 -16
- data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +2 -2
- data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +5 -5
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +1 -1
- data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +1 -1
- data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +5 -3
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +1 -1
- data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +1 -1
- data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +1 -1
- data/maps/bgnpcgn-tir-Ethi-Latn-2007.imp +511 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +1 -1
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +1 -1
- data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +15 -15
- data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +3 -3
- data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +1 -1
- data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +1 -1
- data/maps/by-bel-Cyrl-Latn-2007.imp +7 -5
- data/maps/dos-nep-Deva-Latn-1997.imp +2 -2
- data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +1 -1
- data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +1 -1
- data/maps/ggg-kat-Geor-Latn-2002.imp +3 -3
- data/maps/gki-bel-Cyrl-Latn-2000.imp +1 -1
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +1 -1
- data/maps/iso-ara-Arab-Latn-233-1984.imp +14 -14
- data/maps/iso-ben-Beng-Latn-15919-2001.imp +1 -1
- data/maps/iso-prs-Arab-Latn-233-3-1999.imp +14 -14
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +5 -5
- data/maps/mext-jpn-Hrkt-Latn-1954.imp +2 -1
- data/maps/moct-kor-Hang-Latn-2000.imp +1 -1
- data/maps/mofa-jpn-Hrkt-Latn-1989.imp +1 -1
- data/maps/mv-div-Thaa-Latn-1987.imp +1 -1
- data/maps/mvd-bel-Cyrl-Latn-2008.imp +5 -5
- data/maps/mvd-bel-Cyrl-Latn-2010.imp +2 -5
- data/maps/mvd-rus-Cyrl-Latn-2008.imp +4 -3
- data/maps/mvd-rus-Cyrl-Latn-2010.imp +2 -5
- data/maps/odni-ara-Arab-Latn-2004.imp +1 -1
- data/maps/odni-ara-Arab-Latn-2015.imp +1 -1
- data/maps/odni-aze-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-bel-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-bul-Cyrl-Latn-2005.imp +2 -2
- data/maps/odni-bul-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-che-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-fas-Arab-Latn-2004.imp +14 -14
- data/maps/odni-fas-Arab-Latn-2015.imp +15 -15
- data/maps/odni-hin-Deva-Latn-2004.imp +20 -20
- data/maps/odni-hin-Deva-Latn-2015.imp +25 -26
- data/maps/odni-kat-Geor-Latn-2015.imp +2 -3
- data/maps/odni-kaz-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-kir-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-kor-Hang-Latn-2015.imp +1 -1
- data/maps/odni-mkd-Cyrl-Latn-2005.imp +1 -1
- data/maps/odni-mkd-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-prs-Arab-Latn-2015.imp +1 -1
- data/maps/odni-pus-Arab-Latn-2011.imp +1 -1
- data/maps/odni-rus-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-srp-Cyrl-Latn-2005.imp +2 -2
- data/maps/odni-srp-Cyrl-Latn-2015.imp +8 -8
- data/maps/odni-tat-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-tgk-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-tuk-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-uig-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-ukr-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-urd-Arab-Latn-2015.imp +21 -21
- data/maps/odni-uzb-Cyrl-Latn-2015.imp +1 -1
- data/maps/ses-ara-Arab-Latn-1930.imp +14 -14
- data/maps/un-amh-Ethi-Latn-2016.imp +1 -1
- data/maps/un-ara-Arab-Latn-1971.imp +5 -5
- data/maps/un-ara-Arab-Latn-1972.imp +4 -4
- data/maps/un-ara-Arab-Latn-2017.imp +15 -15
- data/maps/un-asm-Beng-Latn-1972.imp +1 -1
- data/maps/un-bel-Cyrl-Latn-2007.imp +2 -2
- data/maps/un-ben-Beng-Latn-2016.imp +1 -1
- data/maps/un-bul-Cyrl-Latn-1977.imp +197 -0
- data/maps/un-ell-Grek-Latn-1987-phonetic.imp +5 -1
- data/maps/un-ell-Grek-Latn-1987-tl.imp +1 -1
- data/maps/un-ell-Grek-Latn-1987-ts.imp +2 -2
- data/maps/un-guj-Gujr-Latn-1972.imp +1 -1
- data/maps/un-hin-Deva-Latn-2016.imp +1 -1
- data/maps/un-kan-Kana-Latn-2016.imp +1 -1
- data/maps/un-mal-Mlym-Latn-1972.imp +1 -1
- data/maps/un-mar-Deva-Latn-2016.imp +1 -1
- data/maps/un-mkd-Cyrl-Latn-1977.imp +119 -0
- data/maps/un-mon-Mong-Latn-general-2013.imp +1 -1
- data/maps/un-mon-Mong-Latn-phonetic-2013.imp +1 -1
- data/maps/un-nep-Deva-Latn-1972.imp +1 -1
- data/maps/un-nep-Deva-Latn-2013.imp +1 -1
- data/maps/un-ori-Orya-Latn-1972.imp +1 -1
- data/maps/un-pan-Guru-Latn-1972.imp +1 -1
- data/maps/un-prs-Arab-Latn-1967.imp +15 -15
- data/maps/un-rus-Cyrl-Latn-1987.imp +1 -1
- data/maps/un-sin-Sinh-Latn-1972.imp +1 -1
- data/maps/un-srp-Cyrl-Latn-1997.imp +47 -0
- data/maps/un-tam-Taml-Latn-1972.imp +1 -1
- data/maps/un-tel-Telu-Latn-1972.imp +1 -1
- data/maps/un-ukr-Cyrl-Latn-1998.imp +1 -1
- data/maps/un-ukr-Cyrl-Latn-2012.imp +1 -1
- data/maps/un-urd-Arab-Latn-1972.imp +15 -15
- data/maps/var-amh-Ethi-Latn-eae-2003.imp +48 -43
- metadata +7 -1
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:ara
|
5
5
|
source_script: Arab
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Arabic -- UNGEGN (2017)
|
8
8
|
url: http://www.eki.ee/wgrs/rom1_ar.pdf
|
9
9
|
creation_date: 2017
|
10
10
|
confirmation_date: 2018-06
|
@@ -141,20 +141,20 @@ stage {
|
|
141
141
|
# (B) Marks doubling of the consonant.
|
142
142
|
|
143
143
|
# Sun letters
|
144
|
-
sub boundary + "\u0627\u0644\u062a", "at t" # الت
|
145
|
-
sub boundary + "\u0627\u0644\u062b", "ath th" # الث
|
146
|
-
sub boundary + "\u0627\u0644\u062f", "ad d" # الد
|
147
|
-
sub boundary + "\u0627\u0644\u0630", "adh dh" # الذ
|
148
|
-
sub boundary + "\u0627\u0644\u0631", "ar r" # الر
|
149
|
-
sub boundary + "\u0627\u0644\u0632", "az z" # الز
|
150
|
-
sub boundary + "\u0627\u0644\u0633", "as s" # الس
|
151
|
-
sub boundary + "\u0627\u0644\u0634", "ash sh" # الش
|
152
|
-
sub boundary + "\u0627\u0644\u0635", "as̱ s̱" # الص
|
153
|
-
sub boundary + "\u0627\u0644\u0636", "aḏ ḏ" # الض
|
154
|
-
sub boundary + "\u0627\u0644\u0637", "aṯ ṯ" # الط
|
155
|
-
sub boundary + "\u0627\u0644\u0638", "ad͟h d͟h" # الظ
|
156
|
-
sub boundary + "\u0627\u0644\u0644", "al l" # الل
|
157
|
-
sub boundary + "\u0627\u0644\u0646", "an n" # الن
|
144
|
+
sub boundary + "\u0627\u0644\u062a" + maybe("\u0651"), "at t" # الت
|
145
|
+
sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), "ath th" # الث
|
146
|
+
sub boundary + "\u0627\u0644\u062f" + maybe("\u0651"), "ad d" # الد
|
147
|
+
sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), "adh dh" # الذ
|
148
|
+
sub boundary + "\u0627\u0644\u0631" + maybe("\u0651"), "ar r" # الر
|
149
|
+
sub boundary + "\u0627\u0644\u0632" + maybe("\u0651"), "az z" # الز
|
150
|
+
sub boundary + "\u0627\u0644\u0633" + maybe("\u0651"), "as s" # الس
|
151
|
+
sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "ash sh" # الش
|
152
|
+
sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "as̱ s̱" # الص
|
153
|
+
sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "aḏ ḏ" # الض
|
154
|
+
sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "aṯ ṯ" # الط
|
155
|
+
sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), "ad͟h d͟h" # الظ
|
156
|
+
sub boundary + "\u0627\u0644\u0644" + maybe("\u0651"), "al l" # الل
|
157
|
+
sub boundary + "\u0627\u0644\u0646" + maybe("\u0651"), "an n" # الن
|
158
158
|
|
159
159
|
# TODO: shorten this fragment
|
160
160
|
# ta' marboota
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:asm
|
5
5
|
source_script: Beng
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Assamese -- UNGEGN 4.0
|
8
8
|
url: https://www.eki.ee/wgrs/rom1_as.htm
|
9
9
|
creation_date: 1972
|
10
10
|
confirmation_date: 2016
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:bel
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Belarusian geographic names (2007)
|
8
8
|
url: https://unstats.un.org/unsd/geoinfo/UNGEGN/docs/9th-uncsgn-docs/crp/9th_UNCSGN_e-conf-98-crp-21.pdf
|
9
9
|
creation_date: 2007
|
10
10
|
description: |
|
@@ -16,7 +16,7 @@ metadata {
|
|
16
16
|
Republic of Belarus in letters of the Latin alphabet
|
17
17
|
|
18
18
|
Based on the Regulation on the State Property Committee of the Republic of Belarus,
|
19
|
-
approved by the Decree of the Council of Ministers of the Republic of
|
19
|
+
approved by the Decree of the Council of Ministers of the Republic of Belarus dated July 29, 2006
|
20
20
|
No. 958 "Issues of the State Committee on Property of the Republic of Belarus"
|
21
21
|
}
|
22
22
|
|
@@ -0,0 +1,197 @@
|
|
1
|
+
metadata {
|
2
|
+
authority_id: un
|
3
|
+
id: 1977
|
4
|
+
language: iso-639-2:bul
|
5
|
+
source_script: Cyrl
|
6
|
+
destination_script: Latn
|
7
|
+
name: Romanization of Bulgarian geographical names (1977)
|
8
|
+
url: https://www.eki.ee/wgrs/res/res_3_10.htm
|
9
|
+
creation_date: 1977
|
10
|
+
description: |
|
11
|
+
The System of Transliteration and Transcription of Bulgarian Geographical Names into Roman letters,
|
12
|
+
as shown in the annex below, is adopted as the international system for the romanization of Bulgarian geographical names.
|
13
|
+
}
|
14
|
+
|
15
|
+
tests {
|
16
|
+
test "нунатак Абрит", "nunatak Abrit"
|
17
|
+
test "връх Академия", "vrǎh Akademiya"
|
18
|
+
test "връх Ами Буе", "vrǎh Ami Bue"
|
19
|
+
test "нос Айтос", "nos Ajtos"
|
20
|
+
test "залив Баба Тонка", "zaliv Baba Tonka"
|
21
|
+
test "Балабански камък", "Balabanski kamǎk"
|
22
|
+
test "Бедечки поток", "Bedečki potok"
|
23
|
+
test "нос Бяга БЯГА", "nos Byaga BYAGA"
|
24
|
+
test "остров Качо", "ostrov Kačo" # wiki ostrov Cacho
|
25
|
+
test "Чакъров остров", "Čakǎrov ostrov"
|
26
|
+
test "връх Дъбник", "vrǎh Dǎbnik"
|
27
|
+
test "залив Десислава", "zaliv Desislava"
|
28
|
+
test "ледник Джераси", "lednik Džerasi"
|
29
|
+
test "Джегова скала", "Džegova skala"
|
30
|
+
test "Нунатак Едуард", "Nunatak Eduard"
|
31
|
+
test "Елховска седловина", "Elhovska sedlovina"
|
32
|
+
test "ледник Етър", "lednik Etǎr"
|
33
|
+
test "нунатак Филип Тотю", "nunatak Filip Totyu"
|
34
|
+
test "ледник Габаре", "lednik Gabare"
|
35
|
+
test "риф Гергини", "rif Gergini"
|
36
|
+
test "Гяуров връх", "Gyaurov vrǎh"
|
37
|
+
test "Гуцалски рид", "Gucalski rid" # not found
|
38
|
+
test "Хараламбиев остров", "Haralambiev ostrov"
|
39
|
+
test "връх Ичера", "vrǎh Ičera"
|
40
|
+
test "полуостров Йоан Павел II", "poluostrov Joan Pavel II"
|
41
|
+
test "нос Иван Александър", "nos Ivan Aleksandǎr"
|
42
|
+
test "нос Иречек", "nos Ireček"
|
43
|
+
test "нос Кърджали", "nos Kǎrdžali"
|
44
|
+
test "седловина Кърнаре", "sedlovina Kǎrnare"
|
45
|
+
test "нунатак Керсеблепт", "nunatak Kerseblept"
|
46
|
+
test "Кондофрейски възвишения", "Kondofrejski vǎzvišeniya"
|
47
|
+
test "Костинбродски проход", "Kostinbrodski prohod"
|
48
|
+
test "връх Кожух", "vrǎh Kožuh"
|
49
|
+
test "Кукерски нунатаци", "Kukerski nunataci"
|
50
|
+
test "залив Лазурен бряг", "zaliv Lazuren bryag"
|
51
|
+
test "връх Лудогорие", "vrǎh Ludogorie"
|
52
|
+
test "Лютибродски скали", "Lyutibrodski skali"
|
53
|
+
test "Масларов нунатак", "Maslarov nunatak"
|
54
|
+
test "Михневски връх", "Mihnevski vrǎh"
|
55
|
+
test "рид Митино", "rid Mitino"
|
56
|
+
test "езеро Наяда", "ezero Nayada"
|
57
|
+
test "нос Никюп НИКЮП", "nos Nikyup NIKYUP"
|
58
|
+
test "рид Оборище ОБОРИЩЕ", "rid Oborište OBORIŠTE"
|
59
|
+
test "залив Олуша", "zaliv Oluša"
|
60
|
+
test "Оряховски възвишения", "Oryahovski vǎzvišeniya"
|
61
|
+
test "нунатак Памидово", "nunatak Pamidovo"
|
62
|
+
test "връх Парангалица", "vrǎh Parangalica"
|
63
|
+
test "Първомайски провлак", "Pǎrvomajski provlak"
|
64
|
+
test "ледник Патлейна", "lednik Patlejna"
|
65
|
+
test "полуостров Перник", "poluostrov Pernik"
|
66
|
+
test "връх Петко Войвода", "vrǎh Petko Vojvoda"
|
67
|
+
test "остров Фанагория", "ostrov Fanagoriya"
|
68
|
+
test "нос Плас", "nos Plas"
|
69
|
+
test "Пресиянов рид", "Presiyanov rid"
|
70
|
+
test "връх Принсипе де Астуриас", "vrǎh Prinsipe de Asturias" # wiki: vrǎh Príncipe de Asturias
|
71
|
+
test "нунатак Ръченица", "nunatak Rǎčenica"
|
72
|
+
test "връх Райна Княгиня", "vrǎh Rajna Knyaginya"
|
73
|
+
test "Рид Ръжана", "Rid Rǎžana"
|
74
|
+
test "връх Ригс", "vrǎh Rigs"
|
75
|
+
test "остров Рогулят", "ostrov Rogulyat"
|
76
|
+
test "ледник Сабазий", "lednik Sabazij"
|
77
|
+
test "ледник Съединение", "lednik Sǎedinenie"
|
78
|
+
test "нунатак Сенокос", "nunatak Senokos"
|
79
|
+
test "Сейдолски камък", "Sejdolski kamǎk"
|
80
|
+
test "ледник Щерна", "lednik Šterna"
|
81
|
+
test "връх Шишман", "vrǎh Šišman"
|
82
|
+
test "ледник Сигмен", "lednik Sigmen"
|
83
|
+
test "Седловина Синитово", "Sedlovina Sinitovo"
|
84
|
+
test "Ледник Скаплизо", "Lednik Skaplizo"
|
85
|
+
test "залив Слънчев бряг", "zaliv Slǎnčev bryag"
|
86
|
+
test "остров Соатрис", "ostrov Soatris"
|
87
|
+
test "планина Софийски Университет", "planina Sofijski Universitet"
|
88
|
+
test "ледник Сребърна", "lednik Srebǎrna"
|
89
|
+
test "Средногорски възвишения", "Srednogorski vǎzvišeniya"
|
90
|
+
test "Св. Евтимиев камък", "Sv. Evtimiev kamǎk"
|
91
|
+
test "база Св. Климент Охридски", "baza Sv. Kliment Ohridski"
|
92
|
+
test "връх Стъргел", "vrǎh Stǎrgel"
|
93
|
+
test "нунатак Сторгозия", "nunatak Storgoziya" # nunatak Storgozia according to wiki
|
94
|
+
test "нунатак Сурвакари", "nunatak Survakari"
|
95
|
+
test "ледник Световрачене", "lednik Svetovračene"
|
96
|
+
test "остров Теменуга", "ostrov Temenuga"
|
97
|
+
test "Тракийски възвишения", "Trakijski vǎzvišeniya"
|
98
|
+
test "хълм Цамблак", "hǎlm Camblak"
|
99
|
+
test "ледник Урдовиза", "lednik Urdoviza"
|
100
|
+
test "остров Вълчедръм", "ostrov Vǎlčedrǎm"
|
101
|
+
test "острови Вардим", "ostrovi Vardim"
|
102
|
+
test "Владигеров проток", "Vladigerov protok"
|
103
|
+
test "ледник Ябланица", "lednik Yablanica"
|
104
|
+
test "залив Ямфорина", "zaliv Yamforina"
|
105
|
+
test "Йовков нос", "Jovkov nos"
|
106
|
+
test "рид Заберново", "rid Zabernovo"
|
107
|
+
test "ледник Збелсурд", "lednik Zbelsurd"
|
108
|
+
test "Жефарович камък", "Žefarovič kamǎk"
|
109
|
+
test "връх Зиези", "vrǎh Ziezi"
|
110
|
+
test "залив Златни пясъци", "zaliv Zlatni pyasǎci"
|
111
|
+
test "ледник Злокучене", "lednik Zlokučene"
|
112
|
+
test "проток Злогош", "protok Zlogoš"
|
113
|
+
}
|
114
|
+
|
115
|
+
dependency "posix", import: true
|
116
|
+
|
117
|
+
stage {
|
118
|
+
|
119
|
+
# CHARACTERS
|
120
|
+
parallel {
|
121
|
+
sub "А", "A"
|
122
|
+
sub "Б", "B"
|
123
|
+
sub "В", "V"
|
124
|
+
sub "Г", "G"
|
125
|
+
sub "Д", "D"
|
126
|
+
sub "Е", "E"
|
127
|
+
sub "Ж", "Ž"
|
128
|
+
sub "З", "Z"
|
129
|
+
sub "И", "I"
|
130
|
+
sub "Й", "J"
|
131
|
+
sub "К", "K"
|
132
|
+
sub "Л", "L"
|
133
|
+
sub "М", "M"
|
134
|
+
sub "Н", "N"
|
135
|
+
sub "О", "O"
|
136
|
+
sub "П", "P"
|
137
|
+
sub "Р", "R"
|
138
|
+
sub "С", "S"
|
139
|
+
sub "Т", "T"
|
140
|
+
sub "У", "U"
|
141
|
+
sub "Ф", "F"
|
142
|
+
sub "Х", "H"
|
143
|
+
sub "Ц", "C"
|
144
|
+
sub "Ч", "Č"
|
145
|
+
sub "Ш", "Š"
|
146
|
+
sub "Щ", "Št"
|
147
|
+
sub "Ъ", "Ǎ"
|
148
|
+
sub "Ь", "J"
|
149
|
+
sub "Ю", "Yu"
|
150
|
+
sub "Я", "Ya"
|
151
|
+
|
152
|
+
sub "а", "a"
|
153
|
+
sub "б", "b"
|
154
|
+
sub "в", "v"
|
155
|
+
sub "г", "g"
|
156
|
+
sub "д", "d"
|
157
|
+
sub "е", "e"
|
158
|
+
sub "ж", "ž"
|
159
|
+
sub "з", "z"
|
160
|
+
sub "и", "i"
|
161
|
+
sub "й", "j"
|
162
|
+
sub "к", "k"
|
163
|
+
sub "л", "l"
|
164
|
+
sub "м", "m"
|
165
|
+
sub "н", "n"
|
166
|
+
sub "о", "o"
|
167
|
+
sub "п", "p"
|
168
|
+
sub "р", "r"
|
169
|
+
sub "с", "s"
|
170
|
+
sub "т", "t"
|
171
|
+
sub "у", "u"
|
172
|
+
sub "ф", "f"
|
173
|
+
sub "х", "h"
|
174
|
+
sub "ц", "c"
|
175
|
+
sub "ч", "č"
|
176
|
+
sub "ш", "š"
|
177
|
+
sub "щ", "št"
|
178
|
+
sub "ъ", "ǎ"
|
179
|
+
sub "ь", "j"
|
180
|
+
sub "ю", "yu"
|
181
|
+
sub "я", "ya"
|
182
|
+
|
183
|
+
}
|
184
|
+
|
185
|
+
# ŠT
|
186
|
+
sub capture(maybe(upper)) + "Št" + capture(upper), ref(1) + "ŠT" + ref(2)
|
187
|
+
sub capture(upper) + "Št" + capture(maybe(upper)), ref(1) + "ŠT" + ref(2)
|
188
|
+
|
189
|
+
# YU
|
190
|
+
sub capture(maybe(upper)) + "Yu" + capture(upper), ref(1) + "YU" + ref(2)
|
191
|
+
sub capture(upper) + "Yu" + capture(maybe(upper)), ref(1) + "YU" + ref(2)
|
192
|
+
|
193
|
+
# YA
|
194
|
+
sub capture(maybe(upper)) + "Ya" + capture(upper), ref(1) + "YA" + ref(2)
|
195
|
+
sub capture(upper) + "Ya" + capture(maybe(upper)), ref(1) + "YA" + ref(2)
|
196
|
+
}
|
197
|
+
|
@@ -4,12 +4,16 @@ metadata {
|
|
4
4
|
language: iso-639-2:ell
|
5
5
|
source_script: Grek
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Greek 1.0 (Phonetic transcription)
|
8
8
|
url: http://www.eki.ee/wgrs/rom1_el.htm
|
9
9
|
creation_date: 1987
|
10
10
|
description: |
|
11
11
|
UNGEGN Romanization table for Greek: Phonetic transcription
|
12
12
|
|
13
|
+
UNGEGN Greek v1.0, Fifth United Nations Conference on the Standardization of
|
14
|
+
Geographical Names. Writing Systems and Guides to Pronunciation Romanization
|
15
|
+
> Conversion of the Greek alphabet into Latin characters. Paper submitted by
|
16
|
+
Greece and Cyprus.
|
13
17
|
|
14
18
|
notes:
|
15
19
|
- Also included in ISO 843:1997, Annex B, Column 5, and ELOT 743:1982, column 5.
|
@@ -1,10 +1,10 @@
|
|
1
1
|
metadata {
|
2
2
|
authority_id: un
|
3
|
-
id: 1987-
|
3
|
+
id: 1987-ts
|
4
4
|
language: iso-639-2:ell
|
5
5
|
source_script: Grek
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Greek -- UNGEGN 4.0 (transcription)
|
8
8
|
url: http://www.eki.ee/wgrs/rom1_el.htm
|
9
9
|
creation_date: 1987
|
10
10
|
description: |
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:guj
|
5
5
|
source_script: Gujr
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Gujarati -- UNGEGN 4.0
|
8
8
|
url: https://www.eki.ee/wgrs/rom1_gu.htm
|
9
9
|
creation_date: 1972
|
10
10
|
confirmation_date: 2016
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:hin
|
5
5
|
source_script: Deva
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Hindi -- UNGEGN 4.0
|
8
8
|
url: https://www.eki.ee/wgrs/rom1_hi.pdf
|
9
9
|
creation_date: 1972
|
10
10
|
confirmation_date: 2016
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:kan
|
5
5
|
source_script: Kana
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Kannada -- UNGEGN 4.0
|
8
8
|
url: https://www.eki.ee/wgrs/rom1_kn.pdf
|
9
9
|
creation_date: 1972
|
10
10
|
confirmation_date: 2016
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:mal
|
5
5
|
source_script: Mlym
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Malayalam -- UNGEGN 4.0
|
8
8
|
url: https://www.eki.ee/wgrs/rom1_ml.htm
|
9
9
|
creation_date: 1972
|
10
10
|
confirmation_date: 2016
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:mar
|
5
5
|
source_script: Deva
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Marathi -- UNGEGN 4.0
|
8
8
|
url: https://www.eki.ee/wgrs/rom1_mr.pdf
|
9
9
|
creation_date: 1972
|
10
10
|
confirmation_date: 2016
|
@@ -0,0 +1,119 @@
|
|
1
|
+
metadata {
|
2
|
+
authority_id: un
|
3
|
+
id: 1977
|
4
|
+
language: iso-639-2:mkd
|
5
|
+
source_script: Cyrl
|
6
|
+
destination_script: Latn
|
7
|
+
name: Romanization of Macedonian geographical names (1977)
|
8
|
+
url: https://www.eki.ee/wgrs/v2_2/rom1_mk.htm
|
9
|
+
creation_date: 1977
|
10
|
+
description: |
|
11
|
+
The United Nations recommended system was approved in 1977 (III/11), based on the romanization of the Serbo-Croatian and Macedonian Cyrillic alphabets that had long been employed in official gazetteers and maps of Yugoslavia. The table was published as an annex to the resolution (Third United Nations Conference on the Standardization of Geographical Names. Athens, 17 August - 7 September 1977. Vol. I. Report of the Conference, pp. 29, 31).
|
12
|
+
The system is used in The former Yugoslav Republic of Macedonia (see e.g. Report of The former Yugoslav Republic of Macedonia. Seventh United Nations Conference on the Standardization of Geographical Names. New York, 13-22 January 1998. Document E/CONF.91/CRP.23) and in international cartographic products.
|
13
|
+
The Cyrillic alphabet is used. The romanization table is unambiguous and can be applied automatically. The system is on the whole reversible with the exception of the characters ѓ and ќ. These are romanized as g and k, respectively, before е and и. But also г and к are occasionally used before е and и, so, for example, the name Makedonija is reconstituted as Македонија, not Маќедонија in the Cyrillic source script.
|
14
|
+
}
|
15
|
+
|
16
|
+
tests {
|
17
|
+
test "Маќедонија", "Makedonija"
|
18
|
+
test "Општина Ердут", "Opština Erdut"
|
19
|
+
test "Општина Двор", "Opština Dvor"
|
20
|
+
test "ЛУЃЕ луѓе", "LUGE luge"
|
21
|
+
test "ЅВЕЗДА ѕвезда Ѕвезда", "DZVEZDA dzvezda Dzvezda"
|
22
|
+
test "ЌАРУВАЊЕ ќарување", "ĆARUVANJE ćaruvanje"
|
23
|
+
}
|
24
|
+
|
25
|
+
dependency "posix", import: true
|
26
|
+
|
27
|
+
stage {
|
28
|
+
sub "Ѓ", "G", after: any("ЕИеи")
|
29
|
+
sub "ѓ", "g", after: any("ЕИеи")
|
30
|
+
sub "Ќ", "K", after: any("ЕИеи")
|
31
|
+
sub "ќ", "k", after: any("ЕИеи")
|
32
|
+
|
33
|
+
# CHARACTERS
|
34
|
+
parallel {
|
35
|
+
sub "А", "A"
|
36
|
+
sub "Б", "B"
|
37
|
+
sub "В", "V"
|
38
|
+
sub "Г", "G"
|
39
|
+
sub "Д", "D"
|
40
|
+
sub "Ѓ", "Đ" # Đ
|
41
|
+
sub "Е", "E"
|
42
|
+
sub "Ж", "Ž" # Ž
|
43
|
+
sub "З", "Z"
|
44
|
+
sub "Ѕ", "Dz"
|
45
|
+
sub "И", "I"
|
46
|
+
sub "Ј", "J"
|
47
|
+
sub "К", "K"
|
48
|
+
sub "Л", "L"
|
49
|
+
sub "Љ", "Lj"
|
50
|
+
sub "М", "M"
|
51
|
+
sub "Н", "N"
|
52
|
+
sub "Њ", "Nj"
|
53
|
+
sub "О", "O"
|
54
|
+
sub "П", "P"
|
55
|
+
sub "Р", "R"
|
56
|
+
sub "С", "S"
|
57
|
+
sub "Т", "T"
|
58
|
+
sub "Ќ", "Ć" # Ć
|
59
|
+
sub "У", "U"
|
60
|
+
sub "Ф", "F"
|
61
|
+
sub "Х", "H"
|
62
|
+
sub "Ц", "C"
|
63
|
+
sub "Ч", "Č" # Č
|
64
|
+
sub "Џ", "Dž" # Dž
|
65
|
+
sub "Ш", "Š" # Š
|
66
|
+
sub "а", "a"
|
67
|
+
sub "б", "b"
|
68
|
+
sub "в", "v"
|
69
|
+
sub "г", "g"
|
70
|
+
sub "д", "d"
|
71
|
+
sub "ѓ", "đ" # đ
|
72
|
+
sub "е", "e"
|
73
|
+
sub "ж", "ž" # ž
|
74
|
+
sub "з", "z"
|
75
|
+
sub "ѕ", "dz"
|
76
|
+
sub "и", "i"
|
77
|
+
sub "ј", "j"
|
78
|
+
sub "к", "k"
|
79
|
+
sub "л", "l"
|
80
|
+
sub "љ", "lj"
|
81
|
+
sub "м", "m"
|
82
|
+
sub "н", "n"
|
83
|
+
sub "њ", "nj"
|
84
|
+
sub "о", "o"
|
85
|
+
sub "п", "p"
|
86
|
+
sub "р", "r"
|
87
|
+
sub "с", "s"
|
88
|
+
sub "т", "t"
|
89
|
+
sub "ќ", "ć" # ć
|
90
|
+
sub "у", "u"
|
91
|
+
sub "ф", "f"
|
92
|
+
sub "х", "h"
|
93
|
+
sub "ц", "c"
|
94
|
+
sub "ч", "č" # č
|
95
|
+
sub "џ", "dž" # dž
|
96
|
+
sub "ш", "š" # š
|
97
|
+
}
|
98
|
+
|
99
|
+
# POSTRULES
|
100
|
+
# rewritten by hand to work properly
|
101
|
+
# DZ
|
102
|
+
sub capture(maybe(upper)) + "Dz" + capture(upper), ref(1) + "DZ" + ref(2)
|
103
|
+
sub capture(upper) + "Dz" + capture(maybe(upper)), ref(1) + "DZ" + ref(2)
|
104
|
+
|
105
|
+
#LJ
|
106
|
+
sub capture(upper) + "Lj" + capture(maybe(upper)), ref(1) + "LJ" + ref(2)
|
107
|
+
sub capture(maybe(upper)) + "Lj" + capture(upper), ref(1) + "LJ" + ref(2)
|
108
|
+
|
109
|
+
#NJ
|
110
|
+
sub capture(upper) + "Nj" + capture(maybe(upper)), ref(1) + "NJ" + ref(2)
|
111
|
+
sub capture(maybe(upper)) + "Nj" + capture(upper), ref(1) + "NJ" + ref(2)
|
112
|
+
|
113
|
+
#DŽ
|
114
|
+
sub capture(upper) + "Dž" + capture(maybe(upper)), ref(1) + "DŽ" + ref(2)
|
115
|
+
sub capture(maybe(upper)) + "Dž" + capture(upper), ref(1) + "DŽ" + ref(2)
|
116
|
+
|
117
|
+
compose
|
118
|
+
}
|
119
|
+
|