interscript-maps 2.2.0 → 2.2.1

Sign up to get free protection for your applications and to get access to all the features.
Files changed (192) hide show
  1. checksums.yaml +4 -4
  2. data/interscript-maps.gemspec +1 -1
  3. data/interscript-maps.yaml +300 -111
  4. data/maps/acadsin-zho-Hani-Latn-2002.imp +2 -2
  5. data/maps/alalc-amh-Ethi-Latn-1997.imp +18 -14
  6. data/maps/alalc-amh-Ethi-Latn-2011.imp +1 -1
  7. data/maps/alalc-ara-Arab-Latn-1997.imp +1 -1
  8. data/maps/alalc-asm-Deva-Latn-1997.imp +1 -1
  9. data/maps/alalc-asm-Deva-Latn-2012.imp +1 -1
  10. data/maps/alalc-aze-Arab-Latn-1997.imp +1 -1
  11. data/maps/alalc-aze-Cyrl-Latn-1997.imp +1 -1
  12. data/maps/alalc-bel-Cyrl-Latn-1997.imp +4 -4
  13. data/maps/alalc-ben-Beng-Latn-1997.imp +1 -1
  14. data/maps/alalc-ben-Beng-Latn-2017.imp +1 -1
  15. data/maps/alalc-bul-Cyrl-Latn-1997.imp +1 -1
  16. data/maps/alalc-div-Thaa-Latn-1997.imp +1 -1
  17. data/maps/alalc-ell-Grek-Latn-1997.imp +1 -1
  18. data/maps/alalc-ell-Grek-Latn-2010.imp +1 -1
  19. data/maps/alalc-guj-Gujr-Latn-1997.imp +1 -1
  20. data/maps/alalc-guj-Gujr-Latn-2011.imp +1 -1
  21. data/maps/alalc-hin-Deva-Latn-1997.imp +1 -1
  22. data/maps/alalc-hin-Deva-Latn-2011.imp +1 -1
  23. data/maps/alalc-kan-Kana-Latn-1997.imp +1 -1
  24. data/maps/alalc-kan-Kana-Latn-2011.imp +1 -1
  25. data/maps/alalc-kat-Geok-Latn-1997.imp +3 -3
  26. data/maps/alalc-kat-Geor-Latn-1997.imp +12 -12
  27. data/maps/alalc-kor-Hang-Latn-1997.imp +1 -1
  28. data/maps/alalc-mal-Mlym-Latn-1997.imp +1 -1
  29. data/maps/alalc-mar-Deva-Latn-1997.imp +1 -1
  30. data/maps/alalc-mar-Deva-Latn-2011.imp +1 -1
  31. data/maps/alalc-mkd-Cyrl-Latn-1997.imp +2 -2
  32. data/maps/alalc-mkd-Cyrl-Latn-2013.imp +2 -2
  33. data/maps/alalc-mon-Cyrl-Latn-1997.imp +3 -3
  34. data/maps/alalc-ori-Orya-Latn-1997.imp +1 -1
  35. data/maps/alalc-ori-Orya-Latn-2011.imp +1 -1
  36. data/maps/alalc-pan-Guru-Latn-1997.imp +1 -1
  37. data/maps/alalc-pan-Guru-Latn-2011.imp +1 -1
  38. data/maps/alalc-per-Arab-Latn-1997.imp +1 -1
  39. data/maps/alalc-pli-Deva-Latn-2012.imp +1 -1
  40. data/maps/alalc-pra-Deva-Latn-2012.imp +1 -1
  41. data/maps/alalc-rus-Cyrl-Latn-1997.imp +2 -2
  42. data/maps/alalc-rus-Cyrl-Latn-2012.imp +1 -1
  43. data/maps/alalc-san-Deva-Latn-2012.imp +1 -1
  44. data/maps/alalc-sin-Sinh-Latn-1997.imp +1 -1
  45. data/maps/alalc-sin-Sinh-Latn-2011.imp +1 -1
  46. data/maps/alalc-srp-Cyrl-Latn-1997.imp +2 -2
  47. data/maps/alalc-srp-Cyrl-Latn-2013.imp +1 -1
  48. data/maps/alalc-tam-Taml-Latn-1997.imp +1 -1
  49. data/maps/alalc-tam-Taml-Latn-2011.imp +1 -1
  50. data/maps/alalc-tel-Telu-Latn-1997.imp +2 -2
  51. data/maps/alalc-tel-Telu-Latn-2011.imp +1 -1
  52. data/maps/alalc-tir-Ethi-Latn-1997.imp +429 -0
  53. data/maps/alalc-tir-Ethi-Latn-2011.imp +85 -0
  54. data/maps/alalc-ukr-Cyrl-Latn-1997.imp +1 -1
  55. data/maps/alalc-ukr-Cyrl-Latn-2011.imp +1 -1
  56. data/maps/apcbg-bul-Cyrl-Latn-1995.imp +7 -4
  57. data/maps/az-aze-Cyrl-Latn-1939.imp +1 -0
  58. data/maps/az-aze-Cyrl-Latn-1958.imp +1 -0
  59. data/maps/bgn-jpn-Hrkt-Latn-1962.imp +5 -5
  60. data/maps/bgn-kor-Hang-Latn-1943.imp +1 -1
  61. data/maps/bgn-kor-Kore-Latn-1943.imp +1 -1
  62. data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +11 -11
  63. data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +1 -1
  64. data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +2 -2
  65. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +2 -2
  66. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +10 -4
  67. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +1 -1
  68. data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +1 -1
  69. data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +4 -4
  70. data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +1 -1
  71. data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +1 -1
  72. data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +1 -1
  73. data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +4 -3
  74. data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +1 -1
  75. data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +1 -1
  76. data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +2 -2
  77. data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +1 -1
  78. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +1 -1
  79. data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +8 -8
  80. data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +2 -2
  81. data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +4 -4
  82. data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +3 -3
  83. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +1 -1
  84. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +4 -4
  85. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +4 -3
  86. data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +1 -1
  87. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +2 -2
  88. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +1 -1
  89. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +3 -3
  90. data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +4 -4
  91. data/maps/bgnpcgn-per-Arab-Latn-1958.imp +19 -19
  92. data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +15 -15
  93. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +15 -15
  94. data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +16 -16
  95. data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +2 -2
  96. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +5 -5
  97. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +1 -1
  98. data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +1 -1
  99. data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +5 -3
  100. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +1 -1
  101. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +1 -1
  102. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +1 -1
  103. data/maps/bgnpcgn-tir-Ethi-Latn-2007.imp +511 -0
  104. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +1 -1
  105. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +1 -1
  106. data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +15 -15
  107. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +3 -3
  108. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +1 -1
  109. data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +1 -1
  110. data/maps/by-bel-Cyrl-Latn-2007.imp +7 -5
  111. data/maps/dos-nep-Deva-Latn-1997.imp +2 -2
  112. data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +1 -1
  113. data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +1 -1
  114. data/maps/ggg-kat-Geor-Latn-2002.imp +3 -3
  115. data/maps/gki-bel-Cyrl-Latn-2000.imp +1 -1
  116. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +1 -1
  117. data/maps/iso-ara-Arab-Latn-233-1984.imp +14 -14
  118. data/maps/iso-ben-Beng-Latn-15919-2001.imp +1 -1
  119. data/maps/iso-prs-Arab-Latn-233-3-1999.imp +14 -14
  120. data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +5 -5
  121. data/maps/mext-jpn-Hrkt-Latn-1954.imp +2 -1
  122. data/maps/moct-kor-Hang-Latn-2000.imp +1 -1
  123. data/maps/mofa-jpn-Hrkt-Latn-1989.imp +1 -1
  124. data/maps/mv-div-Thaa-Latn-1987.imp +1 -1
  125. data/maps/mvd-bel-Cyrl-Latn-2008.imp +5 -5
  126. data/maps/mvd-bel-Cyrl-Latn-2010.imp +2 -5
  127. data/maps/mvd-rus-Cyrl-Latn-2008.imp +4 -3
  128. data/maps/mvd-rus-Cyrl-Latn-2010.imp +2 -5
  129. data/maps/odni-ara-Arab-Latn-2004.imp +1 -1
  130. data/maps/odni-ara-Arab-Latn-2015.imp +1 -1
  131. data/maps/odni-aze-Cyrl-Latn-2015.imp +1 -1
  132. data/maps/odni-bel-Cyrl-Latn-2015.imp +1 -1
  133. data/maps/odni-bul-Cyrl-Latn-2005.imp +2 -2
  134. data/maps/odni-bul-Cyrl-Latn-2015.imp +1 -1
  135. data/maps/odni-che-Cyrl-Latn-2015.imp +1 -1
  136. data/maps/odni-fas-Arab-Latn-2004.imp +14 -14
  137. data/maps/odni-fas-Arab-Latn-2015.imp +15 -15
  138. data/maps/odni-hin-Deva-Latn-2004.imp +20 -20
  139. data/maps/odni-hin-Deva-Latn-2015.imp +25 -26
  140. data/maps/odni-kat-Geor-Latn-2015.imp +2 -3
  141. data/maps/odni-kaz-Cyrl-Latn-2015.imp +1 -1
  142. data/maps/odni-kir-Cyrl-Latn-2015.imp +1 -1
  143. data/maps/odni-kor-Hang-Latn-2015.imp +1 -1
  144. data/maps/odni-mkd-Cyrl-Latn-2005.imp +1 -1
  145. data/maps/odni-mkd-Cyrl-Latn-2015.imp +1 -1
  146. data/maps/odni-prs-Arab-Latn-2015.imp +1 -1
  147. data/maps/odni-pus-Arab-Latn-2011.imp +1 -1
  148. data/maps/odni-rus-Cyrl-Latn-2015.imp +1 -1
  149. data/maps/odni-srp-Cyrl-Latn-2005.imp +2 -2
  150. data/maps/odni-srp-Cyrl-Latn-2015.imp +8 -8
  151. data/maps/odni-tat-Cyrl-Latn-2015.imp +1 -1
  152. data/maps/odni-tgk-Cyrl-Latn-2015.imp +1 -1
  153. data/maps/odni-tuk-Cyrl-Latn-2015.imp +1 -1
  154. data/maps/odni-uig-Cyrl-Latn-2015.imp +1 -1
  155. data/maps/odni-ukr-Cyrl-Latn-2015.imp +1 -1
  156. data/maps/odni-urd-Arab-Latn-2015.imp +21 -21
  157. data/maps/odni-uzb-Cyrl-Latn-2015.imp +1 -1
  158. data/maps/ses-ara-Arab-Latn-1930.imp +14 -14
  159. data/maps/un-amh-Ethi-Latn-2016.imp +1 -1
  160. data/maps/un-ara-Arab-Latn-1971.imp +5 -5
  161. data/maps/un-ara-Arab-Latn-1972.imp +4 -4
  162. data/maps/un-ara-Arab-Latn-2017.imp +15 -15
  163. data/maps/un-asm-Beng-Latn-1972.imp +1 -1
  164. data/maps/un-bel-Cyrl-Latn-2007.imp +2 -2
  165. data/maps/un-ben-Beng-Latn-2016.imp +1 -1
  166. data/maps/un-bul-Cyrl-Latn-1977.imp +197 -0
  167. data/maps/un-ell-Grek-Latn-1987-phonetic.imp +5 -1
  168. data/maps/un-ell-Grek-Latn-1987-tl.imp +1 -1
  169. data/maps/un-ell-Grek-Latn-1987-ts.imp +2 -2
  170. data/maps/un-guj-Gujr-Latn-1972.imp +1 -1
  171. data/maps/un-hin-Deva-Latn-2016.imp +1 -1
  172. data/maps/un-kan-Kana-Latn-2016.imp +1 -1
  173. data/maps/un-mal-Mlym-Latn-1972.imp +1 -1
  174. data/maps/un-mar-Deva-Latn-2016.imp +1 -1
  175. data/maps/un-mkd-Cyrl-Latn-1977.imp +119 -0
  176. data/maps/un-mon-Mong-Latn-general-2013.imp +1 -1
  177. data/maps/un-mon-Mong-Latn-phonetic-2013.imp +1 -1
  178. data/maps/un-nep-Deva-Latn-1972.imp +1 -1
  179. data/maps/un-nep-Deva-Latn-2013.imp +1 -1
  180. data/maps/un-ori-Orya-Latn-1972.imp +1 -1
  181. data/maps/un-pan-Guru-Latn-1972.imp +1 -1
  182. data/maps/un-prs-Arab-Latn-1967.imp +15 -15
  183. data/maps/un-rus-Cyrl-Latn-1987.imp +1 -1
  184. data/maps/un-sin-Sinh-Latn-1972.imp +1 -1
  185. data/maps/un-srp-Cyrl-Latn-1997.imp +47 -0
  186. data/maps/un-tam-Taml-Latn-1972.imp +1 -1
  187. data/maps/un-tel-Telu-Latn-1972.imp +1 -1
  188. data/maps/un-ukr-Cyrl-Latn-1998.imp +1 -1
  189. data/maps/un-ukr-Cyrl-Latn-2012.imp +1 -1
  190. data/maps/un-urd-Arab-Latn-1972.imp +15 -15
  191. data/maps/var-amh-Ethi-Latn-eae-2003.imp +48 -43
  192. metadata +7 -1
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:ara
5
5
  source_script: Arab
6
6
  destination_script: Latn
7
- name: ROMANIZATION OF ARABIC -- UNGEGN 2017 System
7
+ name: Romanization of Arabic -- UNGEGN (2017)
8
8
  url: http://www.eki.ee/wgrs/rom1_ar.pdf
9
9
  creation_date: 2017
10
10
  confirmation_date: 2018-06
@@ -141,20 +141,20 @@ stage {
141
141
  # (B) Marks doubling of the consonant.
142
142
 
143
143
  # Sun letters
144
- sub boundary + "\u0627\u0644\u062a", "at t" # الت
145
- sub boundary + "\u0627\u0644\u062b", "ath th" # الث
146
- sub boundary + "\u0627\u0644\u062f", "ad d" # الد
147
- sub boundary + "\u0627\u0644\u0630", "adh dh" # الذ
148
- sub boundary + "\u0627\u0644\u0631", "ar r" # الر
149
- sub boundary + "\u0627\u0644\u0632", "az z" # الز
150
- sub boundary + "\u0627\u0644\u0633", "as s" # الس
151
- sub boundary + "\u0627\u0644\u0634", "ash sh" # الش
152
- sub boundary + "\u0627\u0644\u0635", "as̱ s̱" # الص
153
- sub boundary + "\u0627\u0644\u0636", "aḏ ḏ" # الض
154
- sub boundary + "\u0627\u0644\u0637", "aṯ ṯ" # الط
155
- sub boundary + "\u0627\u0644\u0638", "ad͟h d͟h" # الظ
156
- sub boundary + "\u0627\u0644\u0644", "al l" # الل
157
- sub boundary + "\u0627\u0644\u0646", "an n" # الن
144
+ sub boundary + "\u0627\u0644\u062a" + maybe("\u0651"), "at t" # الت
145
+ sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), "ath th" # الث
146
+ sub boundary + "\u0627\u0644\u062f" + maybe("\u0651"), "ad d" # الد
147
+ sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), "adh dh" # الذ
148
+ sub boundary + "\u0627\u0644\u0631" + maybe("\u0651"), "ar r" # الر
149
+ sub boundary + "\u0627\u0644\u0632" + maybe("\u0651"), "az z" # الز
150
+ sub boundary + "\u0627\u0644\u0633" + maybe("\u0651"), "as s" # الس
151
+ sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "ash sh" # الش
152
+ sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "as̱ s̱" # الص
153
+ sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "aḏ ḏ" # الض
154
+ sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "aṯ ṯ" # الط
155
+ sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), "ad͟h d͟h" # الظ
156
+ sub boundary + "\u0627\u0644\u0644" + maybe("\u0651"), "al l" # الل
157
+ sub boundary + "\u0627\u0644\u0646" + maybe("\u0651"), "an n" # الن
158
158
 
159
159
  # TODO: shorten this fragment
160
160
  # ta' marboota
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:asm
5
5
  source_script: Beng
6
6
  destination_script: Latn
7
- name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Assamese Romanization, Version 4.0
7
+ name: Romanization of Assamese -- UNGEGN 4.0
8
8
  url: https://www.eki.ee/wgrs/rom1_as.htm
9
9
  creation_date: 1972
10
10
  confirmation_date: 2016
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:bel
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: National System of Geographic Names Transmission into Roman Alphabet in Belarus
7
+ name: Romanization of Belarusian geographic names (2007)
8
8
  url: https://unstats.un.org/unsd/geoinfo/UNGEGN/docs/9th-uncsgn-docs/crp/9th_UNCSGN_e-conf-98-crp-21.pdf
9
9
  creation_date: 2007
10
10
  description: |
@@ -16,7 +16,7 @@ metadata {
16
16
  Republic of Belarus in letters of the Latin alphabet
17
17
 
18
18
  Based on the Regulation on the State Property Committee of the Republic of Belarus,
19
- approved by the Decree of the Council of Ministers of the Republic of Belarusdated July 29, 2006
19
+ approved by the Decree of the Council of Ministers of the Republic of Belarus dated July 29, 2006
20
20
  No. 958 "Issues of the State Committee on Property of the Republic of Belarus"
21
21
  }
22
22
 
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:ben
5
5
  source_script: Beng
6
6
  destination_script: Latn
7
- name: Bengali Romanization, Version 4.0
7
+ name: Romanization of Bengali -- UNGEGN 4.0
8
8
  url: http://www.eki.ee/wgrs/rom1_bn.htm
9
9
  creation_date: 2016
10
10
  description: |
@@ -0,0 +1,197 @@
1
+ metadata {
2
+ authority_id: un
3
+ id: 1977
4
+ language: iso-639-2:bul
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: Romanization of Bulgarian geographical names (1977)
8
+ url: https://www.eki.ee/wgrs/res/res_3_10.htm
9
+ creation_date: 1977
10
+ description: |
11
+ The resolution recommends that the System of Transliteration and Transcription of Bulgarian Geographical Names into Roman letters,
12
+ as shown in the annex below, be adopted as the international system for the romanization of Bulgarian geographical names.
13
+ }
14
+
15
+ tests {
16
+ test "нунатак Абрит", "nunatak Abrit"
17
+ test "връх Академия", "vrǎh Akademiya"
18
+ test "връх Ами Буе", "vrǎh Ami Bue"
19
+ test "нос Айтос", "nos Ajtos"
20
+ test "залив Баба Тонка", "zaliv Baba Tonka"
21
+ test "Балабански камък", "Balabanski kamǎk"
22
+ test "Бедечки поток", "Bedečki potok"
23
+ test "нос Бяга БЯГА", "nos Byaga BYAGA"
24
+ test "остров Качо", "ostrov Kačo" # wiki ostrov Cacho
25
+ test "Чакъров остров", "Čakǎrov ostrov"
26
+ test "връх Дъбник", "vrǎh Dǎbnik"
27
+ test "залив Десислава", "zaliv Desislava"
28
+ test "ледник Джераси", "lednik Džerasi"
29
+ test "Джегова скала", "Džegova skala"
30
+ test "Нунатак Едуард", "Nunatak Eduard"
31
+ test "Елховска седловина", "Elhovska sedlovina"
32
+ test "ледник Етър", "lednik Etǎr"
33
+ test "нунатак Филип Тотю", "nunatak Filip Totyu"
34
+ test "ледник Габаре", "lednik Gabare"
35
+ test "риф Гергини", "rif Gergini"
36
+ test "Гяуров връх", "Gyaurov vrǎh"
37
+ test "Гуцалски рид", "Gucalski rid" # not found
38
+ test "Хараламбиев остров", "Haralambiev ostrov"
39
+ test "връх Ичера", "vrǎh Ičera"
40
+ test "полуостров Йоан Павел II", "poluostrov Joan Pavel II"
41
+ test "нос Иван Александър", "nos Ivan Aleksandǎr"
42
+ test "нос Иречек", "nos Ireček"
43
+ test "нос Кърджали", "nos Kǎrdžali"
44
+ test "седловина Кърнаре", "sedlovina Kǎrnare"
45
+ test "нунатак Керсеблепт", "nunatak Kerseblept"
46
+ test "Кондофрейски възвишения", "Kondofrejski vǎzvišeniya"
47
+ test "Костинбродски проход", "Kostinbrodski prohod"
48
+ test "връх Кожух", "vrǎh Kožuh"
49
+ test "Кукерски нунатаци", "Kukerski nunataci"
50
+ test "залив Лазурен бряг", "zaliv Lazuren bryag"
51
+ test "връх Лудогорие", "vrǎh Ludogorie"
52
+ test "Лютибродски скали", "Lyutibrodski skali"
53
+ test "Масларов нунатак", "Maslarov nunatak"
54
+ test "Михневски връх", "Mihnevski vrǎh"
55
+ test "рид Митино", "rid Mitino"
56
+ test "езеро Наяда", "ezero Nayada"
57
+ test "нос Никюп НИКЮП", "nos Nikyup NIKYUP"
58
+ test "рид Оборище ОБОРИЩЕ", "rid Oborište OBORIŠTE"
59
+ test "залив Олуша", "zaliv Oluša"
60
+ test "Оряховски възвишения", "Oryahovski vǎzvišeniya"
61
+ test "нунатак Памидово", "nunatak Pamidovo"
62
+ test "връх Парангалица", "vrǎh Parangalica"
63
+ test "Първомайски провлак", "Pǎrvomajski provlak"
64
+ test "ледник Патлейна", "lednik Patlejna"
65
+ test "полуостров Перник", "poluostrov Pernik"
66
+ test "връх Петко Войвода", "vrǎh Petko Vojvoda"
67
+ test "остров Фанагория", "ostrov Fanagoriya"
68
+ test "нос Плас", "nos Plas"
69
+ test "Пресиянов рид", "Presiyanov rid"
70
+ test "връх Принсипе де Астуриас", "vrǎh Prinsipe de Asturias" # wiki: vrǎh Príncipe de Asturias
71
+ test "нунатак Ръченица", "nunatak Rǎčenica"
72
+ test "връх Райна Княгиня", "vrǎh Rajna Knyaginya"
73
+ test "Рид Ръжана", "Rid Rǎžana"
74
+ test "връх Ригс", "vrǎh Rigs"
75
+ test "остров Рогулят", "ostrov Rogulyat"
76
+ test "ледник Сабазий", "lednik Sabazij"
77
+ test "ледник Съединение", "lednik Sǎedinenie"
78
+ test "нунатак Сенокос", "nunatak Senokos"
79
+ test "Сейдолски камък", "Sejdolski kamǎk"
80
+ test "ледник Щерна", "lednik Šterna"
81
+ test "връх Шишман", "vrǎh Šišman"
82
+ test "ледник Сигмен", "lednik Sigmen"
83
+ test "Седловина Синитово", "Sedlovina Sinitovo"
84
+ test "Ледник Скаплизо", "Lednik Skaplizo"
85
+ test "залив Слънчев бряг", "zaliv Slǎnčev bryag"
86
+ test "остров Соатрис", "ostrov Soatris"
87
+ test "планина Софийски Университет", "planina Sofijski Universitet"
88
+ test "ледник Сребърна", "lednik Srebǎrna"
89
+ test "Средногорски възвишения", "Srednogorski vǎzvišeniya"
90
+ test "Св. Евтимиев камък", "Sv. Evtimiev kamǎk"
91
+ test "база Св. Климент Охридски", "baza Sv. Kliment Ohridski"
92
+ test "връх Стъргел", "vrǎh Stǎrgel"
93
+ test "нунатак Сторгозия", "nunatak Storgoziya" # nunatak Storgozia according to wiki
94
+ test "нунатак Сурвакари", "nunatak Survakari"
95
+ test "ледник Световрачене", "lednik Svetovračene"
96
+ test "остров Теменуга", "ostrov Temenuga"
97
+ test "Тракийски възвишения", "Trakijski vǎzvišeniya"
98
+ test "хълм Цамблак", "hǎlm Camblak"
99
+ test "ледник Урдовиза", "lednik Urdoviza"
100
+ test "остров Вълчедръм", "ostrov Vǎlčedrǎm"
101
+ test "острови Вардим", "ostrovi Vardim"
102
+ test "Владигеров проток", "Vladigerov protok"
103
+ test "ледник Ябланица", "lednik Yablanica"
104
+ test "залив Ямфорина", "zaliv Yamforina"
105
+ test "Йовков нос", "Jovkov nos"
106
+ test "рид Заберново", "rid Zabernovo"
107
+ test "ледник Збелсурд", "lednik Zbelsurd"
108
+ test "Жефарович камък", "Žefarovič kamǎk"
109
+ test "връх Зиези", "vrǎh Ziezi"
110
+ test "залив Златни пясъци", "zaliv Zlatni pyasǎci"
111
+ test "ледник Злокучене", "lednik Zlokučene"
112
+ test "проток Злогош", "protok Zlogoš"
113
+ }
114
+
115
+ dependency "posix", import: true
116
+
117
+ stage {
118
+
119
+ # CHARACTERS
120
+ parallel {
121
+ sub "А", "A"
122
+ sub "Б", "B"
123
+ sub "В", "V"
124
+ sub "Г", "G"
125
+ sub "Д", "D"
126
+ sub "Е", "E"
127
+ sub "Ж", "Ž"
128
+ sub "З", "Z"
129
+ sub "И", "I"
130
+ sub "Й", "J"
131
+ sub "К", "K"
132
+ sub "Л", "L"
133
+ sub "М", "M"
134
+ sub "Н", "N"
135
+ sub "О", "O"
136
+ sub "П", "P"
137
+ sub "Р", "R"
138
+ sub "С", "S"
139
+ sub "Т", "T"
140
+ sub "У", "U"
141
+ sub "Ф", "F"
142
+ sub "Х", "H"
143
+ sub "Ц", "C"
144
+ sub "Ч", "Č"
145
+ sub "Ш", "Š"
146
+ sub "Щ", "Št"
147
+ sub "Ъ", "Ǎ"
148
+ sub "Ь", "J"
149
+ sub "Ю", "Yu"
150
+ sub "Я", "Ya"
151
+
152
+ sub "а", "a"
153
+ sub "б", "b"
154
+ sub "в", "v"
155
+ sub "г", "g"
156
+ sub "д", "d"
157
+ sub "е", "e"
158
+ sub "ж", "ž"
159
+ sub "з", "z"
160
+ sub "и", "i"
161
+ sub "й", "j"
162
+ sub "к", "k"
163
+ sub "л", "l"
164
+ sub "м", "m"
165
+ sub "н", "n"
166
+ sub "о", "o"
167
+ sub "п", "p"
168
+ sub "р", "r"
169
+ sub "с", "s"
170
+ sub "т", "t"
171
+ sub "у", "u"
172
+ sub "ф", "f"
173
+ sub "х", "h"
174
+ sub "ц", "c"
175
+ sub "ч", "č"
176
+ sub "ш", "š"
177
+ sub "щ", "št"
178
+ sub "ъ", "ǎ"
179
+ sub "ь", "j"
180
+ sub "ю", "yu"
181
+ sub "я", "ya"
182
+
183
+ }
184
+
185
+ # ŠT
186
+ sub capture(maybe(upper)) + "Št" + capture(upper), ref(1) + "ŠT" + ref(2)
187
+ sub capture(upper) + "Št" + capture(maybe(upper)), ref(1) + "ŠT" + ref(2)
188
+
189
+ # YU
190
+ sub capture(maybe(upper)) + "Yu" + capture(upper), ref(1) + "YU" + ref(2)
191
+ sub capture(upper) + "Yu" + capture(maybe(upper)), ref(1) + "YU" + ref(2)
192
+
193
+ # YA
194
+ sub capture(maybe(upper)) + "Ya" + capture(upper), ref(1) + "YA" + ref(2)
195
+ sub capture(upper) + "Ya" + capture(maybe(upper)), ref(1) + "YA" + ref(2)
196
+ }
197
+
@@ -4,12 +4,16 @@ metadata {
4
4
  language: iso-639-2:ell
5
5
  source_script: Grek
6
6
  destination_script: Latn
7
- name: UNGEGN Greek v1.0, Fifth United Nations Conference on the Standardization of Geographical Names. Writing Systems and Guides to Pronunciation Romanization > Conversion of the Greek alphabet into Latin characters. Paper submitted by Greece and Cyprus.
7
+ name: Romanization of Greek 1.0 (Phonetic transcription)
8
8
  url: http://www.eki.ee/wgrs/rom1_el.htm
9
9
  creation_date: 1987
10
10
  description: |
11
11
  UNGEGN Romanization table for Greek: Phonetic transcription
12
12
 
13
+ UNGEGN Greek v1.0, Fifth United Nations Conference on the Standardization of
14
+ Geographical Names. Writing Systems and Guides to Pronunciation Romanization
15
+ > Conversion of the Greek alphabet into Latin characters. Paper submitted by
16
+ Greece and Cyprus.
13
17
 
14
18
  notes:
15
19
  - Also included in ISO 843:1997, Annex B, Column 5, and ELOT 743:1982, column 5.
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:ell
5
5
  source_script: Grek
6
6
  destination_script: Latn
7
- name: UNGEGN Greek v4.0
7
+ name: Romanization of Greek -- UNGEGN 4.0 (transliteration)
8
8
  url: http://www.eki.ee/wgrs/rom1_el.htm
9
9
  creation_date: 1987
10
10
  description: |
@@ -1,10 +1,10 @@
1
1
  metadata {
2
2
  authority_id: un
3
- id: 1987-tl
3
+ id: 1987-ts
4
4
  language: iso-639-2:ell
5
5
  source_script: Grek
6
6
  destination_script: Latn
7
- name: UNGEGN Greek v4.0
7
+ name: Romanization of Greek -- UNGEGN 4.0 (transcription)
8
8
  url: http://www.eki.ee/wgrs/rom1_el.htm
9
9
  creation_date: 1987
10
10
  description: |
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:guj
5
5
  source_script: Gujr
6
6
  destination_script: Latn
7
- name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES --Gujarati Romanization Version 4.0
7
+ name: Romanization of Gujarati -- UNGEGN 4.0
8
8
  url: https://www.eki.ee/wgrs/rom1_gu.htm
9
9
  creation_date: 1972
10
10
  confirmation_date: 2016
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:hin
5
5
  source_script: Deva
6
6
  destination_script: Latn
7
- name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Hindi Romanization, 1972
7
+ name: Romanization of Hindi -- UNGEGN 4.0
8
8
  url: https://www.eki.ee/wgrs/rom1_hi.pdf
9
9
  creation_date: 1972
10
10
  confirmation_date: 2016
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:kan
5
5
  source_script: Kana
6
6
  destination_script: Latn
7
- name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Kannada Romanization, 1972
7
+ name: Romanization of Kannada -- UNGEGN 4.0
8
8
  url: https://www.eki.ee/wgrs/rom1_kn.pdf
9
9
  creation_date: 1972
10
10
  confirmation_date: 2016
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:mal
5
5
  source_script: Mlym
6
6
  destination_script: Latn
7
- name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES --Malayalam Romanization Version 4.0
7
+ name: Romanization of Malayalam -- UNGEGN 4.0
8
8
  url: https://www.eki.ee/wgrs/rom1_ml.htm
9
9
  creation_date: 1972
10
10
  confirmation_date: 2016
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:mar
5
5
  source_script: Deva
6
6
  destination_script: Latn
7
- name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Marathi Romanization, 1972
7
+ name: Romanization of Marathi -- UNGEGN 4.0
8
8
  url: https://www.eki.ee/wgrs/rom1_mr.pdf
9
9
  creation_date: 1972
10
10
  confirmation_date: 2016
@@ -0,0 +1,119 @@
1
+ metadata {
2
+ authority_id: un
3
+ id: 1977
4
+ language: iso-639-2:mkd
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: Romanization of Macedonian geographical names (1977)
8
+ url: https://www.eki.ee/wgrs/v2_2/rom1_mk.htm
9
+ creation_date: 1977
10
+ description: |
11
+ The United Nations recommended system was approved in 1977 (III/11), based on the romanization of the Serbo-Croatian and Macedonian Cyrillic alphabets that had long been employed in official gazetteers and maps of Yugoslavia. The table was published as an annex to the resolution (Third United Nations Conference on the Standardization of Geographical Names. Athens, 17 August - 7 September 1977. Vol. I. Report of the Conference, pp. 29, 31).
12
+ The system is used in The former Yugoslav Republic of Macedonia (see e.g. Report of The former Yugoslav Republic of Macedonia. Seventh United Nations Conference on the Standardization of Geographical Names. New York, 13-22 January 1998. Document E/CONF.91/CRP.23) and in international cartographic products.
13
+ The Cyrillic alphabet is used. The romanization table is unambiguous and can be applied automatically. The system is on the whole reversible with the exception of the characters ѓ and ќ. These are romanized as g and k, respectively, before е and и. But also г and к are occasionally used before е and и, so, for example, the name Makedonija is reconstituted as Македонија, not Маќедонија in the Cyrillic source script.
14
+ }
15
+
16
+ tests {
17
+ test "Маќедонија", "Makedonija"
18
+ test "Општина Ердут", "Opština Erdut"
19
+ test "Општина Двор", "Opština Dvor"
20
+ test "ЛУЃЕ луѓе", "LUGE luge"
21
+ test "ЅВЕЗДА ѕвезда Ѕвезда", "DZVEZDA dzvezda Dzvezda"
22
+ test "ЌАРУВАЊЕ ќарување", "ĆARUVANJE ćaruvanje"
23
+ }
24
+
25
+ dependency "posix", import: true
26
+
27
+ stage {
28
+ sub "Ѓ", "G", after: any("ЕИеи")
29
+ sub "ѓ", "g", after: any("ЕИеи")
30
+ sub "Ќ", "K", after: any("ЕИеи")
31
+ sub "ќ", "k", after: any("ЕИеи")
32
+
33
+ # CHARACTERS
34
+ parallel {
35
+ sub "А", "A"
36
+ sub "Б", "B"
37
+ sub "В", "V"
38
+ sub "Г", "G"
39
+ sub "Д", "D"
40
+ sub "Ѓ", "Đ" # Đ
41
+ sub "Е", "E"
42
+ sub "Ж", "Ž" # Ž
43
+ sub "З", "Z"
44
+ sub "Ѕ", "Dz"
45
+ sub "И", "I"
46
+ sub "Ј", "J"
47
+ sub "К", "K"
48
+ sub "Л", "L"
49
+ sub "Љ", "Lj"
50
+ sub "М", "M"
51
+ sub "Н", "N"
52
+ sub "Њ", "Nj"
53
+ sub "О", "O"
54
+ sub "П", "P"
55
+ sub "Р", "R"
56
+ sub "С", "S"
57
+ sub "Т", "T"
58
+ sub "Ќ", "Ć" # Ć
59
+ sub "У", "U"
60
+ sub "Ф", "F"
61
+ sub "Х", "H"
62
+ sub "Ц", "C"
63
+ sub "Ч", "Č" # Č
64
+ sub "Џ", "Dž" # Dž
65
+ sub "Ш", "Š" # Š
66
+ sub "а", "a"
67
+ sub "б", "b"
68
+ sub "в", "v"
69
+ sub "г", "g"
70
+ sub "д", "d"
71
+ sub "ѓ", "đ" # đ
72
+ sub "е", "e"
73
+ sub "ж", "ž" # ž
74
+ sub "з", "z"
75
+ sub "ѕ", "dz"
76
+ sub "и", "i"
77
+ sub "ј", "j"
78
+ sub "к", "k"
79
+ sub "л", "l"
80
+ sub "љ", "lj"
81
+ sub "м", "m"
82
+ sub "н", "n"
83
+ sub "њ", "nj"
84
+ sub "о", "o"
85
+ sub "п", "p"
86
+ sub "р", "r"
87
+ sub "с", "s"
88
+ sub "т", "t"
89
+ sub "ќ", "ć" # ć
90
+ sub "у", "u"
91
+ sub "ф", "f"
92
+ sub "х", "h"
93
+ sub "ц", "c"
94
+ sub "ч", "č" # č
95
+ sub "џ", "dž" # dž
96
+ sub "ш", "š" # š
97
+ }
98
+
99
+ # POSTRULES
100
+ # rewritten by hand to work properly
101
+ # DZ
102
+ sub capture(maybe(upper)) + "Dz" + capture(upper), ref(1) + "DZ" + ref(2)
103
+ sub capture(upper) + "Dz" + capture(maybe(upper)), ref(1) + "DZ" + ref(2)
104
+
105
+ #LJ
106
+ sub capture(upper) + "Lj" + capture(maybe(upper)), ref(1) + "LJ" + ref(2)
107
+ sub capture(maybe(upper)) + "Lj" + capture(upper), ref(1) + "LJ" + ref(2)
108
+
109
+ #NJ
110
+ sub capture(upper) + "Nj" + capture(maybe(upper)), ref(1) + "NJ" + ref(2)
111
+ sub capture(maybe(upper)) + "Nj" + capture(upper), ref(1) + "NJ" + ref(2)
112
+
113
+ #DŽ
114
+ sub capture(upper) + "Dž" + capture(maybe(upper)), ref(1) + "DŽ" + ref(2)
115
+ sub capture(maybe(upper)) + "Dž" + capture(upper), ref(1) + "DŽ" + ref(2)
116
+
117
+ compose
118
+ }
119
+