interscript-maps 2.1.0rc4 → 2.1.0

Sign up to get free protection for your applications and to get access to all the features.
Files changed (255) hide show
  1. checksums.yaml +4 -4
  2. data/interscript-maps.gemspec +1 -1
  3. data/interscript-maps.yaml +111 -326
  4. data/maps/acadsin-zho-Hani-Latn-2002.imp +2 -2
  5. data/maps/alalc-amh-Ethi-Latn-1997.imp +14 -18
  6. data/maps/alalc-amh-Ethi-Latn-2011.imp +1 -1
  7. data/maps/alalc-ara-Arab-Latn-1997.imp +1 -1
  8. data/maps/alalc-asm-Deva-Latn-1997.imp +1 -1
  9. data/maps/alalc-asm-Deva-Latn-2012.imp +1 -1
  10. data/maps/alalc-aze-Arab-Latn-1997.imp +1 -1
  11. data/maps/alalc-aze-Cyrl-Latn-1997.imp +1 -1
  12. data/maps/alalc-bel-Cyrl-Latn-1997.imp +4 -4
  13. data/maps/alalc-ben-Beng-Latn-1997.imp +1 -1
  14. data/maps/alalc-ben-Beng-Latn-2017.imp +1 -1
  15. data/maps/alalc-bul-Cyrl-Latn-1997.imp +1 -1
  16. data/maps/alalc-div-Thaa-Latn-1997.imp +1 -1
  17. data/maps/alalc-ell-Grek-Latn-1997.imp +1 -1
  18. data/maps/alalc-ell-Grek-Latn-2010.imp +1 -1
  19. data/maps/alalc-guj-Gujr-Latn-1997.imp +1 -1
  20. data/maps/alalc-guj-Gujr-Latn-2011.imp +1 -1
  21. data/maps/alalc-hin-Deva-Latn-1997.imp +1 -1
  22. data/maps/alalc-hin-Deva-Latn-2011.imp +1 -1
  23. data/maps/alalc-kan-Kana-Latn-1997.imp +1 -1
  24. data/maps/alalc-kan-Kana-Latn-2011.imp +1 -1
  25. data/maps/alalc-kat-Geok-Latn-1997.imp +3 -3
  26. data/maps/alalc-kat-Geor-Latn-1997.imp +12 -12
  27. data/maps/alalc-kor-Hang-Latn-1997.imp +1 -1
  28. data/maps/alalc-mal-Mlym-Latn-1997.imp +1 -1
  29. data/maps/alalc-mal-Mlym-Latn-2012.imp +1 -1
  30. data/maps/alalc-mar-Deva-Latn-1997.imp +1 -1
  31. data/maps/alalc-mar-Deva-Latn-2011.imp +1 -1
  32. data/maps/alalc-mkd-Cyrl-Latn-1997.imp +2 -2
  33. data/maps/alalc-mkd-Cyrl-Latn-2013.imp +2 -2
  34. data/maps/alalc-mon-Cyrl-Latn-1997.imp +3 -3
  35. data/maps/alalc-ori-Orya-Latn-1997.imp +1 -1
  36. data/maps/alalc-ori-Orya-Latn-2011.imp +1 -1
  37. data/maps/alalc-pan-Guru-Latn-1997.imp +1 -1
  38. data/maps/alalc-pan-Guru-Latn-2011.imp +1 -1
  39. data/maps/alalc-per-Arab-Latn-1997.imp +1 -1
  40. data/maps/alalc-pli-Deva-Latn-2012.imp +1 -1
  41. data/maps/alalc-pra-Deva-Latn-2012.imp +1 -1
  42. data/maps/alalc-rus-Cyrl-Latn-1997.imp +2 -2
  43. data/maps/alalc-rus-Cyrl-Latn-2012.imp +1 -1
  44. data/maps/alalc-san-Deva-Latn-2012.imp +1 -1
  45. data/maps/alalc-sin-Sinh-Latn-1997.imp +1 -1
  46. data/maps/alalc-sin-Sinh-Latn-2011.imp +1 -1
  47. data/maps/alalc-srp-Cyrl-Latn-1997.imp +2 -2
  48. data/maps/alalc-srp-Cyrl-Latn-2013.imp +1 -1
  49. data/maps/alalc-tam-Taml-Latn-1997.imp +1 -1
  50. data/maps/alalc-tam-Taml-Latn-2011.imp +1 -1
  51. data/maps/alalc-tel-Telu-Latn-1997.imp +2 -2
  52. data/maps/alalc-tel-Telu-Latn-2011.imp +1 -1
  53. data/maps/alalc-ukr-Cyrl-Latn-1997.imp +1 -1
  54. data/maps/alalc-ukr-Cyrl-Latn-2011.imp +1 -1
  55. data/maps/apcbg-bul-Cyrl-Latn-1995.imp +4 -7
  56. data/maps/az-aze-Cyrl-Latn-1939.imp +0 -1
  57. data/maps/az-aze-Cyrl-Latn-1958.imp +0 -1
  58. data/maps/bas-rus-Cyrl-Latn-2017-bss.imp +1 -1
  59. data/maps/bas-rus-Cyrl-Latn-2017-oss.imp +1 -1
  60. data/maps/bgn-jpn-Hrkt-Latn-1962.imp +5 -5
  61. data/maps/bgn-kor-Hang-Latn-1943.imp +1 -1
  62. data/maps/bgn-kor-Kore-Latn-1943.imp +1 -1
  63. data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +11 -11
  64. data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +1 -1
  65. data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +2 -2
  66. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +2 -2
  67. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.imp +1 -1
  68. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.imp +1 -4
  69. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +4 -10
  70. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +1 -1
  71. data/maps/bgnpcgn-che-Cyrl-Latn-2008.imp +1 -2
  72. data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +1 -1
  73. data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +4 -4
  74. data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +1 -1
  75. data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +1 -1
  76. data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +1 -1
  77. data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +3 -4
  78. data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +1 -1
  79. data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +1 -1
  80. data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +2 -2
  81. data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +1 -1
  82. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +1 -1
  83. data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +8 -8
  84. data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +2 -2
  85. data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +4 -4
  86. data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +3 -3
  87. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +1 -1
  88. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +5 -5
  89. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +5 -5
  90. data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +1 -1
  91. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +2 -2
  92. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +1 -1
  93. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +3 -3
  94. data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +4 -4
  95. data/maps/bgnpcgn-per-Arab-Latn-1958.imp +19 -19
  96. data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +15 -15
  97. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +15 -15
  98. data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +16 -16
  99. data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +2 -2
  100. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +5 -5
  101. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +1 -1
  102. data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +1 -1
  103. data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +3 -5
  104. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +1 -1
  105. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +1 -1
  106. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +1 -1
  107. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +1 -1
  108. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +1 -1
  109. data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +15 -15
  110. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +3 -3
  111. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +1 -1
  112. data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +1 -1
  113. data/maps/bis-asm-Beng-Latn-13194-1991.imp +1 -1
  114. data/maps/bis-ben-Beng-Latn-13194-1991.imp +1 -1
  115. data/maps/bis-dev-Deva-Latn-13194-1991.imp +1 -1
  116. data/maps/bis-guj-Gujr-Latn-13194-1991.imp +1 -1
  117. data/maps/bis-kan-Kana-Latn-13194-1991.imp +1 -1
  118. data/maps/bis-mlm-Mlym-Latn-13194-1991.imp +1 -1
  119. data/maps/bis-ori-Orya-Latn-13194-1991.imp +1 -1
  120. data/maps/bis-pnj-Guru-Latn-13194-1991.imp +1 -1
  121. data/maps/bis-tel-Telu-Latn-13194-1991.imp +1 -1
  122. data/maps/bis-tml-Taml-Latn-13194-1991.imp +1 -1
  123. data/maps/by-bel-Cyrl-Latn-2007.imp +5 -7
  124. data/maps/din-hin-Deva-Latn-33904-2018.imp +1 -1
  125. data/maps/din-kat-Geor-Latn-32707-2010.imp +12 -12
  126. data/maps/din-mar-Deva-Latn-33904-2018.imp +1 -1
  127. data/maps/din-nep-Deva-Latn-33904-2018.imp +1 -1
  128. data/maps/din-pli-Deva-Latn-33904-2018.imp +1 -1
  129. data/maps/din-pra-Deva-Latn-33904-2018.imp +1 -1
  130. data/maps/din-san-Deva-Latn-33904-2018.imp +1 -1
  131. data/maps/dos-nep-Deva-Latn-1997.imp +2 -2
  132. data/maps/elot-ell-Grek-Latn-743-1982-tl.imp +2 -1
  133. data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +1 -1
  134. data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +1 -1
  135. data/maps/elot-ell-Grek-Latn-743-2001-ts.imp +1 -1
  136. data/maps/ggg-kat-Geor-Latn-2002.imp +3 -3
  137. data/maps/gki-bel-Cyrl-Latn-2000.imp +1 -1
  138. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +1 -1
  139. data/maps/iso-ara-Arab-Latn-233-1984.imp +15 -15
  140. data/maps/iso-ara-Arab-Latn-233-2-1993.imp +1 -1
  141. data/maps/iso-asm-Beng-Latn-15919-2001.imp +1 -1
  142. data/maps/iso-ben-Beng-Latn-15919-2001.imp +1 -1
  143. data/maps/iso-ell-Grek-Latn-843-1997-t1.imp +1 -1
  144. data/maps/iso-ell-Grek-Latn-843-1997-t2.imp +1 -1
  145. data/maps/iso-guj-Gujr-Latn-15919-2001.imp +1 -1
  146. data/maps/iso-hin-Deva-Latn-15919-2001.imp +1 -1
  147. data/maps/iso-inc-Deva-Latn-15919-2001.imp +1 -1
  148. data/maps/iso-jpn-Hrkt-Latn-3602-1989.imp +1 -1
  149. data/maps/iso-kan-Kana-Latn-15919-2001.imp +1 -1
  150. data/maps/iso-kat-Geor-Latn-9984-1996.imp +12 -12
  151. data/maps/iso-kor-Hang-Latn-1996-method1.imp +1 -1
  152. data/maps/iso-kor-Hang-Latn-1996-method2.imp +1 -1
  153. data/maps/iso-mal-Mlym-Latn-15919-2001.imp +2 -2
  154. data/maps/iso-mar-Deva-Latn-15919-2001.imp +1 -1
  155. data/maps/iso-nep-Deva-Latn-15919-2001.imp +1 -1
  156. data/maps/iso-ori-Orya-Latn-15919-2001.imp +1 -1
  157. data/maps/iso-pan-Guru-Latn-15919-2001.imp +1 -1
  158. data/maps/iso-pli-Beng-Latn-15919-2001.imp +1 -1
  159. data/maps/iso-pli-Deva-Latn-15919-2001.imp +1 -1
  160. data/maps/iso-pli-Sinh-Latn-15919-2001.imp +1 -1
  161. data/maps/iso-pli-Thai-Latn-15919-2001.imp +1 -1
  162. data/maps/iso-pra-Deva-Latn-15919-2001.imp +1 -1
  163. data/maps/iso-prs-Arab-Latn-233-3-1999.imp +16 -16
  164. data/maps/iso-rus-Cyrl-Latn-9-1995.imp +1 -1
  165. data/maps/iso-san-Deva-Latn-15919-2001.imp +1 -1
  166. data/maps/iso-tam-Taml-Latn-15919-2001.imp +1 -1
  167. data/maps/iso-tel-Telu-Latn-15919-2001.imp +1 -1
  168. data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +5 -5
  169. data/maps/mext-jpn-Hrkt-Latn-1954.imp +1 -2
  170. data/maps/moct-kor-Hang-Latn-2000.imp +1 -1
  171. data/maps/mofa-jpn-Hrkt-Latn-1989.imp +1 -1
  172. data/maps/mv-div-Thaa-Latn-1987.imp +1 -1
  173. data/maps/mvd-bel-Cyrl-Latn-2008.imp +5 -5
  174. data/maps/mvd-bel-Cyrl-Latn-2010.imp +5 -2
  175. data/maps/mvd-rus-Cyrl-Latn-2008.imp +3 -4
  176. data/maps/mvd-rus-Cyrl-Latn-2010.imp +5 -2
  177. data/maps/odni-ara-Arab-Latn-2004.imp +2 -1
  178. data/maps/odni-ara-Arab-Latn-2015.imp +2 -2
  179. data/maps/odni-aze-Cyrl-Latn-2015.imp +1 -1
  180. data/maps/odni-bel-Cyrl-Latn-2015.imp +4 -2
  181. data/maps/odni-bul-Cyrl-Latn-2005.imp +2 -2
  182. data/maps/odni-bul-Cyrl-Latn-2015.imp +3 -1
  183. data/maps/odni-che-Cyrl-Latn-2015.imp +2 -1
  184. data/maps/odni-fas-Arab-Latn-2004.imp +15 -14
  185. data/maps/odni-fas-Arab-Latn-2015.imp +17 -17
  186. data/maps/odni-hin-Deva-Latn-2004.imp +21 -20
  187. data/maps/odni-hin-Deva-Latn-2015.imp +27 -26
  188. data/maps/odni-kat-Geor-Latn-2015.imp +5 -3
  189. data/maps/odni-kaz-Cyrl-Latn-2015.imp +1 -1
  190. data/maps/odni-kir-Cyrl-Latn-2015.imp +1 -1
  191. data/maps/odni-kor-Hang-Latn-2015.imp +2 -2
  192. data/maps/odni-mkd-Cyrl-Latn-2005.imp +1 -1
  193. data/maps/odni-mkd-Cyrl-Latn-2015.imp +1 -1
  194. data/maps/odni-prs-Arab-Latn-2004.imp +1 -0
  195. data/maps/odni-prs-Arab-Latn-2015.imp +2 -2
  196. data/maps/odni-pus-Arab-Latn-2011.imp +2 -1
  197. data/maps/odni-rus-Cyrl-Latn-2015.imp +3 -1
  198. data/maps/odni-srp-Cyrl-Latn-2005.imp +2 -1
  199. data/maps/odni-srp-Cyrl-Latn-2015.imp +9 -7
  200. data/maps/odni-tat-Cyrl-Latn-2015.imp +1 -1
  201. data/maps/odni-tgk-Cyrl-Latn-2015.imp +1 -1
  202. data/maps/odni-tuk-Cyrl-Latn-2015.imp +2 -1
  203. data/maps/odni-uig-Cyrl-Latn-2015.imp +1 -1
  204. data/maps/odni-ukr-Cyrl-Latn-2015.imp +4 -2
  205. data/maps/odni-urd-Arab-Latn-2015.imp +22 -21
  206. data/maps/odni-uzb-Cyrl-Latn-2015.imp +3 -1
  207. data/maps/ses-ara-Arab-Latn-1930.imp +60 -17
  208. data/maps/un-amh-Ethi-Latn-2016.imp +1 -1
  209. data/maps/un-ara-Arab-Latn-1971.imp +6 -6
  210. data/maps/un-ara-Arab-Latn-1972.imp +5 -5
  211. data/maps/un-ara-Arab-Latn-2017.imp +16 -16
  212. data/maps/un-asm-Beng-Latn-1972.imp +1 -1
  213. data/maps/un-bel-Cyrl-Latn-2007.imp +2 -2
  214. data/maps/un-ben-Beng-Latn-2016.imp +1 -1
  215. data/maps/un-ell-Grek-Latn-1987-phonetic.imp +1 -5
  216. data/maps/un-ell-Grek-Latn-1987-tl.imp +1 -1
  217. data/maps/un-ell-Grek-Latn-1987-ts.imp +2 -2
  218. data/maps/un-guj-Gujr-Latn-1972.imp +1 -1
  219. data/maps/un-hin-Deva-Latn-2016.imp +2 -2
  220. data/maps/un-kan-Kana-Latn-2016.imp +2 -2
  221. data/maps/un-mal-Mlym-Latn-1972.imp +1 -1
  222. data/maps/un-mar-Deva-Latn-2016.imp +2 -2
  223. data/maps/un-mon-Mong-Latn-general-2013.imp +1 -1
  224. data/maps/un-mon-Mong-Latn-phonetic-2013.imp +1 -1
  225. data/maps/un-nep-Deva-Latn-1972.imp +2 -2
  226. data/maps/un-nep-Deva-Latn-2013.imp +2 -2
  227. data/maps/un-ori-Orya-Latn-1972.imp +2 -2
  228. data/maps/un-pan-Guru-Latn-1972.imp +1 -1
  229. data/maps/un-prs-Arab-Latn-1967.imp +15 -15
  230. data/maps/un-rus-Cyrl-Latn-1987.imp +2 -2
  231. data/maps/un-sin-Sinh-Latn-1972.imp +4 -16
  232. data/maps/un-tam-Taml-Latn-1972.imp +1 -1
  233. data/maps/un-tel-Telu-Latn-1972.imp +1 -1
  234. data/maps/un-ukr-Cyrl-Latn-1998.imp +1 -1
  235. data/maps/un-ukr-Cyrl-Latn-2012.imp +1 -1
  236. data/maps/un-urd-Arab-Latn-1972.imp +16 -16
  237. data/maps/var-amh-Ethi-Latn-eae-2003.imp +43 -48
  238. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.imp +1 -1
  239. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.imp +1 -1
  240. data/maps/var-kor-Hang-Latn-mr-1939.imp +1 -1
  241. data/maps/var-kor-Kore-Latn-mr-1939.imp +1 -1
  242. data/maps/var-mar-Deva-Latn-hunterian-1872.imp +1 -0
  243. data/maps/var-mon-Mong-Latn-1930.imp +1 -1
  244. data/maps/var-mon-Mong-Latn-lessing.imp +2 -2
  245. data/maps/var-mon-Mong-Latn-vpmc.imp +2 -2
  246. data/maps/var-pra-Deva-Latn-iast-1912.imp +1 -1
  247. data/maps/var-san-Deva-Latn-iast-1912.imp +1 -1
  248. metadata +3 -10
  249. data/maps/alalc-tir-Ethi-Latn-1997.imp +0 -429
  250. data/maps/alalc-tir-Ethi-Latn-2011.imp +0 -85
  251. data/maps/bgnpcgn-tir-Ethi-Latn-2007.imp +0 -511
  252. data/maps/un-bul-Cyrl-Latn-1977.imp +0 -197
  253. data/maps/un-mkd-Cyrl-Latn-1977.imp +0 -119
  254. data/maps/un-srp-Cyrl-Latn-1997.imp +0 -47
  255. data/maps/var-ara-Arab-Arab-rababa.imp +0 -25
@@ -1,15 +1,58 @@
1
1
  metadata {
2
- authority_id: ses
2
+ authority_id: ungegn
3
3
  id: 1930
4
4
  language: iso-639-2:ara
5
5
  source_script: Arab
6
6
  destination_script: Latn
7
- name: Survey of Egypt Romanization
7
+ name: ROMANIZATION OF ARABIC -- UNGEGN 2017 System
8
8
  url: http://www.eki.ee/wgrs/rom1_ar.pdf
9
9
  creation_date: 1930
10
10
  confirmation_date: 2018-06
11
11
  description: |
12
- The Survey of Egypt System (SES) of Romanization.
12
+ The current United Nations recommended romanization
13
+ system was approved in 2017 (resolution XI/3), based on
14
+ the system adopted by Arabic experts at the conference
15
+ held in Beirut in 2007, the Unified Arabic
16
+ Transliteration System, taking into account the
17
+ practical amendments and corrections carried out and
18
+ agreed upon by the representatives of the Arabic-
19
+ speaking countries at the Fourth Arab Conference on
20
+ Geographical Names, held in Beirut in 2008, and some
21
+ clarifications and amendments agreed in Riyadh in 2017.
22
+ Previously, the United Nations had approved a
23
+ romanization system in 1972 (resolution II/8), based on the
24
+ system adopted by Arabic experts at the conference
25
+ held at Beirut in 1971 with the practical amendments carried out
26
+ and agreed upon by the representatives of the Arabic-speaking
27
+ countries at their conference. The table was published in volume
28
+ II of the conference report.
29
+ In UN resolution XI/3 it is specifically stated that the
30
+ system was recommended for the “romanization of the
31
+ geographical names within those Arabic-speaking countries
32
+ where this system is officially adopted”. There is
33
+ evidence of its partial implementation in Jordan, Oman and
34
+ Saudi Arabia. The UNGEGN Working Group on Romanization
35
+ Systems intends to continue monitoring the UN system’s
36
+ implementation across Arabic-speaking countries.
37
+ In some countries there exist local romanization schemes
38
+ or practices. The geographical names of Algeria, Djibouti,
39
+ Mauritania, Morocco and Tunisia are generally rendered in
40
+ the traditional manner which conforms to the principles of
41
+ the French orthography.
42
+ The previous UN-approved system is still found in
43
+ considerable international usage.
44
+ Arabic is written from right to left. The Arabic script
45
+ usually omits vowel points and diacritical marks from
46
+ writing which makes it difficult to obtain uniform results
47
+ in the romanization of Arabic. It is essential to identify
48
+ correctly the words which appear in any particular name
49
+ and to know the standard Arabic-script spelling including
50
+ the relevant vowels. One must also take into account
51
+ dialectal and idiosyncratic deviations. The romanization
52
+ is generally reversible though there may be some ambiguous
53
+ letter sequences (dh, kh, sh, th) which may also point to
54
+ combinations of Arabic characters in addition to the
55
+ respective single characters.
13
56
  notes:
14
57
  - |
15
58
  The Survey of Egypt System (SES) of romanization has the following correspondences with
@@ -86,20 +129,20 @@ stage {
86
129
 
87
130
 
88
131
  # Sun letters
89
- sub boundary + "\u0627\u0644\u062a" + maybe("\u0651"), "el-t" # الت
90
- sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), any(["el-th", "el-t"]) # الث
91
- sub boundary + "\u0627\u0644\u062f" + maybe("\u0651"), "el-d" # الد
92
- sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), any(["el-dh", "el-z"]) # الذ
93
- sub boundary + "\u0627\u0644\u0631" + maybe("\u0651"), "el-r" # الر
94
- sub boundary + "\u0627\u0644\u0632" + maybe("\u0651"), "el-z" # الز
95
- sub boundary + "\u0627\u0644\u0633" + maybe("\u0651"), any(["el-s", "el-c"]) # الس
96
- sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "el-sh" # الش
97
- sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "el-ṣ" # الص
98
- sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "el-ḍ" # الض
99
- sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "el-ṭ" # الط
100
- sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), any(["el-ẓ", "el-d"]) # الظ
101
- sub boundary + "\u0627\u0644\u0644" + maybe("\u0651"), "el-l" # الل
102
- sub boundary + "\u0627\u0644\u0646" + maybe("\u0651"), "el-n" # الن
132
+ sub boundary + "\u0627\u0644\u062a", "el-t" # الت
133
+ sub boundary + "\u0627\u0644\u062b", any(["el-th", "el-t"]) # الث
134
+ sub boundary + "\u0627\u0644\u062f", "el-d" # الد
135
+ sub boundary + "\u0627\u0644\u0630", any(["el-dh", "el-z"]) # الذ
136
+ sub boundary + "\u0627\u0644\u0631", "el-r" # الر
137
+ sub boundary + "\u0627\u0644\u0632", "el-z" # الز
138
+ sub boundary + "\u0627\u0644\u0633", any(["el-s", "el-c"]) # الس
139
+ sub boundary + "\u0627\u0644\u0634", "el-sh" # الش
140
+ sub boundary + "\u0627\u0644\u0635", "el-ṣ" # الص
141
+ sub boundary + "\u0627\u0644\u0636", "el-ḍ" # الض
142
+ sub boundary + "\u0627\u0644\u0637", "el-ṭ" # الط
143
+ sub boundary + "\u0627\u0644\u0638", any(["el-ẓ", "el-d"]) # الظ
144
+ sub boundary + "\u0627\u0644\u0644", "el-l" # الل
145
+ sub boundary + "\u0627\u0644\u0646", "el-n" # الن
103
146
 
104
147
 
105
148
  # shadda
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:amh
5
5
  source_script: Ethi
6
6
  destination_script: Latn
7
- name: Romanization of Amharic -- UNGEGN (2016)
7
+ name: ROMANIZATION OF AMHARIC -- UNGEGN 2016 System
8
8
  url: http://www.eki.ee/wgrs/rom1_am.pdf
9
9
  creation_date: 1967
10
10
  confirmation_date: 2016-03
@@ -1,10 +1,10 @@
1
1
  metadata {
2
- authority_id: un
2
+ authority_id: ungegn
3
3
  id: 1971
4
4
  language: iso-639-2:ara
5
5
  source_script: Arab
6
6
  destination_script: Latn
7
- name: Romanization of Arabic -- Beirut system (1971)
7
+ name: 1971 "Beirut system"
8
8
  url: https://unstats.un.org/unsd/geoinfo/UNGEGN/docs/2nd-uncsgn-docs/E_Conf61_4_Add1_e.pdf
9
9
  creation_date: 1971
10
10
  confirmation_date: 2018-06
@@ -85,10 +85,10 @@ stage {
85
85
  parallel {
86
86
 
87
87
  # sun letters
88
- sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), "at͟h t͟h" # الث
89
- sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), "ad͟h d͟h" # الذ
90
- sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "as͟h s͟h" # الش
91
- sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), "az͟h z͟h" # الظ
88
+ sub boundary + "\u0627\u0644\u062b", "at͟h t͟h" # الث
89
+ sub boundary + "\u0627\u0644\u0630", "ad͟h d͟h" # الذ
90
+ sub boundary + "\u0627\u0644\u0634", "as͟h s͟h" # الش
91
+ sub boundary + "\u0627\u0644\u0638", "az͟h z͟h" # الظ
92
92
 
93
93
  # shadda
94
94
  sub "\u062e\u0651", "k͟hk͟h" # خ
@@ -1,10 +1,10 @@
1
1
  metadata {
2
- authority_id: un
2
+ authority_id: ungegn
3
3
  id: 1972
4
4
  language: iso-639-2:ara
5
5
  source_script: Arab
6
6
  destination_script: Latn
7
- name: Romanization of Arabic -- UNGEGN (1972)
7
+ name: ROMANIZATION OF ARABIC -- UNGEGN 1972 System
8
8
  url: http://www.eki.ee/wgrs/obs_rom_vers/rom1_ar_v4_0.pdf
9
9
  creation_date: 1972
10
10
  confirmation_date: 2018-06
@@ -107,9 +107,9 @@ stage {
107
107
  # CHARACTERS
108
108
  parallel {
109
109
 
110
- sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "aş ş" # الص
111
- sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "aḑ ḑ" # الض
112
- sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "aţ ţ" # الط
110
+ sub boundary + "\u0627\u0644\u0635", "aş ş" # الص
111
+ sub boundary + "\u0627\u0644\u0636", "aḑ ḑ" # الض
112
+ sub boundary + "\u0627\u0644\u0637", "aţ ţ" # الط
113
113
 
114
114
  sub "\u062d\u0651", "ḩḩ" # ح
115
115
  sub "\u0635\u0651", "şş" # ص
@@ -1,10 +1,10 @@
1
1
  metadata {
2
- authority_id: un
2
+ authority_id: ungegn
3
3
  id: 2017
4
4
  language: iso-639-2:ara
5
5
  source_script: Arab
6
6
  destination_script: Latn
7
- name: Romanization of Arabic -- Unified Arabic Transliteration System (2017)
7
+ name: ROMANIZATION OF ARABIC -- UNGEGN 2017 System
8
8
  url: http://www.eki.ee/wgrs/rom1_ar.pdf
9
9
  creation_date: 2017
10
10
  confirmation_date: 2018-06
@@ -141,20 +141,20 @@ stage {
141
141
  # (B) Marks doubling of the consonant.
142
142
 
143
143
  # Sun letters
144
- sub boundary + "\u0627\u0644\u062a" + maybe("\u0651"), "at t" # الت
145
- sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), "ath th" # الث
146
- sub boundary + "\u0627\u0644\u062f" + maybe("\u0651"), "ad d" # الد
147
- sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), "adh dh" # الذ
148
- sub boundary + "\u0627\u0644\u0631" + maybe("\u0651"), "ar r" # الر
149
- sub boundary + "\u0627\u0644\u0632" + maybe("\u0651"), "az z" # الز
150
- sub boundary + "\u0627\u0644\u0633" + maybe("\u0651"), "as s" # الس
151
- sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "ash sh" # الش
152
- sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "as̱ s̱" # الص
153
- sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "aḏ ḏ" # الض
154
- sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "aṯ ṯ" # الط
155
- sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), "ad͟h d͟h" # الظ
156
- sub boundary + "\u0627\u0644\u0644" + maybe("\u0651"), "al l" # الل
157
- sub boundary + "\u0627\u0644\u0646" + maybe("\u0651"), "an n" # الن
144
+ sub boundary + "\u0627\u0644\u062a", "at t" # الت
145
+ sub boundary + "\u0627\u0644\u062b", "ath th" # الث
146
+ sub boundary + "\u0627\u0644\u062f", "ad d" # الد
147
+ sub boundary + "\u0627\u0644\u0630", "adh dh" # الذ
148
+ sub boundary + "\u0627\u0644\u0631", "ar r" # الر
149
+ sub boundary + "\u0627\u0644\u0632", "az z" # الز
150
+ sub boundary + "\u0627\u0644\u0633", "as s" # الس
151
+ sub boundary + "\u0627\u0644\u0634", "ash sh" # الش
152
+ sub boundary + "\u0627\u0644\u0635", "as̱ s̱" # الص
153
+ sub boundary + "\u0627\u0644\u0636", "aḏ ḏ" # الض
154
+ sub boundary + "\u0627\u0644\u0637", "aṯ ṯ" # الط
155
+ sub boundary + "\u0627\u0644\u0638", "ad͟h d͟h" # الظ
156
+ sub boundary + "\u0627\u0644\u0644", "al l" # الل
157
+ sub boundary + "\u0627\u0644\u0646", "an n" # الن
158
158
 
159
159
  # TODO: shorten this fragment
160
160
  # ta' marboota
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:ben
5
5
  source_script: Beng
6
6
  destination_script: Latn
7
- name: Romanization of Assamese -- UNGEGN 4.0
7
+ name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Assamese Romanization, Version 4.0
8
8
  url: https://www.eki.ee/wgrs/rom1_as.htm
9
9
  creation_date: 1972
10
10
  confirmation_date: 2016
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:bel
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: Romanization of Belarusian geographic names (2007)
7
+ name: National System of Geographic Names Transmission into Roman Alphabet in Belarus
8
8
  url: https://unstats.un.org/unsd/geoinfo/UNGEGN/docs/9th-uncsgn-docs/crp/9th_UNCSGN_e-conf-98-crp-21.pdf
9
9
  creation_date: 2007
10
10
  description: |
@@ -16,7 +16,7 @@ metadata {
16
16
  Republic of Belarus in letters of the Latin alphabet
17
17
 
18
18
  Based on the Regulation on the State Property Committee of the Republic of Belarus,
19
- approved by the Decree of the Council of Ministers of the Republic of Belarus dated July 29, 2006
19
+ approved by the Decree of the Council of Ministers of the Republic of Belarus dated July 29, 2006
20
20
  No. 958 "Issues of the State Committee on Property of the Republic of Belarus"
21
21
  }
22
22
 
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:ben
5
5
  source_script: Beng
6
6
  destination_script: Latn
7
- name: Romanization of Bengali -- UNGEGN 4.0
7
+ name: Bengali Romanization, Version 4.0
8
8
  url: http://www.eki.ee/wgrs/rom1_bn.htm
9
9
  creation_date: 2016
10
10
  description: |
@@ -4,16 +4,12 @@ metadata {
4
4
  language: iso-639-2:ell
5
5
  source_script: Grek
6
6
  destination_script: Latn
7
- name: Romanization of Greek 1.0 (Phonetic transcription)
7
+ name: UNGEGN Greek v1.0, Fifth United Nations Conference on the Standardization of Geographical Names. Writing Systems and Guides to Pronunciation Romanization > Conversion of the Greek alphabet into Latin characters. Paper submitted by Greece and Cyprus.
8
8
  url: http://www.eki.ee/wgrs/rom1_el.htm
9
9
  creation_date: 1987
10
10
  description: |
11
11
  UNGEGN Romanization table for Greek: Phonetic transcription
12
12
 
13
- UNGEGN Greek v1.0, Fifth United Nations Conference on the Standardization of
14
- Geographical Names. Writing Systems and Guides to Pronunciation Romanization
15
- > Conversion of the Greek alphabet into Latin characters. Paper submitted by
16
- Greece and Cyprus.
17
13
 
18
14
  notes:
19
15
  - Also included in ISO 843:1997, Annex B, Column 5, and ELOT 743:1982, column 5.
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:ell
5
5
  source_script: Grek
6
6
  destination_script: Latn
7
- name: Romanization of Greek -- UNGEGN 4.0 (transliteration)
7
+ name: UNGEGN Greek v4.0
8
8
  url: http://www.eki.ee/wgrs/rom1_el.htm
9
9
  creation_date: 1987
10
10
  description: |
@@ -1,10 +1,10 @@
1
1
  metadata {
2
2
  authority_id: un
3
- id: 1987-ts
3
+ id: 1987-tl
4
4
  language: iso-639-2:ell
5
5
  source_script: Grek
6
6
  destination_script: Latn
7
- name: Romanization of Greek -- UNGEGN 4.0 (transcription)
7
+ name: UNGEGN Greek v4.0
8
8
  url: http://www.eki.ee/wgrs/rom1_el.htm
9
9
  creation_date: 1987
10
10
  description: |
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:guj
5
5
  source_script: Gujr
6
6
  destination_script: Latn
7
- name: Romanization of Gujarati -- UNGEGN 4.0
7
+ name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES --Gujarati Romanization Version 4.0
8
8
  url: https://www.eki.ee/wgrs/rom1_gu.htm
9
9
  creation_date: 1972
10
10
  confirmation_date: 2016
@@ -1,10 +1,10 @@
1
1
  metadata {
2
- authority_id: un
2
+ authority_id: ungegn
3
3
  id: 2016
4
4
  language: iso-639-2:hin
5
5
  source_script: Deva
6
6
  destination_script: Latn
7
- name: Romanization of Hindi -- UNGEGN 4.0
7
+ name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Hindi Romanization, 1972
8
8
  url: https://www.eki.ee/wgrs/rom1_hi.pdf
9
9
  creation_date: 1972
10
10
  confirmation_date: 2016
@@ -1,10 +1,10 @@
1
1
  metadata {
2
- authority_id: un
2
+ authority_id: ungegn
3
3
  id: 2016
4
4
  language: iso-639-2:kan
5
5
  source_script: Kana
6
6
  destination_script: Latn
7
- name: Romanization of Kannada -- UNGEGN 4.0
7
+ name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Kannada Romanization, 1972
8
8
  url: https://www.eki.ee/wgrs/rom1_kn.pdf
9
9
  creation_date: 1972
10
10
  confirmation_date: 2016
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:mal
5
5
  source_script: Mlym
6
6
  destination_script: Latn
7
- name: Romanization of Malayalam -- UNGEGN 4.0
7
+ name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES --Malayalam Romanization Version 4.0
8
8
  url: https://www.eki.ee/wgrs/rom1_ml.htm
9
9
  creation_date: 1972
10
10
  confirmation_date: 2016
@@ -1,10 +1,10 @@
1
1
  metadata {
2
- authority_id: un
2
+ authority_id: ungegn
3
3
  id: 2016
4
4
  language: iso-639-2:hin
5
5
  source_script: Deva
6
6
  destination_script: Latn
7
- name: Romanization of Marathi -- UNGEGN 4.0
7
+ name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Marathi Romanization, 1972
8
8
  url: https://www.eki.ee/wgrs/rom1_mr.pdf
9
9
  creation_date: 1972
10
10
  confirmation_date: 2016
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:mon
5
5
  source_script: Mong
6
6
  destination_script: Latn
7
- name: Romanization of Mongolian in China -- UNGEGN 4.0
7
+ name: Mongolian Romanization in China, Version 4.0 (general)
8
8
  url: http://www.eki.ee/wgrs/rom1_mnc.htm
9
9
  creation_date: 2013-09
10
10
  description: |
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:mon
5
5
  source_script: Mong
6
6
  destination_script: Latn
7
- name: Romanization of Mongolian in China -- UNGEGN 4.0 (phonetic)
7
+ name: Mongolian Romanization in China, Version 4.0 (phonetic)
8
8
  url: http://www.eki.ee/wgrs/rom1_mnc.htm
9
9
  creation_date: 2013-09
10
10
  description: |
@@ -1,10 +1,10 @@
1
1
  metadata {
2
- authority_id: un
2
+ authority_id: ungegn
3
3
  id: 1972
4
4
  language: iso-639-2:nep
5
5
  source_script: Deva
6
6
  destination_script: Latn
7
- name: Romanization of Nepali (1972)
7
+ name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Nepali Romanization, 1972
8
8
  url: https://www.eki.ee/wgrs/v3_0/rom1_ne.pdf
9
9
  creation_date: 1972
10
10
  confirmation_date: 2010
@@ -1,10 +1,10 @@
1
1
  metadata {
2
- authority_id: un
2
+ authority_id: ungegn
3
3
  id: 2013
4
4
  language: iso-639-2:nep
5
5
  source_script: Deva
6
6
  destination_script: Latn
7
- name: Romanization of Nepali (2013)
7
+ name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Nepali Romanization, 1972
8
8
  url: https://www.eki.ee/wgrs/v3_0/rom1_ne.pdf
9
9
  creation_date: 1972
10
10
  confirmation_date: 2013
@@ -1,10 +1,10 @@
1
1
  metadata {
2
- authority_id: un
2
+ authority_id: ungegn
3
3
  id: 1972
4
4
  language: iso-639-2:ori
5
5
  source_script: Orya
6
6
  destination_script: Latn
7
- name: Romanization of Oriya (1972)
7
+ name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Oriya Romanization, 1972
8
8
  url: http://www.eki.ee/wgrs/v2_2/rom1_or.pdf
9
9
  creation_date: 1972
10
10
  confirmation_date: 2003
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:pan
5
5
  source_script: Guru
6
6
  destination_script: Latn
7
- name: Romanization of Panjabi -- UNGEGN 4.0 (1972)
7
+ name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES --Panjabi Romanization Version 4.0
8
8
  url: https://www.eki.ee/wgrs/rom1_pa.htm
9
9
  creation_date: 1972
10
10
  confirmation_date: 2016
@@ -5,7 +5,7 @@ metadata {
5
5
  # prs stands for Dari (https://iso639-3.sil.org/code/prs&_ga=GA1.2.2054538372.1574092823)
6
6
  source_script: Arab
7
7
  destination_script: Latn
8
- name: Romanization of Persian (1967)
8
+ name: Persian UN 1967
9
9
  url: http://www.eki.ee/wgrs/v2_2/rom1_fa.htm
10
10
  creation_date: 1967
11
11
  confirmation_date: 01-2003
@@ -130,20 +130,20 @@ stage {
130
130
 
131
131
  # NOTE 1
132
132
  # Sun letters
133
- sub boundary + "\u0627\u0644\u062a" + maybe("\u0651"), "ot t" # الت
134
- sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), "os̄ s̄" # الث
135
- sub boundary + "\u0627\u0644\u062f" + maybe("\u0651"), "od d" # الد
136
- sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), "oz̄ z̄" # الذ
137
- sub boundary + "\u0627\u0644\u0631" + maybe("\u0651"), "or r" # الر
138
- sub boundary + "\u0627\u0644\u0632" + maybe("\u0651"), "oz z" # الز
139
- sub boundary + "\u0627\u0644\u0633" + maybe("\u0651"), "os s" # الس
140
- sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "osh sh" # الش
141
- sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "oş ş" # الص
142
- sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "oẕ ẕ" # الض
143
- sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "oţ ţ" # الط
144
- sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), "oz̧ z̧" # الظ
145
- sub boundary + "\u0627\u0644\u0644" + maybe("\u0651"), "ol l" # الل
146
- sub boundary + "\u0627\u0644\u0646" + maybe("\u0651"), "on n" # الن
133
+ sub boundary + "\u0627\u0644\u062a", "ot t" # الت
134
+ sub boundary + "\u0627\u0644\u062b", "os̄ s̄" # الث
135
+ sub boundary + "\u0627\u0644\u062f", "od d" # الد
136
+ sub boundary + "\u0627\u0644\u0630", "oz̄ z̄" # الذ
137
+ sub boundary + "\u0627\u0644\u0631", "or r" # الر
138
+ sub boundary + "\u0627\u0644\u0632", "oz z" # الز
139
+ sub boundary + "\u0627\u0644\u0633", "os s" # الس
140
+ sub boundary + "\u0627\u0644\u0634", "osh sh" # الش
141
+ sub boundary + "\u0627\u0644\u0635", "oş ş" # الص
142
+ sub boundary + "\u0627\u0644\u0636", "oẕ ẕ" # الض
143
+ sub boundary + "\u0627\u0644\u0637", "oţ ţ" # الط
144
+ sub boundary + "\u0627\u0644\u0638", "oz̧ z̧" # الظ
145
+ sub boundary + "\u0627\u0644\u0644", "ol l" # الل
146
+ sub boundary + "\u0627\u0644\u0646", "on n" # الن
147
147
 
148
148
  sub "\u0650\u064a\u0651", "īy" # ـِيَّ
149
149
  sub "\u0650\u064a", "iy", after: any("\u064e\u064f") # ـِي kasra followed by ي
@@ -1,10 +1,10 @@
1
1
  metadata {
2
- authority_id: un
2
+ authority_id: ungegn
3
3
  id: 1987
4
4
  language: iso-639-2:rus
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: Romanization of Russian (1987)
7
+ name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Russian Romanization system
8
8
  url: http://www.eki.ee/wgrs/rom1_ru.htm
9
9
  creation_date: 1987
10
10
  confirmation_date: 2016
@@ -4,8 +4,7 @@ metadata {
4
4
  language: iso-639-2:sin
5
5
  source_script: Sinh
6
6
  destination_script: Latn
7
- name: Romanization of Sinhalese -- UNGEGN 4.0 (1972)
8
- source: "Second United Nations Conference on the Standardization of Geographical Names. London, 10–31 May 1972. Vol. II. Technical papers, pp. 151–152."
7
+ name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES --Sinhalese Romanization Version 4.0
9
8
  url: https://www.eki.ee/wgrs/rom1_ml.htm
10
9
  creation_date: 1972
11
10
  confirmation_date: 2016
@@ -19,6 +18,7 @@ metadata {
19
18
  Vowels and diphthongs are marked in two ways: as independent characters (used syllable-initially) and in an
20
19
  abbreviated form, to denote vowels after consonants.
21
20
 
21
+
22
22
  notes:
23
23
  - |
24
24
  The character ඇ was romanized as a͝i and the character ඈ as ai in Sharma's table, but there was no romanization for the character ඓ which,
@@ -37,13 +37,13 @@ metadata {
37
37
 
38
38
  tests {
39
39
  test "ශී‍්‍ර ලංකාවේ කී‍්‍රඩාව ඉතිහාසයේ ඉහළම තැනකට ගේන්න කටයුතු කරනවා", "shīra laṁkāve kīraḍāva itihāsaye ihaḷama tæ̆nakaṭa genna kaṭayutu karanavā"
40
- test "කොච්චිකඬේ මෝයකට අසල නෑමට ගිය තරුණයෝ ෩ක් මරුට - මිතුරාගේ උපන් දිනය සැමරීමට ඇවිත්", "kŏchchikaṇḍae moyakaṭa asala næmaṭa giya taruṇayo 3k maruṭa - miturāge upan dinaya sæ̆marīmaṭa æ̆vit"
40
+ test "කොච්චිකඬේ මෝයකට අසල නෑමට ගිය තරුණයෝ ෩ක් මරුට - මිතුරාගේ උපන් දිනය සැමරීමට ඇවිත්", "kŏchchikaඬe moyakaṭa asala næmaṭa giya taruṇayo 3k maruṭa - miturāge upan dinaya sæ̆marīmaṭa æ̆vit"
41
41
  test "ලෝක ළමා දිනයදා සිසුන් පිරිසක් කසිප්පු බීලා", "loka ḷamā dinayadā sisun pirisak kasippu bīlā"
42
42
  test "කෝටි 16ක හෙරොයින් සමග දන්කොටුවේදී 7ක් දැලේ", "koṭi 16ka hĕrŏyin samaga dankŏṭuvedī 7k dæ̆le"
43
43
  test "මිනුවන්ගොඩ පීසීආර් දෙදහසක් සිදුකරයි", "minuvangŏḍa pīsīār dĕdahasak sidukarayi"
44
44
  test "පාස්කු ප‍්‍රහාරය වගේම පාස්කු ප්‍රෝඩාව ගැනත් සොයන්න කොමිසමක් පත්කළ යුතුයි - විපක්‍ෂ නායක සජිත් පේ‍්‍රමදාස", "pāsku parahāraya vagema pāsku proḍāva gæ̆nat sŏyanna kŏmisamak patkaḷa yutuyi - vipakṣha nāyaka sajit peramadāsa"
45
45
  test "ට‍්‍රම්ප්ගේ සෞඛ්‍යය තීරණාත්මකයි - ට්විටර් හරහා ජනතාව අමතයි", "ṭarampge saukhyaya tīraṇātmakayi - ṭviṭar harahā janatāva amatayi"
46
- test "පාස්කු දා ප‍්‍රහාරය පිළිබඳ පරීක්‍ෂණවලින් කිසිවකුට අසාධාරණයක් වීමට ඉඩ දෙන්නේ නෑ - අගමැති", "pāsku dā parahāraya piḷibanda parīkṣhaṇavalin kisivakuṭa asādhāraṇayak vīmaṭa iḍa dĕnne næ - agamæ̆ti"
46
+ test "පාස්කු දා ප‍්‍රහාරය පිළිබඳ පරීක්‍ෂණවලින් කිසිවකුට අසාධාරණයක් වීමට ඉඩ දෙන්නේ නෑ - අගමැති", "pāsku dā parahāraya piḷibaඳ parīkṣhaṇavalin kisivakuṭa asādhāraṇayak vīmaṭa iḍa dĕnne næ - agamæ̆ti"
47
47
  test "දිල්ලි කැපිටල්ස් සහ කෝලිගේ බැංගලෝර් තෙවැනි ජය ලබයි", "dilli kæ̆piṭals saha kolige bæ̆ṁgalor tĕvæ̆ni jaya labayi"
48
48
  test "ශ‍්‍රී ලාංකික සම්භවයක් සහිත ප‍්‍රංශයේ පවුලක 5 ක් ඝාතනය කරලා", "sharī lāṁkika sambhavayak sahita paraṁshaye pavulaka 5 k ghātanaya karalā"
49
49
  test "පැතිකුදය ඉක්මනින් සුව කරන ප‍්‍රතිකාර", "pæ̆tikudaya ikmanin suva karana paratikāra"
@@ -171,18 +171,6 @@ stage {
171
171
  sub "ෆ", "fa"
172
172
  sub "ළ", "ḷa"
173
173
 
174
- # Prenasalized sounds
175
- sub "ඟ", "ṅga"
176
- sub "ඦ", "ñja"
177
- sub "ඬ", "ṇḍa"
178
- sub "ඳ", "nda"
179
- sub "ඹ", "mba"
180
-
181
- # Other ligatures
182
- sub "ක්‍ෂ", "kṣha"
183
- sub "ඥ", "jña"
184
- sub "න්‍ද", "nda"
185
-
186
174
  # numbers
187
175
  sub "\u0DE6", "0"
188
176
  sub "\u0DE7", "1"
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:tam
5
5
  source_script: Gujr
6
6
  destination_script: Taml
7
- name: Romanization of Tamil -- UNGEGN 4.0 (1972)
7
+ name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES --Tamil Romanization Version 4.0
8
8
  url: https://www.eki.ee/wgrs/rom1_ta.htm
9
9
  creation_date: 1972
10
10
  confirmation_date: 2016
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:tel
5
5
  source_script: Telu
6
6
  destination_script: Latn
7
- name: Romanization of Telugu -- UNGEGN 4.0 (1972)
7
+ name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Telugu Romanization, 1972
8
8
  url: https://www.eki.ee/wgrs/rom1_te.htm
9
9
  creation_date: 1972
10
10
  confirmation_date: 2016
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:ukr
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: Romanization of Belarusian, Russian And Ukrainian Cyrillic (1998)
7
+ name: ROMANIZATION SYSTEM FOR BELARUSIAN, RUSSIAN AND UKRAINIAN CYRILLIC
8
8
  url: https://unstats.un.org/unsd/geoinfo/UNGEGN/docs/7th-uncsgn-docs/econf/7th_UNCSGN_econf.91_3_Add1.pdf
9
9
  # page 320
10
10
  creation_date: 1998
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:ukr
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: Romanization of Belarusian, Russian And Ukrainian Cyrillic (2012)
7
+ name: ROMANIZATION SYSTEM FOR BELARUSIAN, RUSSIAN AND UKRAINIAN CYRILLIC
8
8
  url: http://www.eki.ee/wgrs/rom1_uk.htm
9
9
  creation_date: 2010
10
10
  }