interscript-maps 2.1.0 → 2.3.1

Sign up to get free protection for your applications and to get access to all the features.
Files changed (258) hide show
  1. checksums.yaml +4 -4
  2. data/interscript-maps.gemspec +1 -1
  3. data/interscript-maps.yaml +330 -111
  4. data/maps/acadsin-zho-Hani-Latn-2002.imp +2 -2
  5. data/maps/alalc-amh-Ethi-Latn-1997.imp +18 -14
  6. data/maps/alalc-amh-Ethi-Latn-2011.imp +1 -1
  7. data/maps/alalc-ara-Arab-Latn-1997.imp +1 -1
  8. data/maps/alalc-asm-Deva-Latn-1997.imp +1 -1
  9. data/maps/alalc-asm-Deva-Latn-2012.imp +1 -1
  10. data/maps/alalc-aze-Arab-Latn-1997.imp +1 -1
  11. data/maps/alalc-aze-Cyrl-Latn-1997.imp +1 -1
  12. data/maps/alalc-bel-Cyrl-Latn-1997.imp +4 -4
  13. data/maps/alalc-ben-Beng-Latn-1997.imp +1 -1
  14. data/maps/alalc-ben-Beng-Latn-2017.imp +1 -1
  15. data/maps/alalc-bul-Cyrl-Latn-1997.imp +1 -1
  16. data/maps/alalc-div-Thaa-Latn-1997.imp +1 -1
  17. data/maps/alalc-div-Thaa-Latn-2012.imp +74 -0
  18. data/maps/alalc-ell-Grek-Latn-1997.imp +1 -1
  19. data/maps/alalc-ell-Grek-Latn-2010.imp +1 -1
  20. data/maps/alalc-guj-Gujr-Latn-1997.imp +1 -1
  21. data/maps/alalc-guj-Gujr-Latn-2011.imp +1 -1
  22. data/maps/alalc-hin-Deva-Latn-1997.imp +1 -1
  23. data/maps/alalc-hin-Deva-Latn-2011.imp +1 -1
  24. data/maps/alalc-kan-Kana-Latn-1997.imp +1 -1
  25. data/maps/alalc-kan-Kana-Latn-2011.imp +1 -1
  26. data/maps/alalc-kat-Geok-Latn-1997.imp +3 -4
  27. data/maps/alalc-kat-Geok-Latn-2011.imp +31 -0
  28. data/maps/alalc-kat-Geor-Latn-1997.imp +12 -13
  29. data/maps/alalc-kat-Geor-Latn-2011.imp +52 -0
  30. data/maps/alalc-kor-Hang-Latn-1997.imp +1 -1
  31. data/maps/alalc-mal-Mlym-Latn-1997.imp +1 -1
  32. data/maps/alalc-mal-Mlym-Latn-2012.imp +1 -1
  33. data/maps/alalc-mar-Deva-Latn-1997.imp +1 -1
  34. data/maps/alalc-mar-Deva-Latn-2011.imp +1 -1
  35. data/maps/alalc-mkd-Cyrl-Latn-1997.imp +2 -2
  36. data/maps/alalc-mkd-Cyrl-Latn-2013.imp +2 -2
  37. data/maps/alalc-mon-Cyrl-Latn-1997.imp +3 -3
  38. data/maps/alalc-ori-Orya-Latn-1997.imp +1 -1
  39. data/maps/alalc-ori-Orya-Latn-2011.imp +1 -1
  40. data/maps/alalc-pan-Guru-Latn-1997.imp +1 -1
  41. data/maps/alalc-pan-Guru-Latn-2011.imp +1 -1
  42. data/maps/alalc-per-Arab-Latn-1997.imp +1 -1
  43. data/maps/alalc-pli-Deva-Latn-2012.imp +1 -1
  44. data/maps/alalc-pra-Deva-Latn-2012.imp +1 -1
  45. data/maps/alalc-rus-Cyrl-Latn-1997.imp +2 -2
  46. data/maps/alalc-rus-Cyrl-Latn-2012.imp +1 -1
  47. data/maps/alalc-san-Deva-Latn-2012.imp +1 -1
  48. data/maps/alalc-sin-Sinh-Latn-1997.imp +1 -1
  49. data/maps/alalc-sin-Sinh-Latn-2011.imp +1 -1
  50. data/maps/alalc-srp-Cyrl-Latn-1997.imp +2 -2
  51. data/maps/alalc-srp-Cyrl-Latn-2013.imp +1 -1
  52. data/maps/alalc-tam-Taml-Latn-1997.imp +1 -1
  53. data/maps/alalc-tam-Taml-Latn-2011.imp +1 -1
  54. data/maps/alalc-tel-Telu-Latn-1997.imp +2 -2
  55. data/maps/alalc-tel-Telu-Latn-2011.imp +1 -1
  56. data/maps/alalc-tir-Ethi-Latn-1997.imp +429 -0
  57. data/maps/alalc-tir-Ethi-Latn-2011.imp +85 -0
  58. data/maps/alalc-ukr-Cyrl-Latn-1997.imp +1 -1
  59. data/maps/alalc-ukr-Cyrl-Latn-2011.imp +1 -1
  60. data/maps/apcbg-bul-Cyrl-Latn-1995.imp +7 -4
  61. data/maps/az-aze-Cyrl-Latn-1939.imp +1 -0
  62. data/maps/az-aze-Cyrl-Latn-1958.imp +1 -0
  63. data/maps/bas-rus-Cyrl-Latn-2017-bss.imp +1 -1
  64. data/maps/bas-rus-Cyrl-Latn-2017-oss.imp +1 -1
  65. data/maps/bgn-jpn-Hrkt-Latn-1962.imp +5 -5
  66. data/maps/bgn-kor-Hang-Latn-1943.imp +1 -1
  67. data/maps/bgn-kor-Kore-Latn-1943.imp +1 -1
  68. data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +11 -11
  69. data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +1 -1
  70. data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +2 -2
  71. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +2 -2
  72. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.imp +1 -1
  73. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.imp +4 -1
  74. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +10 -4
  75. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +1 -1
  76. data/maps/bgnpcgn-che-Cyrl-Latn-2008.imp +2 -1
  77. data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +1 -1
  78. data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +4 -4
  79. data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +1 -1
  80. data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +1 -1
  81. data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +1 -1
  82. data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +4 -3
  83. data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +1 -1
  84. data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +1 -1
  85. data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +2 -2
  86. data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +1 -1
  87. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +1 -1
  88. data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +8 -8
  89. data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +2 -2
  90. data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +4 -4
  91. data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +3 -3
  92. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +1 -1
  93. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +5 -5
  94. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +5 -5
  95. data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +1 -1
  96. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +2 -2
  97. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +1 -1
  98. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +3 -3
  99. data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +4 -4
  100. data/maps/bgnpcgn-per-Arab-Latn-1958.imp +19 -19
  101. data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +15 -15
  102. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +15 -15
  103. data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +16 -16
  104. data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +2 -2
  105. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +5 -5
  106. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +1 -1
  107. data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +1 -1
  108. data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +5 -3
  109. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +1 -1
  110. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +1 -1
  111. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +1 -1
  112. data/maps/bgnpcgn-tir-Ethi-Latn-2007.imp +511 -0
  113. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +1 -1
  114. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +1 -1
  115. data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +15 -15
  116. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +3 -3
  117. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +1 -1
  118. data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +1 -1
  119. data/maps/bis-asm-Beng-Latn-13194-1991.imp +1 -1
  120. data/maps/bis-ben-Beng-Latn-13194-1991.imp +1 -1
  121. data/maps/bis-dev-Deva-Latn-13194-1991.imp +1 -1
  122. data/maps/bis-guj-Gujr-Latn-13194-1991.imp +1 -1
  123. data/maps/bis-kan-Kana-Latn-13194-1991.imp +1 -1
  124. data/maps/bis-mlm-Mlym-Latn-13194-1991.imp +1 -1
  125. data/maps/bis-ori-Orya-Latn-13194-1991.imp +1 -1
  126. data/maps/bis-pnj-Guru-Latn-13194-1991.imp +1 -1
  127. data/maps/bis-tel-Telu-Latn-13194-1991.imp +1 -1
  128. data/maps/bis-tml-Taml-Latn-13194-1991.imp +1 -1
  129. data/maps/by-bel-Cyrl-Latn-2007.imp +7 -5
  130. data/maps/din-hin-Deva-Latn-33904-2018.imp +1 -1
  131. data/maps/din-kat-Geor-Latn-32707-2010.imp +12 -12
  132. data/maps/din-mar-Deva-Latn-33904-2018.imp +1 -1
  133. data/maps/din-nep-Deva-Latn-33904-2018.imp +1 -1
  134. data/maps/din-pli-Deva-Latn-33904-2018.imp +1 -1
  135. data/maps/din-pra-Deva-Latn-33904-2018.imp +1 -1
  136. data/maps/din-san-Deva-Latn-33904-2018.imp +1 -1
  137. data/maps/dos-nep-Deva-Latn-1997.imp +2 -2
  138. data/maps/elot-ell-Grek-Latn-743-1982-tl.imp +1 -2
  139. data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +1 -1
  140. data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +1 -1
  141. data/maps/elot-ell-Grek-Latn-743-2001-ts.imp +1 -1
  142. data/maps/ggg-kat-Geor-Latn-2002.imp +3 -3
  143. data/maps/gki-bel-Cyrl-Latn-2000.imp +1 -1
  144. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +1 -1
  145. data/maps/iso-ara-Arab-Latn-233-1984.imp +15 -15
  146. data/maps/iso-ara-Arab-Latn-233-2-1993.imp +1 -1
  147. data/maps/iso-asm-Beng-Latn-15919-2001.imp +1 -1
  148. data/maps/iso-ben-Beng-Latn-15919-2001.imp +1 -1
  149. data/maps/iso-ell-Grek-Latn-843-1997-t1.imp +1 -1
  150. data/maps/iso-ell-Grek-Latn-843-1997-t2.imp +1 -1
  151. data/maps/iso-guj-Gujr-Latn-15919-2001.imp +1 -1
  152. data/maps/iso-hin-Deva-Latn-15919-2001.imp +1 -1
  153. data/maps/iso-inc-Deva-Latn-15919-2001.imp +1 -1
  154. data/maps/iso-jpn-Hrkt-Latn-3602-1989.imp +1 -1
  155. data/maps/iso-kan-Kana-Latn-15919-2001.imp +1 -1
  156. data/maps/iso-kat-Geor-Latn-9984-1996.imp +12 -12
  157. data/maps/iso-kor-Hang-Latn-1996-method1.imp +1 -1
  158. data/maps/iso-kor-Hang-Latn-1996-method2.imp +1 -1
  159. data/maps/iso-mal-Mlym-Latn-15919-2001.imp +2 -2
  160. data/maps/iso-mar-Deva-Latn-15919-2001.imp +1 -1
  161. data/maps/iso-nep-Deva-Latn-15919-2001.imp +1 -1
  162. data/maps/iso-ori-Orya-Latn-15919-2001.imp +1 -1
  163. data/maps/iso-pan-Guru-Latn-15919-2001.imp +1 -1
  164. data/maps/iso-pli-Beng-Latn-15919-2001.imp +1 -1
  165. data/maps/iso-pli-Deva-Latn-15919-2001.imp +1 -1
  166. data/maps/iso-pli-Sinh-Latn-15919-2001.imp +1 -1
  167. data/maps/iso-pli-Thai-Latn-15919-2001.imp +1 -1
  168. data/maps/iso-pra-Deva-Latn-15919-2001.imp +1 -1
  169. data/maps/iso-prs-Arab-Latn-233-3-1999.imp +16 -16
  170. data/maps/iso-rus-Cyrl-Latn-9-1995.imp +1 -1
  171. data/maps/iso-san-Deva-Latn-15919-2001.imp +1 -1
  172. data/maps/iso-tam-Taml-Latn-15919-2001.imp +1 -1
  173. data/maps/iso-tel-Telu-Latn-15919-2001.imp +1 -1
  174. data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +5 -5
  175. data/maps/mext-jpn-Hrkt-Latn-1954.imp +2 -1
  176. data/maps/moct-kor-Hang-Latn-2000.imp +1 -1
  177. data/maps/mofa-jpn-Hrkt-Latn-1989.imp +1 -1
  178. data/maps/mv-div-Thaa-Latn-1987.imp +1 -1
  179. data/maps/mvd-bel-Cyrl-Latn-2008.imp +5 -5
  180. data/maps/mvd-bel-Cyrl-Latn-2010.imp +2 -5
  181. data/maps/mvd-rus-Cyrl-Latn-2008.imp +4 -3
  182. data/maps/mvd-rus-Cyrl-Latn-2010.imp +2 -5
  183. data/maps/odni-ara-Arab-Latn-2004.imp +1 -2
  184. data/maps/odni-ara-Arab-Latn-2015.imp +2 -2
  185. data/maps/odni-aze-Cyrl-Latn-2015.imp +1 -1
  186. data/maps/odni-bel-Cyrl-Latn-2015.imp +2 -4
  187. data/maps/odni-bul-Cyrl-Latn-2005.imp +2 -2
  188. data/maps/odni-bul-Cyrl-Latn-2015.imp +1 -3
  189. data/maps/odni-che-Cyrl-Latn-2015.imp +1 -2
  190. data/maps/odni-fas-Arab-Latn-2004.imp +14 -15
  191. data/maps/odni-fas-Arab-Latn-2015.imp +17 -17
  192. data/maps/odni-hin-Deva-Latn-2004.imp +20 -21
  193. data/maps/odni-hin-Deva-Latn-2015.imp +26 -27
  194. data/maps/odni-kat-Geor-Latn-2015.imp +3 -5
  195. data/maps/odni-kaz-Cyrl-Latn-2015.imp +1 -1
  196. data/maps/odni-kir-Cyrl-Latn-2015.imp +1 -1
  197. data/maps/odni-kor-Hang-Latn-2015.imp +2 -2
  198. data/maps/odni-mkd-Cyrl-Latn-2005.imp +1 -1
  199. data/maps/odni-mkd-Cyrl-Latn-2015.imp +1 -1
  200. data/maps/odni-prs-Arab-Latn-2004.imp +0 -1
  201. data/maps/odni-prs-Arab-Latn-2015.imp +2 -2
  202. data/maps/odni-pus-Arab-Latn-2011.imp +1 -2
  203. data/maps/odni-rus-Cyrl-Latn-2015.imp +1 -3
  204. data/maps/odni-srp-Cyrl-Latn-2005.imp +1 -2
  205. data/maps/odni-srp-Cyrl-Latn-2015.imp +7 -9
  206. data/maps/odni-tat-Cyrl-Latn-2015.imp +1 -1
  207. data/maps/odni-tgk-Cyrl-Latn-2015.imp +1 -1
  208. data/maps/odni-tuk-Cyrl-Latn-2015.imp +1 -2
  209. data/maps/odni-uig-Cyrl-Latn-2015.imp +1 -1
  210. data/maps/odni-ukr-Cyrl-Latn-2015.imp +2 -4
  211. data/maps/odni-urd-Arab-Latn-2015.imp +21 -22
  212. data/maps/odni-uzb-Cyrl-Latn-2015.imp +1 -3
  213. data/maps/ses-ara-Arab-Latn-1930.imp +17 -60
  214. data/maps/un-amh-Ethi-Latn-2016.imp +1 -1
  215. data/maps/un-ara-Arab-Latn-1971.imp +6 -6
  216. data/maps/un-ara-Arab-Latn-1972.imp +5 -5
  217. data/maps/un-ara-Arab-Latn-2017.imp +16 -16
  218. data/maps/un-asm-Beng-Latn-1972.imp +1 -1
  219. data/maps/un-bel-Cyrl-Latn-2007.imp +2 -2
  220. data/maps/un-ben-Beng-Latn-2016.imp +1 -1
  221. data/maps/un-bul-Cyrl-Latn-1977.imp +197 -0
  222. data/maps/un-ell-Grek-Latn-1987-phonetic.imp +5 -1
  223. data/maps/un-ell-Grek-Latn-1987-tl.imp +1 -1
  224. data/maps/un-ell-Grek-Latn-1987-ts.imp +2 -2
  225. data/maps/un-guj-Gujr-Latn-1972.imp +1 -1
  226. data/maps/un-hin-Deva-Latn-2016.imp +2 -2
  227. data/maps/un-kan-Kana-Latn-2016.imp +2 -2
  228. data/maps/un-mal-Mlym-Latn-1972.imp +1 -1
  229. data/maps/un-mar-Deva-Latn-2016.imp +2 -2
  230. data/maps/un-mkd-Cyrl-Latn-1977.imp +119 -0
  231. data/maps/un-mon-Mong-Latn-general-2013.imp +1 -1
  232. data/maps/un-mon-Mong-Latn-phonetic-2013.imp +1 -1
  233. data/maps/un-nep-Deva-Latn-1972.imp +2 -2
  234. data/maps/un-nep-Deva-Latn-2013.imp +2 -2
  235. data/maps/un-ori-Orya-Latn-1972.imp +2 -2
  236. data/maps/un-pan-Guru-Latn-1972.imp +1 -1
  237. data/maps/un-prs-Arab-Latn-1967.imp +15 -15
  238. data/maps/un-rus-Cyrl-Latn-1987.imp +2 -2
  239. data/maps/un-sin-Sinh-Latn-1972.imp +16 -4
  240. data/maps/un-srp-Cyrl-Latn-1997.imp +47 -0
  241. data/maps/un-tam-Taml-Latn-1972.imp +1 -1
  242. data/maps/un-tel-Telu-Latn-1972.imp +1 -1
  243. data/maps/un-ukr-Cyrl-Latn-1998.imp +1 -1
  244. data/maps/un-ukr-Cyrl-Latn-2012.imp +1 -1
  245. data/maps/un-urd-Arab-Latn-1972.imp +16 -16
  246. data/maps/var-amh-Ethi-Latn-eae-2003.imp +48 -43
  247. data/maps/var-ara-Arab-Arab-rababa.imp +25 -0
  248. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.imp +1 -1
  249. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.imp +1 -1
  250. data/maps/var-kor-Hang-Latn-mr-1939.imp +1 -1
  251. data/maps/var-kor-Kore-Latn-mr-1939.imp +1 -1
  252. data/maps/var-mar-Deva-Latn-hunterian-1872.imp +0 -1
  253. data/maps/var-mon-Mong-Latn-1930.imp +1 -1
  254. data/maps/var-mon-Mong-Latn-lessing.imp +2 -2
  255. data/maps/var-mon-Mong-Latn-vpmc.imp +2 -2
  256. data/maps/var-pra-Deva-Latn-iast-1912.imp +1 -1
  257. data/maps/var-san-Deva-Latn-iast-1912.imp +1 -1
  258. metadata +11 -1
@@ -4,12 +4,16 @@ metadata {
4
4
  language: iso-639-2:ell
5
5
  source_script: Grek
6
6
  destination_script: Latn
7
- name: UNGEGN Greek v1.0, Fifth United Nations Conference on the Standardization of Geographical Names. Writing Systems and Guides to Pronunciation Romanization > Conversion of the Greek alphabet into Latin characters. Paper submitted by Greece and Cyprus.
7
+ name: Romanization of Greek 1.0 (Phonetic transcription)
8
8
  url: http://www.eki.ee/wgrs/rom1_el.htm
9
9
  creation_date: 1987
10
10
  description: |
11
11
  UNGEGN Romanization table for Greek: Phonetic transcription
12
12
 
13
+ UNGEGN Greek v1.0, Fifth United Nations Conference on the Standardization of
14
+ Geographical Names. Writing Systems and Guides to Pronunciation Romanization
15
+ > Conversion of the Greek alphabet into Latin characters. Paper submitted by
16
+ Greece and Cyprus.
13
17
 
14
18
  notes:
15
19
  - Also included in ISO 843:1997, Annex B, Column 5, and ELOT 743:1982, column 5.
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:ell
5
5
  source_script: Grek
6
6
  destination_script: Latn
7
- name: UNGEGN Greek v4.0
7
+ name: Romanization of Greek -- UNGEGN 4.0 (transliteration)
8
8
  url: http://www.eki.ee/wgrs/rom1_el.htm
9
9
  creation_date: 1987
10
10
  description: |
@@ -1,10 +1,10 @@
1
1
  metadata {
2
2
  authority_id: un
3
- id: 1987-tl
3
+ id: 1987-ts
4
4
  language: iso-639-2:ell
5
5
  source_script: Grek
6
6
  destination_script: Latn
7
- name: UNGEGN Greek v4.0
7
+ name: Romanization of Greek -- UNGEGN 4.0 (transcription)
8
8
  url: http://www.eki.ee/wgrs/rom1_el.htm
9
9
  creation_date: 1987
10
10
  description: |
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:guj
5
5
  source_script: Gujr
6
6
  destination_script: Latn
7
- name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES --Gujarati Romanization Version 4.0
7
+ name: Romanization of Gujarati -- UNGEGN 4.0
8
8
  url: https://www.eki.ee/wgrs/rom1_gu.htm
9
9
  creation_date: 1972
10
10
  confirmation_date: 2016
@@ -1,10 +1,10 @@
1
1
  metadata {
2
- authority_id: ungegn
2
+ authority_id: un
3
3
  id: 2016
4
4
  language: iso-639-2:hin
5
5
  source_script: Deva
6
6
  destination_script: Latn
7
- name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Hindi Romanization, 1972
7
+ name: Romanization of Hindi -- UNGEGN 4.0
8
8
  url: https://www.eki.ee/wgrs/rom1_hi.pdf
9
9
  creation_date: 1972
10
10
  confirmation_date: 2016
@@ -1,10 +1,10 @@
1
1
  metadata {
2
- authority_id: ungegn
2
+ authority_id: un
3
3
  id: 2016
4
4
  language: iso-639-2:kan
5
5
  source_script: Kana
6
6
  destination_script: Latn
7
- name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Kannada Romanization, 1972
7
+ name: Romanization of Kannada -- UNGEGN 4.0
8
8
  url: https://www.eki.ee/wgrs/rom1_kn.pdf
9
9
  creation_date: 1972
10
10
  confirmation_date: 2016
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:mal
5
5
  source_script: Mlym
6
6
  destination_script: Latn
7
- name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES --Malayalam Romanization Version 4.0
7
+ name: Romanization of Malayalam -- UNGEGN 4.0
8
8
  url: https://www.eki.ee/wgrs/rom1_ml.htm
9
9
  creation_date: 1972
10
10
  confirmation_date: 2016
@@ -1,10 +1,10 @@
1
1
  metadata {
2
- authority_id: ungegn
2
+ authority_id: un
3
3
  id: 2016
4
4
  language: iso-639-2:mar
5
5
  source_script: Deva
6
6
  destination_script: Latn
7
- name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Marathi Romanization, 1972
7
+ name: Romanization of Marathi -- UNGEGN 4.0
8
8
  url: https://www.eki.ee/wgrs/rom1_mr.pdf
9
9
  creation_date: 1972
10
10
  confirmation_date: 2016
@@ -0,0 +1,119 @@
1
+ metadata {
2
+ authority_id: un
3
+ id: 1977
4
+ language: iso-639-2:mkd
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: Romanization of Macedonian geographical names (1977)
8
+ url: https://www.eki.ee/wgrs/v2_2/rom1_mk.htm
9
+ creation_date: 1977
10
+ description: |
11
+ The United Nations recommended system was approved in 1977 (III/11), based on the romanization of the Serbo-Croatian and Macedonian Cyrillic alphabets that had long been employed in official gazetteers and maps of Yugoslavia. The table was published as an annex to the resolution (Third United Nations Conference on the Standardization of Geographical Names. Athens, 17 August - 7 September 1977. Vol. I. Report of the Conference, pp. 29, 31).
12
+ The system is used in The former Yugoslav Republic of Macedonia (see e.g. Report of The former Yugoslav Republic of Macedonia. Seventh United Nations Conference on the Standardization of Geographical Names. New York, 13-22 January 1998. Document E/CONF.91/CRP.23) and in international cartographic products.
13
+ The Cyrillic alphabet is used. The romanization table is unambiguous and can be applied automatically. The system is on the whole reversible with the exception of the characters ѓ and ќ. These are romanized as g and k, respectively, before е and и. But also г and к are occasionally used before е and и, so, for example, the name Makedonija is reconstituted as Македонија, not Маќедонија in the Cyrillic source script.
14
+ }
15
+
16
+ tests {
17
+ test "Маќедонија", "Makedonija"
18
+ test "Општина Ердут", "Opština Erdut"
19
+ test "Општина Двор", "Opština Dvor"
20
+ test "ЛУЃЕ луѓе", "LUGE luge"
21
+ test "ЅВЕЗДА ѕвезда Ѕвезда", "DZVEZDA dzvezda Dzvezda"
22
+ test "ЌАРУВАЊЕ ќарување", "ĆARUVANJE ćaruvanje"
23
+ }
24
+
25
+ dependency "posix", import: true
26
+
27
+ stage {
28
+ sub "Ѓ", "G", after: any("ЕИеи")
29
+ sub "ѓ", "g", after: any("ЕИеи")
30
+ sub "Ќ", "K", after: any("ЕИеи")
31
+ sub "ќ", "k", after: any("ЕИеи")
32
+
33
+ # CHARACTERS
34
+ parallel {
35
+ sub "А", "A"
36
+ sub "Б", "B"
37
+ sub "В", "V"
38
+ sub "Г", "G"
39
+ sub "Д", "D"
40
+ sub "Ѓ", "Đ" # Đ
41
+ sub "Е", "E"
42
+ sub "Ж", "Ž" # Ž
43
+ sub "З", "Z"
44
+ sub "Ѕ", "Dz"
45
+ sub "И", "I"
46
+ sub "Ј", "J"
47
+ sub "К", "K"
48
+ sub "Л", "L"
49
+ sub "Љ", "Lj"
50
+ sub "М", "M"
51
+ sub "Н", "N"
52
+ sub "Њ", "Nj"
53
+ sub "О", "O"
54
+ sub "П", "P"
55
+ sub "Р", "R"
56
+ sub "С", "S"
57
+ sub "Т", "T"
58
+ sub "Ќ", "Ć" # Ć
59
+ sub "У", "U"
60
+ sub "Ф", "F"
61
+ sub "Х", "H"
62
+ sub "Ц", "C"
63
+ sub "Ч", "Č" # Č
64
+ sub "Џ", "Dž" # Dž
65
+ sub "Ш", "Š" # Š
66
+ sub "а", "a"
67
+ sub "б", "b"
68
+ sub "в", "v"
69
+ sub "г", "g"
70
+ sub "д", "d"
71
+ sub "ѓ", "đ" # đ
72
+ sub "е", "e"
73
+ sub "ж", "ž" # ž
74
+ sub "з", "z"
75
+ sub "ѕ", "dz"
76
+ sub "и", "i"
77
+ sub "ј", "j"
78
+ sub "к", "k"
79
+ sub "л", "l"
80
+ sub "љ", "lj"
81
+ sub "м", "m"
82
+ sub "н", "n"
83
+ sub "њ", "nj"
84
+ sub "о", "o"
85
+ sub "п", "p"
86
+ sub "р", "r"
87
+ sub "с", "s"
88
+ sub "т", "t"
89
+ sub "ќ", "ć" # ć
90
+ sub "у", "u"
91
+ sub "ф", "f"
92
+ sub "х", "h"
93
+ sub "ц", "c"
94
+ sub "ч", "č" # č
95
+ sub "џ", "dž" # dž
96
+ sub "ш", "š" # š
97
+ }
98
+
99
+ # POSTRULES
100
+ # rewritten by hand to work properly
101
+ # DZ
102
+ sub capture(maybe(upper)) + "Dz" + capture(upper), ref(1) + "DZ" + ref(2)
103
+ sub capture(upper) + "Dz" + capture(maybe(upper)), ref(1) + "DZ" + ref(2)
104
+
105
+ #LJ
106
+ sub capture(upper) + "Lj" + capture(maybe(upper)), ref(1) + "LJ" + ref(2)
107
+ sub capture(maybe(upper)) + "Lj" + capture(upper), ref(1) + "LJ" + ref(2)
108
+
109
+ #NJ
110
+ sub capture(upper) + "Nj" + capture(maybe(upper)), ref(1) + "NJ" + ref(2)
111
+ sub capture(maybe(upper)) + "Nj" + capture(upper), ref(1) + "NJ" + ref(2)
112
+
113
+ #DŽ
114
+ sub capture(upper) + "Dž" + capture(maybe(upper)), ref(1) + "DŽ" + ref(2)
115
+ sub capture(maybe(upper)) + "Dž" + capture(upper), ref(1) + "DŽ" + ref(2)
116
+
117
+ compose
118
+ }
119
+
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:mon
5
5
  source_script: Mong
6
6
  destination_script: Latn
7
- name: Mongolian Romanization in China, Version 4.0 (general)
7
+ name: Romanization of Mongolian in China -- UNGEGN 4.0
8
8
  url: http://www.eki.ee/wgrs/rom1_mnc.htm
9
9
  creation_date: 2013-09
10
10
  description: |
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:mon
5
5
  source_script: Mong
6
6
  destination_script: Latn
7
- name: Mongolian Romanization in China, Version 4.0 (phonetic)
7
+ name: Romanization of Mongolian in China -- UNGEGN 4.0 (phonetic)
8
8
  url: http://www.eki.ee/wgrs/rom1_mnc.htm
9
9
  creation_date: 2013-09
10
10
  description: |
@@ -1,10 +1,10 @@
1
1
  metadata {
2
- authority_id: ungegn
2
+ authority_id: un
3
3
  id: 1972
4
4
  language: iso-639-2:nep
5
5
  source_script: Deva
6
6
  destination_script: Latn
7
- name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Nepali Romanization, 1972
7
+ name: Romanization of Nepali (1972)
8
8
  url: https://www.eki.ee/wgrs/v3_0/rom1_ne.pdf
9
9
  creation_date: 1972
10
10
  confirmation_date: 2010
@@ -1,10 +1,10 @@
1
1
  metadata {
2
- authority_id: ungegn
2
+ authority_id: un
3
3
  id: 2013
4
4
  language: iso-639-2:nep
5
5
  source_script: Deva
6
6
  destination_script: Latn
7
- name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Nepali Romanization, 1972
7
+ name: Romanization of Nepali (2013)
8
8
  url: https://www.eki.ee/wgrs/v3_0/rom1_ne.pdf
9
9
  creation_date: 1972
10
10
  confirmation_date: 2013
@@ -1,10 +1,10 @@
1
1
  metadata {
2
- authority_id: ungegn
2
+ authority_id: un
3
3
  id: 1972
4
4
  language: iso-639-2:ori
5
5
  source_script: Orya
6
6
  destination_script: Latn
7
- name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Oriya Romanization, 1972
7
+ name: Romanization of Oriya (1972)
8
8
  url: http://www.eki.ee/wgrs/v2_2/rom1_or.pdf
9
9
  creation_date: 1972
10
10
  confirmation_date: 2003
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:pan
5
5
  source_script: Guru
6
6
  destination_script: Latn
7
- name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES --Panjabi Romanization Version 4.0
7
+ name: Romanization of Panjabi -- UNGEGN 4.0 (1972)
8
8
  url: https://www.eki.ee/wgrs/rom1_pa.htm
9
9
  creation_date: 1972
10
10
  confirmation_date: 2016
@@ -5,7 +5,7 @@ metadata {
5
5
  # prs stands for Dari (https://iso639-3.sil.org/code/prs&_ga=GA1.2.2054538372.1574092823)
6
6
  source_script: Arab
7
7
  destination_script: Latn
8
- name: Persian UN 1967
8
+ name: Romanization of Persian (1967)
9
9
  url: http://www.eki.ee/wgrs/v2_2/rom1_fa.htm
10
10
  creation_date: 1967
11
11
  confirmation_date: 01-2003
@@ -130,20 +130,20 @@ stage {
130
130
 
131
131
  # NOTE 1
132
132
  # Sun letters
133
- sub boundary + "\u0627\u0644\u062a", "ot t" # الت
134
- sub boundary + "\u0627\u0644\u062b", "os̄ s̄" # الث
135
- sub boundary + "\u0627\u0644\u062f", "od d" # الد
136
- sub boundary + "\u0627\u0644\u0630", "oz̄ z̄" # الذ
137
- sub boundary + "\u0627\u0644\u0631", "or r" # الر
138
- sub boundary + "\u0627\u0644\u0632", "oz z" # الز
139
- sub boundary + "\u0627\u0644\u0633", "os s" # الس
140
- sub boundary + "\u0627\u0644\u0634", "osh sh" # الش
141
- sub boundary + "\u0627\u0644\u0635", "oş ş" # الص
142
- sub boundary + "\u0627\u0644\u0636", "oẕ ẕ" # الض
143
- sub boundary + "\u0627\u0644\u0637", "oţ ţ" # الط
144
- sub boundary + "\u0627\u0644\u0638", "oz̧ z̧" # الظ
145
- sub boundary + "\u0627\u0644\u0644", "ol l" # الل
146
- sub boundary + "\u0627\u0644\u0646", "on n" # الن
133
+ sub boundary + "\u0627\u0644\u062a" + maybe("\u0651"), "ot t" # الت
134
+ sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), "os̄ s̄" # الث
135
+ sub boundary + "\u0627\u0644\u062f" + maybe("\u0651"), "od d" # الد
136
+ sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), "oz̄ z̄" # الذ
137
+ sub boundary + "\u0627\u0644\u0631" + maybe("\u0651"), "or r" # الر
138
+ sub boundary + "\u0627\u0644\u0632" + maybe("\u0651"), "oz z" # الز
139
+ sub boundary + "\u0627\u0644\u0633" + maybe("\u0651"), "os s" # الس
140
+ sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "osh sh" # الش
141
+ sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "oş ş" # الص
142
+ sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "oẕ ẕ" # الض
143
+ sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "oţ ţ" # الط
144
+ sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), "oz̧ z̧" # الظ
145
+ sub boundary + "\u0627\u0644\u0644" + maybe("\u0651"), "ol l" # الل
146
+ sub boundary + "\u0627\u0644\u0646" + maybe("\u0651"), "on n" # الن
147
147
 
148
148
  sub "\u0650\u064a\u0651", "īy" # ـِيَّ
149
149
  sub "\u0650\u064a", "iy", after: any("\u064e\u064f") # ـِي kasra followed by ي
@@ -1,10 +1,10 @@
1
1
  metadata {
2
- authority_id: ungegn
2
+ authority_id: un
3
3
  id: 1987
4
4
  language: iso-639-2:rus
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Russian Romanization system
7
+ name: Romanization of Russian (1987)
8
8
  url: http://www.eki.ee/wgrs/rom1_ru.htm
9
9
  creation_date: 1987
10
10
  confirmation_date: 2016
@@ -4,7 +4,8 @@ metadata {
4
4
  language: iso-639-2:sin
5
5
  source_script: Sinh
6
6
  destination_script: Latn
7
- name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES --Sinhalese Romanization Version 4.0
7
+ name: Romanization of Sinhalese -- UNGEGN 4.0 (1972)
8
+ source: "Second United Nations Conference on the Standardization of Geographical Names. London, 10–31 May 1972. Vol. II. Technical papers, pp. 151–152."
8
9
  url: https://www.eki.ee/wgrs/rom1_ml.htm
9
10
  creation_date: 1972
10
11
  confirmation_date: 2016
@@ -18,7 +19,6 @@ metadata {
18
19
  Vowels and diphthongs are marked in two ways: as independent characters (used syllable-initially) and in an
19
20
  abbreviated form, to denote vowels after consonants.
20
21
 
21
-
22
22
  notes:
23
23
  - |
24
24
  The character ඇ was romanized as a͝i and the character ඈ as ai in Sharma's table, but there was no romanization for the character ඓ which,
@@ -37,13 +37,13 @@ metadata {
37
37
 
38
38
  tests {
39
39
  test "ශී‍්‍ර ලංකාවේ කී‍්‍රඩාව ඉතිහාසයේ ඉහළම තැනකට ගේන්න කටයුතු කරනවා", "shīra laṁkāve kīraḍāva itihāsaye ihaḷama tæ̆nakaṭa genna kaṭayutu karanavā"
40
- test "කොච්චිකඬේ මෝයකට අසල නෑමට ගිය තරුණයෝ ෩ක් මරුට - මිතුරාගේ උපන් දිනය සැමරීමට ඇවිත්", "kŏchchikaඬe moyakaṭa asala næmaṭa giya taruṇayo 3k maruṭa - miturāge upan dinaya sæ̆marīmaṭa æ̆vit"
40
+ test "කොච්චිකඬේ මෝයකට අසල නෑමට ගිය තරුණයෝ ෩ක් මරුට - මිතුරාගේ උපන් දිනය සැමරීමට ඇවිත්", "kŏchchikaṇḍae moyakaṭa asala næmaṭa giya taruṇayo 3k maruṭa - miturāge upan dinaya sæ̆marīmaṭa æ̆vit"
41
41
  test "ලෝක ළමා දිනයදා සිසුන් පිරිසක් කසිප්පු බීලා", "loka ḷamā dinayadā sisun pirisak kasippu bīlā"
42
42
  test "කෝටි 16ක හෙරොයින් සමග දන්කොටුවේදී 7ක් දැලේ", "koṭi 16ka hĕrŏyin samaga dankŏṭuvedī 7k dæ̆le"
43
43
  test "මිනුවන්ගොඩ පීසීආර් දෙදහසක් සිදුකරයි", "minuvangŏḍa pīsīār dĕdahasak sidukarayi"
44
44
  test "පාස්කු ප‍්‍රහාරය වගේම පාස්කු ප්‍රෝඩාව ගැනත් සොයන්න කොමිසමක් පත්කළ යුතුයි - විපක්‍ෂ නායක සජිත් පේ‍්‍රමදාස", "pāsku parahāraya vagema pāsku proḍāva gæ̆nat sŏyanna kŏmisamak patkaḷa yutuyi - vipakṣha nāyaka sajit peramadāsa"
45
45
  test "ට‍්‍රම්ප්ගේ සෞඛ්‍යය තීරණාත්මකයි - ට්විටර් හරහා ජනතාව අමතයි", "ṭarampge saukhyaya tīraṇātmakayi - ṭviṭar harahā janatāva amatayi"
46
- test "පාස්කු දා ප‍්‍රහාරය පිළිබඳ පරීක්‍ෂණවලින් කිසිවකුට අසාධාරණයක් වීමට ඉඩ දෙන්නේ නෑ - අගමැති", "pāsku dā parahāraya piḷibaඳ parīkṣhaṇavalin kisivakuṭa asādhāraṇayak vīmaṭa iḍa dĕnne næ - agamæ̆ti"
46
+ test "පාස්කු දා ප‍්‍රහාරය පිළිබඳ පරීක්‍ෂණවලින් කිසිවකුට අසාධාරණයක් වීමට ඉඩ දෙන්නේ නෑ - අගමැති", "pāsku dā parahāraya piḷibanda parīkṣhaṇavalin kisivakuṭa asādhāraṇayak vīmaṭa iḍa dĕnne næ - agamæ̆ti"
47
47
  test "දිල්ලි කැපිටල්ස් සහ කෝලිගේ බැංගලෝර් තෙවැනි ජය ලබයි", "dilli kæ̆piṭals saha kolige bæ̆ṁgalor tĕvæ̆ni jaya labayi"
48
48
  test "ශ‍්‍රී ලාංකික සම්භවයක් සහිත ප‍්‍රංශයේ පවුලක 5 ක් ඝාතනය කරලා", "sharī lāṁkika sambhavayak sahita paraṁshaye pavulaka 5 k ghātanaya karalā"
49
49
  test "පැතිකුදය ඉක්මනින් සුව කරන ප‍්‍රතිකාර", "pæ̆tikudaya ikmanin suva karana paratikāra"
@@ -171,6 +171,18 @@ stage {
171
171
  sub "ෆ", "fa"
172
172
  sub "ළ", "ḷa"
173
173
 
174
+ # Prenasalized sounds
175
+ sub "ඟ", "ṅga"
176
+ sub "ඦ", "ñja"
177
+ sub "ඬ", "ṇḍa"
178
+ sub "ඳ", "nda"
179
+ sub "ඹ", "mba"
180
+
181
+ # Other ligatures
182
+ sub "ක්", "k"
183
+ sub "ඥ", "jña"
184
+ sub "න්", "n"
185
+
174
186
  # numbers
175
187
  sub "\u0DE6", "0"
176
188
  sub "\u0DE7", "1"
@@ -0,0 +1,47 @@
1
+ metadata {
2
+ authority_id: un
3
+ id: 1997
4
+ language: iso-639-2:srp
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: Romanization of Serbo-Croatian (1972)
8
+ url: http://www.eki.ee/wgrs/rom1_sr.htm
9
+ creation_date: 1997
10
+ description: |
11
+ The United Nations recommended system was approved in 1977 (III/11), based on the Roman equivalent of the Serbo-Croatian Cyrillic alphabet that had long been employed in official gazetteers and maps of Yugoslavia. The table was published as an annex to the resolution. The term relating to the language (Serbian instead of Serbo-Croatian) was modified in 2002 (resolution VIII/14).
12
+ The system is used in Serbia, Montenegro, and Bosnia and Herzegovina. It is also used in international cartographic products.
13
+ Serbian uses the Cyrillic script that is alphabetic. The romanization table is unambiguous and can be applied automatically. The system is reversible.
14
+ }
15
+
16
+ tests {
17
+ test "Шупља Стена", "Šuplja Stena"
18
+ test "Чукарица", "Čukarica"
19
+ test "Црна Трава", "Crna Trava"
20
+ test "Херцег Нови", "Herceg Novi"
21
+ test "Улцињ", "Ulcinj"
22
+ test "Ужице", "Užice"
23
+ test "Тресаначка Река", "Tresanačka Reka"
24
+ test "Сјеница", "Sjenica"
25
+ test "Рожаје", "Rožaje"
26
+ test "Пљевља", "Pljevlja"
27
+ test "Оџаци", "Odžaci"
28
+ test "Никшић", "Nikšić"
29
+ test "Медвеђа", "Medveđa"
30
+ test "Лозница", "Loznica"
31
+ test "Књажевац", "Knjaževac"
32
+ test "Зрењанин", "Zrenjanin"
33
+ test "Житорађа", "Žitorađa"
34
+ test "Ервеник", "Ervenik"
35
+ test "Доње Љупче", "Donje Ljupče"
36
+ test "Гусиње", "Gusinje"
37
+ test "ГУСИЊЕ", "GUSINJE"
38
+ test "Врњачка Бања", "Vrnjačka Banja"
39
+ test "Бијело Поље", "Bijelo Polje"
40
+ test "Алибунар", "Alibunar"
41
+ }
42
+
43
+ dependency "alalc-srp-Cyrl-Latn-2013", as: srpalatn
44
+
45
+ stage {
46
+ run map.srpalatn.stage.main
47
+ }