interscript 0.1.3 → 0.1.9

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (294) hide show
  1. checksums.yaml +4 -4
  2. data/README.adoc +10 -11
  3. data/aliases.json +1 -0
  4. data/lib/interscript.rb +62 -59
  5. data/lib/interscript/command.rb +3 -2
  6. data/lib/interscript/fs.rb +96 -0
  7. data/lib/interscript/mapping.rb +36 -17
  8. data/lib/interscript/opal.rb +196 -0
  9. data/lib/interscript/opal/entrypoint.rb +20 -0
  10. data/lib/interscript/opal/exports.rb +11 -0
  11. data/lib/interscript/opal/maps.js.erb +8 -0
  12. data/lib/interscript/version.rb +1 -1
  13. data/maps/acadsin-zho-Hani-Latn-2002.yaml +6 -2
  14. data/maps/alalc-amh-Ethi-Latn-1997.yaml +513 -0
  15. data/maps/alalc-amh-Ethi-Latn-2011.yaml +138 -0
  16. data/maps/alalc-ara-Arab-Latn-1997.yaml +1287 -0
  17. data/maps/alalc-asm-Deva-Latn-1997.yaml +259 -0
  18. data/maps/alalc-asm-Deva-Latn-2012.yaml +55 -0
  19. data/maps/alalc-aze-Arab-Latn-1997.yaml +376 -0
  20. data/maps/alalc-aze-Cyrl-Latn-1997.yaml +145 -0
  21. data/maps/{alalc-bel-cyrl-latn-1997.yaml → alalc-bel-Cyrl-Latn-1997.yaml} +7 -3
  22. data/maps/alalc-ben-Beng-Latn-1997.yaml +291 -0
  23. data/maps/alalc-ben-Beng-Latn-2017.yaml +1 -1
  24. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +5 -1
  25. data/maps/alalc-div-Thaa-Latn-1997.yaml +211 -0
  26. data/maps/alalc-ell-Grek-Latn-1997.yaml +7 -4
  27. data/maps/alalc-ell-Grek-Latn-2010.yaml +3 -5
  28. data/maps/alalc-guj-Gujr-Latn-1997.yaml +266 -0
  29. data/maps/alalc-guj-Gujr-Latn-2011.yaml +64 -0
  30. data/maps/alalc-hin-Deva-Latn-1997.yaml +303 -0
  31. data/maps/alalc-hin-Deva-Latn-2011.yaml +65 -0
  32. data/maps/alalc-kan-Kana-Latn-1997.yaml +274 -0
  33. data/maps/alalc-kan-Kana-Latn-2011.yaml +63 -0
  34. data/maps/alalc-kat-Geok-Latn-1997.yaml +2 -3
  35. data/maps/alalc-kat-Geor-Latn-1997.yaml +5 -1
  36. data/maps/alalc-kor-Hang-Latn-1997.yaml +6 -2
  37. data/maps/alalc-mal-Mlym-Latn-1997.yaml +303 -0
  38. data/maps/alalc-mal-Mlym-Latn-2012.yaml +73 -0
  39. data/maps/alalc-mar-Deva-Latn-1997.yaml +189 -0
  40. data/maps/alalc-mar-Deva-Latn-2011.yaml +45 -0
  41. data/maps/{alalc-mkd-cyrl-latn-1997.yaml → alalc-mkd-Cyrl-Latn-1997.yaml} +1 -1
  42. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +1 -1
  43. data/maps/alalc-mon-Cyrl-Latn-1997.yaml +220 -0
  44. data/maps/alalc-ori-Orya-Latn-1997.yaml +284 -0
  45. data/maps/alalc-ori-Orya-Latn-2011.yaml +67 -0
  46. data/maps/alalc-pan-Guru-Latn-1997.yaml +256 -0
  47. data/maps/alalc-pan-Guru-Latn-2011.yaml +78 -0
  48. data/maps/alalc-per-Arab-Latn-1997.yaml +375 -0
  49. data/maps/alalc-pli-Deva-Latn-2012.yaml +144 -0
  50. data/maps/alalc-pra-Deva-Latn-2012.yaml +47 -0
  51. data/maps/alalc-rus-Cyrl-Latn-1997.yaml +225 -0
  52. data/maps/alalc-rus-Cyrl-Latn-2012.yaml +162 -0
  53. data/maps/alalc-san-Deva-Latn-2012.yaml +241 -0
  54. data/maps/alalc-sin-Sinh-Latn-1997.yaml +292 -0
  55. data/maps/alalc-sin-Sinh-Latn-2011.yaml +71 -0
  56. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +5 -1
  57. data/maps/{alalc-srp-cyrl-latn-2013.yaml → alalc-srp-Cyrl-Latn-2013.yaml} +1 -1
  58. data/maps/alalc-tam-Taml-Latn-1997.yaml +62 -0
  59. data/maps/alalc-tam-Taml-Latn-2011.yaml +58 -0
  60. data/maps/alalc-tel-Telu-Latn-1997.yaml +284 -0
  61. data/maps/alalc-tel-Telu-Latn-2011.yaml +64 -0
  62. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +5 -1
  63. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +1 -1
  64. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +1 -1
  65. data/maps/az-aze-Cyrl-Latn-1939.yaml +105 -0
  66. data/maps/az-aze-Cyrl-Latn-1958.yaml +45 -0
  67. data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +1 -2
  68. data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +1 -1
  69. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +1 -3
  70. data/maps/bgn-kor-Hang-Latn-1943.yaml +8 -4
  71. data/maps/bgn-kor-Kore-Latn-1943.yaml +4 -4
  72. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +1 -1
  73. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +1 -1
  74. data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +532 -0
  75. data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +598 -0
  76. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +1 -1
  77. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +111 -104
  78. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +188 -0
  79. data/maps/bgnpcgn-bal-Arab-Latn-2008.yaml +329 -0
  80. data/maps/{bgnpcgn-bel-cyrl-latn-1979.yaml → bgnpcgn-bel-Cyrl-Latn-1979.yaml} +5 -1
  81. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +14 -10
  82. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +5 -1
  83. data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +184 -0
  84. data/maps/bgnpcgn-div-Thaa-Latn-1988.yaml +75 -0
  85. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +8 -5
  86. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +5 -2
  87. data/maps/bgnpcgn-far-Latn-Latn-1964.yaml +28 -0
  88. data/maps/{bgnpcgn-per-Arab-Latn-1956.yaml → bgnpcgn-fas-Arab-Latn-1956.yaml} +5 -2
  89. data/maps/bgnpcgn-isl-Latn-Latn-1964.yaml +37 -0
  90. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +1 -1
  91. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +5 -1
  92. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +1 -2
  93. data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.yaml +247 -0
  94. data/maps/bgnpcgn-kir-Cyrl-Latn-1979.yaml +218 -0
  95. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +18 -18
  96. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +3 -3
  97. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +3 -3
  98. data/maps/bgnpcgn-kur-Arab-Latn-2007.yaml +249 -0
  99. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +5 -1
  100. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +2 -2
  101. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +223 -0
  102. data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +230 -0
  103. data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +338 -0
  104. data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +673 -0
  105. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +459 -0
  106. data/maps/bgnpcgn-pus-Arab-Latn-1968.yaml +377 -0
  107. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +168 -0
  108. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +5 -1
  109. data/maps/bgnpcgn-srp-Cyrl-Latn-1962.yaml +73 -0
  110. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +5 -1
  111. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +220 -0
  112. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +240 -0
  113. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +5 -2
  114. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +3 -92
  115. data/maps/bgnpcgn-urd-Arab-Latn-2007.yaml +459 -0
  116. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +127 -0
  117. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +82 -0
  118. data/maps/{bgnpcgn-chn-Hans-Latn-1979.yaml → bgnpcgn-zho-Hans-Latn-1979.yaml} +1 -1
  119. data/maps/bis-asm-Beng-Latn-13194-1991.yaml +159 -0
  120. data/maps/bis-ben-Beng-Latn-13194-1991.yaml +156 -0
  121. data/maps/bis-dev-Deva-Latn-13194-1991.yaml +184 -0
  122. data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +181 -0
  123. data/maps/bis-kan-Kana-Latn-13194-1991.yaml +173 -0
  124. data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +176 -0
  125. data/maps/bis-ori-Orya-Latn-13194-1991.yaml +175 -0
  126. data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +175 -0
  127. data/maps/bis-tel-Telu-Latn-13194-1991.yaml +170 -0
  128. data/maps/bis-tml-Taml-Latn-13194-1991.yaml +155 -0
  129. data/maps/by-bel-Cyrl-Latn-1998.yaml +9 -5
  130. data/maps/by-bel-Cyrl-Latn-2007.yaml +4 -4
  131. data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +899 -0
  132. data/maps/din-hin-Deva-Latn-33904-2018.yaml +100 -0
  133. data/maps/din-kat-Geor-Latn-32707-2010.yaml +145 -0
  134. data/maps/din-mar-Deva-Latn-33904-2018.yaml +84 -0
  135. data/maps/din-nep-Deva-Latn-33904-2018.yaml +119 -0
  136. data/maps/din-pli-Deva-Latn-33904-2018.yaml +75 -0
  137. data/maps/din-pra-Deva-Latn-33904-2018.yaml +63 -0
  138. data/maps/din-san-Deva-Latn-33904-2018.yaml +338 -0
  139. data/maps/din-tam-Taml-Latn-33903-2016.yaml +213 -0
  140. data/maps/dos-nep-Deva-Latn-1997.yaml +47 -0
  141. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +7 -8
  142. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +6 -7
  143. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +2 -3
  144. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +2 -3
  145. data/maps/ggg-kat-Geor-Latn-2002.yaml +5 -2
  146. data/maps/{gki-bel-cyrl-latn-1992.yaml → gki-bel-Cyrl-Latn-1992.yaml} +2 -2
  147. data/maps/{gki-bel-cyrl-latn-2000.yaml → gki-bel-Cyrl-Latn-2000.yaml} +2 -2
  148. data/maps/{gost-rus-cyrl-latn-16876-71-1983.yaml → gost-rus-Cyrl-Latn-16876-71-1983.yaml} +8 -4
  149. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +157 -0
  150. data/maps/hk-yue-Hani-Latn-1888.yaml +1 -1
  151. data/maps/icao-bel-Cyrl-Latn-9303.yaml +1 -6
  152. data/maps/icao-bul-Cyrl-Latn-9303.yaml +1 -5
  153. data/maps/{icao-per-Arab-Latn-9303.yaml → icao-fas-Arab-Latn-9303.yaml} +1 -2
  154. data/maps/icao-heb-Hebr-Latn-9303.yaml +1 -1
  155. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +1 -1
  156. data/maps/icao-rus-Cyrl-Latn-9303.yaml +1 -2
  157. data/maps/icao-srp-Cyrl-Latn-9303.yaml +1 -1
  158. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +1 -2
  159. data/maps/iso-ara-Arab-Latn-233-1984.yaml +323 -0
  160. data/maps/iso-asm-Beng-Latn-15919-2001.yaml +75 -0
  161. data/maps/iso-ben-Beng-Latn-15919-2001.yaml +175 -0
  162. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +11 -8
  163. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +8 -5
  164. data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +220 -0
  165. data/maps/iso-hin-Deva-Latn-15919-2001.yaml +87 -0
  166. data/maps/iso-inc-Deva-Latn-15919-2001.yaml +61 -0
  167. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +10 -6
  168. data/maps/iso-kan-Kana-Latn-15919-2001.yaml +220 -0
  169. data/maps/iso-kat-Geor-Latn-9984-1996.yaml +145 -0
  170. data/maps/iso-kor-Hang-Latn-1996-method1.yaml +240 -0
  171. data/maps/iso-kor-Hang-Latn-1996-method2.yaml +226 -0
  172. data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +281 -0
  173. data/maps/iso-mar-Deva-Latn-15919-2001.yaml +75 -0
  174. data/maps/iso-nep-Deva-Latn-15919-2001.yaml +87 -0
  175. data/maps/iso-ori-Orya-Latn-15919-2001.yaml +193 -0
  176. data/maps/iso-pan-Guru-Latn-15919-2001.yaml +222 -0
  177. data/maps/iso-pli-Beng-Latn-15919-2001.yaml +73 -0
  178. data/maps/iso-pli-Deva-Latn-15919-2001.yaml +74 -0
  179. data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +219 -0
  180. data/maps/iso-pli-Thai-Latn-15919-2001.yaml +55 -0
  181. data/maps/iso-pra-Deva-Latn-15919-2001.yaml +59 -0
  182. data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +366 -0
  183. data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +3 -4
  184. data/maps/iso-san-Deva-Latn-15919-2001.yaml +220 -0
  185. data/maps/iso-tam-Taml-Latn-15919-2001.yaml +159 -0
  186. data/maps/iso-tel-Telu-Latn-15919-2001.yaml +220 -0
  187. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +2 -2
  188. data/maps/kp-kor-Hang-Latn-2002.yaml +29 -21
  189. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +3 -3
  190. data/maps/masm-mon-Cyrl-Latn-5217-2012.yaml +163 -0
  191. data/maps/masm-mon-Latn-Cyrl-5217-2012.yaml +200 -0
  192. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +1 -1
  193. data/maps/moct-kor-Hang-Latn-2000.yaml +6 -2
  194. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +1 -1
  195. data/maps/mv-div-Thaa-Latn-1987.yaml +200 -0
  196. data/maps/mvd-bel-Cyrl-Latn-2008.yaml +225 -0
  197. data/maps/mvd-bel-Cyrl-Latn-2010.yaml +63 -0
  198. data/maps/mvd-rus-Cyrl-Latn-2008.yaml +109 -0
  199. data/maps/mvd-rus-Cyrl-Latn-2010.yaml +37 -0
  200. data/maps/odni-ara-Arab-Latn-2004.yaml +137 -0
  201. data/maps/odni-ara-Arab-Latn-2015.yaml +315 -0
  202. data/maps/odni-aze-Cyrl-Latn-2015.yaml +144 -0
  203. data/maps/odni-bel-Cyrl-Latn-2015.yaml +148 -0
  204. data/maps/odni-bul-Cyrl-Latn-2005.yaml +90 -0
  205. data/maps/odni-bul-Cyrl-Latn-2015.yaml +96 -0
  206. data/maps/odni-che-Cyrl-Latn-2015.yaml +169 -0
  207. data/maps/odni-fas-Arab-Latn-2004.yaml +276 -0
  208. data/maps/odni-fas-Arab-Latn-2015.yaml +406 -0
  209. data/maps/odni-hin-Deva-Latn-2004.yaml +182 -0
  210. data/maps/odni-hin-Deva-Latn-2015.yaml +258 -0
  211. data/maps/odni-kat-Geor-Latn-2015.yaml +2 -3
  212. data/maps/odni-kaz-Cyrl-Latn-2015.yaml +148 -0
  213. data/maps/odni-kir-Cyrl-Latn-2015.yaml +136 -0
  214. data/maps/odni-kor-Hang-Latn-2015.yaml +375 -0
  215. data/maps/odni-mkd-Cyrl-Latn-2005.yaml +21 -0
  216. data/maps/odni-mkd-Cyrl-Latn-2015.yaml +122 -0
  217. data/maps/odni-prs-Arab-Latn-2004.yaml +123 -0
  218. data/maps/odni-prs-Arab-Latn-2015.yaml +228 -0
  219. data/maps/odni-rus-Cyrl-Latn-2015.yaml +77 -0
  220. data/maps/odni-srp-Cyrl-Latn-2005.yaml +36 -0
  221. data/maps/odni-srp-Cyrl-Latn-2015.yaml +129 -0
  222. data/maps/odni-tat-Cyrl-Latn-2015.yaml +142 -0
  223. data/maps/odni-tgk-Cyrl-Latn-2015.yaml +148 -0
  224. data/maps/odni-tuk-Cyrl-Latn-2015.yaml +170 -0
  225. data/maps/odni-uig-Cyrl-Latn-2015.yaml +138 -0
  226. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +6 -2
  227. data/maps/odni-urd-Arab-Latn-2015.yaml +221 -0
  228. data/maps/odni-uzb-Cyrl-Latn-2015.yaml +166 -0
  229. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +5 -5
  230. data/maps/royin-tha-Thai-Latn-1968.yaml +9 -5
  231. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +5 -5
  232. data/maps/royin-tha-Thai-Latn-1999.yaml +8 -4
  233. data/maps/sac-zho-Hans-Latn-1979.yaml +5 -1
  234. data/maps/sasm-mon-Mong-Latn-general-1978.yaml +389 -0
  235. data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +354 -0
  236. data/maps/ses-ara-Arab-Latn-1930.yaml +283 -0
  237. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +1 -1
  238. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +6 -2
  239. data/maps/ua-ukr-Cyrl-Latn-2007.yaml +75 -0
  240. data/maps/ua-ukr-Cyrl-Latn-2010.yaml +192 -0
  241. data/maps/un-amh-Ethi-Latn-2016.yaml +602 -0
  242. data/maps/un-ara-Arab-Latn-1971.yaml +139 -0
  243. data/maps/un-ara-Arab-Latn-1972.yaml +159 -0
  244. data/maps/un-ara-Arab-Latn-2017.yaml +420 -0
  245. data/maps/un-asm-Beng-Latn-1972.yaml +223 -0
  246. data/maps/un-bel-Cyrl-Latn-2007.yaml +4 -4
  247. data/maps/un-ben-Beng-Latn-2016.yaml +1 -1
  248. data/maps/{un-ell-Grek-Latn-phonetic-1987.yaml → un-ell-Grek-Latn-1987-phonetic.yaml} +44 -44
  249. data/maps/un-ell-Grek-Latn-1987-tl.yaml +3 -4
  250. data/maps/un-ell-Grek-Latn-1987-ts.yaml +3 -4
  251. data/maps/un-guj-Gujr-Latn-1972.yaml +229 -0
  252. data/maps/un-hin-Deva-Latn-2016.yaml +316 -0
  253. data/maps/un-kan-Kana-Latn-2016.yaml +254 -0
  254. data/maps/un-mal-Mlym-Latn-1972.yaml +251 -0
  255. data/maps/un-mar-Deva-Latn-2016.yaml +102 -0
  256. data/maps/un-mon-Mong-Latn-general-2013.yaml +264 -0
  257. data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +264 -0
  258. data/maps/un-nep-Deva-Latn-1972.yaml +269 -0
  259. data/maps/un-nep-Deva-Latn-2013.yaml +74 -0
  260. data/maps/un-ori-Orya-Latn-1972.yaml +247 -0
  261. data/maps/un-pan-Guru-Latn-1972.yaml +402 -0
  262. data/maps/un-prs-Arab-Latn-1967.yaml +236 -0
  263. data/maps/un-rus-Cyrl-Latn-1987.yaml +2 -2
  264. data/maps/un-tam-Taml-Latn-1972.yaml +194 -0
  265. data/maps/un-tel-Telu-Latn-1972.yaml +270 -0
  266. data/maps/un-ukr-Cyrl-Latn-1998.yaml +53 -0
  267. data/maps/un-ukr-Cyrl-Latn-2012.yaml +162 -0
  268. data/maps/un-urd-Arab-Latn-1972.yaml +405 -0
  269. data/maps/var-amh-Ethi-Latn-eae-2003.yaml +466 -0
  270. data/maps/var-gez-Ethi-Latn-eae-2003.yaml +76 -0
  271. data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +221 -0
  272. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +1 -1
  273. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +1 -1
  274. data/maps/{nil-kor-Hang-Hang-jamo.yaml → var-kor-Hang-Hang-jamo.yaml} +4 -4
  275. data/maps/var-kor-Hang-Latn-mr-1939.yaml +4 -4
  276. data/maps/var-kor-Kore-Hang-2013.yaml +2 -2
  277. data/maps/var-kor-Kore-Latn-mr-1939.yaml +2 -3
  278. data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +43 -0
  279. data/maps/var-mon-Mong-Latn-1930.yaml +102 -0
  280. data/maps/var-mon-Mong-Latn-lessing.yaml +272 -0
  281. data/maps/var-mon-Mong-Latn-vpmc.yaml +274 -0
  282. data/maps/var-pra-Deva-Latn-iast-1912.yaml +30 -0
  283. data/maps/var-san-Deva-Latn-iast-1912.yaml +149 -0
  284. data/maps/var-tha-Thai-Thai-phonemic.yaml +6 -6
  285. data/maps/var-tha-Thai-Zsym-ipa.yaml +13 -13
  286. data/maps/{var-zho-Hani-Latn-1979.yaml → var-zho-Hani-Latn-wd-1979.yaml} +13 -9
  287. data/spec/interscript/filenames_spec.rb +21 -0
  288. data/spec/interscript_spec.rb +16 -5
  289. metadata +275 -27
  290. data/bin/interscript +0 -41
  291. data/bin/rspec +0 -29
  292. data/bin/setup +0 -8
  293. data/maps/un-mon-Mong-Latn-2013.yaml +0 -93
  294. data/maps/un-ukr-cyrl-latn-1998.yaml +0 -30
@@ -0,0 +1,354 @@
1
+ ---
2
+ authority_id: sasm
3
+ id: phonetic-1978
4
+ language: iso-639-2:mon
5
+ source_script: Mong
6
+ destination_script: Latn
7
+ name: Transliteration of Place Names in Minority Languages in Chinese Pinyin (Mongolian, phonetic)
8
+ url: http://www.moe.gov.cn/ewebeditor/uploadfile/2015/01/12/20150112161436994.pdf
9
+ creation_date: 1976-06
10
+ description: |
11
+ Article 1
12
+
13
+ The main purpose of the transliteration method of Chinese pinyin
14
+ letter transliteration of place names in minority languages:
15
+
16
+ (1) As a standard for spelling place names in minority languages
17
+ with Chinese phonetic alphabet;
18
+ (2) As a phonetic tool for surveying and recording ethnic place
19
+ names in map surveying and mapping work;
20
+ (3) As the main basis for the pronunciation and selection of place
21
+ names in ethnic minority languages in Chinese character
22
+ transliteration;
23
+ (4) Provide convenient conditions for the unified compilation of our
24
+ country's place-name information and index in alphabetical order.
25
+
26
+ Article 2
27
+
28
+ The transliteration method is limited to the 26 letters in the
29
+ "Hanyu Pinyin Plan", two letters with additional symbols and a
30
+ syllable-dividing mark. In order to make transcription and phonetic
31
+ recording more accurate, syllable structure need not be restricted by the
32
+ syllable form of Mandarin Chinese. Syllable-dividing marks can be used
33
+ in various occasions that are easy to be confused. When recording,
34
+ additional symbols can be added to specific letters to represent
35
+ special sounds.
36
+
37
+ The transliteration and transliteration of ethnic minority scripts
38
+ in Latin script shall be based on the script. Letters with the same
39
+ or similar pronunciation and usage as in the "Hanyu Pinyin Plan"
40
+ shall be written according to them; different or dissimilar letters
41
+ shall be transcribed separately. If the script does not use Latin
42
+ letters, the corresponding Chinese phonetic letters shall be used
43
+ according to the pronunciation of the script. If there is no script,
44
+ general phonetic notation shall be used.
45
+
46
+ Article 3
47
+
48
+ Special place names are handled with reference to the following
49
+ methods:
50
+
51
+ (1) If the commonly used Chinese name is partly transliterated and
52
+ partly translated, the transliteration part is spelled according to
53
+ the transliteration method, and the free translation part is
54
+ spelled according to the pronunciation of the Chinese character.
55
+
56
+ (2) If the commonly used Chinese character translation is a section
57
+ translation, the actual situation may be considered. Some are
58
+ transliterated according to the full name of the original name, and
59
+ some are spelled according to the Hanyu pronunciation of the
60
+ section translation.
61
+
62
+ (3) If the translated name of a Chinese character originally came
63
+ from a minority language, but later became a Chinese form and has
64
+ been commonly used, it can be spelled according to the
65
+ pronunciation of the Chinese characters, with the transliterated
66
+ original name added in parentheses if necessary.
67
+
68
+ (4) Other special circumstances shall be dealt with according to
69
+ specific discretion.
70
+
71
+ original_description: |
72
+ 第一条
73
+
74
+ 少数民族语地名汉语拼音字母音译转写法的主要用途:
75
+
76
+ (1) 作为用汉语拼音字母拼写少数民族语地名的标准;
77
+ (2)作为地图测绘工作中调査记录少数民族语地名的记音工具;
78
+ (3) 作为汉字音译少数民族语地名定音和选字的主要依据;
79
+ (4)为按照字母顺序统一编排我国地名资料和索引提供便利条件。
80
+
81
+ 第二条
82
+
83
+ 音译转写法限用《汉语拼音方案》中的26个字母,两个有附加符号的字母和一
84
+ 个隔音符号,为了使转写和记音比较准确,音节结构可以不受汉语普通话音节
85
+ 形式的限制,隔音符号可以在各种
86
+ 容易混淆的场合应用,记音的时候附加符号可以加在特定的字母上面代表特殊
87
+ 语音。
88
+
89
+
90
+ 少数民族文字用拉丁字母的,音译转写以其文字为依据。跟《汉语拼音方案》
91
+ 中读音和用法相同或相近的字母,一律照写;不同或不相近的字母分别规定转
92
+ 写方式,文字不用拉丁字母的,根据文字的读音采用相应的汉语拼音字母表示
93
+ 。没有文字的,根据通用语音标记。
94
+
95
+ 第三条
96
+
97
+ 特殊的地名参照下列办法处理:
98
+
99
+
100
+ (1)惯用的汉字译名如果是一部分音译,一部分意译,其音译部分根据音译转
101
+ 写法拼写,意译部分按照汉字读音拼写。
102
+
103
+
104
+ (2)惯用的汉字译名如果是节译,可以斟酌具体情况,有的按照原名全称音
105
+ 译转写,有的按照节译的汉字读音拼写。
106
+
107
+ (3) 汉字译名如果原先来自少数民族语,后来变成汉语形式并且已经通用,可以按
108
+ 照汉字读音拼写,必要时括注音译转写的原名。
109
+
110
+ (4) 其他特殊情况具体斟酌处理。
111
+
112
+ notes:
113
+ - The transliteration of Mongolian place names is based on the
114
+ customary pronunciation combining written and spoken languages.
115
+ - Mongolian vowel length is generally not distinguished in ordinary
116
+ spelling. In phonetic recording of place names, long vowels are
117
+ represented by double letters.
118
+ - Where the transliteration lists a plain Pinyin letter alongside a
119
+ letter with an added diacritic, ordinary spelling uses the plain
120
+ letter, and phonetic recording of place names uses the letter with
121
+ the diacritic.
122
+
123
+ original_notes:
124
+ (1) 蒙古语地名的音译转写,以书面语和口语通用相结合的习惯读法为依据。
125
+ (2) 蒙古语元音的长短,一般拼写不分,地名记音中长元音用双字母表示。
126
+ (3) 音译转写的汉语拼音字母有无符和加符并列的,一般拼写用无符字母,地名记音用加符字母。
127
+
128
+ implementation_notes:
129
+ - A separated final form of vowels a or e is common, and can appear at the end
130
+ of a word, word stem, or suffix. This form requires a final-shaped preceding
131
+ consonant and an inter-word gap in between. The vowels themselves appear as ᠎ᠠ,
132
+ and with consonants as ‍ᠬ᠎ᠠ q‑a, ‍ᠷ᠎ᠠ r‑a/r‑e, etc. This gap can be transliterated
133
+ with a hyphen. In digital typesetting, these forms are triggered by inserting
134
+ a U+180E ᠎ MONGOLIAN VOWEL SEPARATOR (HTML &#6158; · MVS) between the consonant
135
+ and vowel.
136
+ - All case suffixes, as well as any plural suffixes consisting of one or two
137
+ syllables are likewise separated by a preceding and hyphen-transliterated gap.
138
+ In digital typesetting, this gap is represented by a U+202F   NARROW NO-BREAK SPACE
139
+ (HTML &#8239; · NNBSP). A maximum of two case suffixes can be added to a stem.
140
+ Single-letter vowel suffixes appear with the final-shaped forms of a/e, i, or u/ü,
141
+ as in ᠭᠠᠵᠠᠷ ᠠ γaǰar‑a 'to the country' and ᠡᠳᠦᠷ ᠡ edür‑e 'on the day', or ᠤᠯᠤᠰ ᠢ ulus‑i
142
+ 'the state' etc. Multi-letter suffixes most often start with an initial- (consonants),
143
+ medial- (vowels), or variant-shaped form.
144
+
145
+ tests:
146
+ - source: ᠣᠷᠳᠣᠰ ᠬᠣᠲᠠ # Ордос хот
147
+ expected: ôrdôs hôta
148
+ - source: ᠪᠠᠶᠠᠨᠨᠠᠭᠤᠷ ᠬᠣᠲᠠ # Баяннуур хот
149
+ expected: bayannagûr hôta
150
+ - source: ᠤᠯᠠᠭᠠᠨᠬᠣᠲᠠ # Улаан хот
151
+ expected: ûlaganhôta
152
+ - source: ᠬᠣᠣᠯᠢᠠ ᠭᠣᠤᠯ ᠬᠣᠲᠠ # Хоолингол хот
153
+ expected: hôôlia gôûl hôta
154
+ - source: ᠡᠷᠢᠶᠡᠨ ᠬᠣᠲᠠ # Эрээн хот
155
+ expected: eriyen hôta
156
+ - source: ᠷᠠᠰᠢᠶᠠᠨ ᠬᠣᠲᠠ # Рашаан хот
157
+ expected: rasiyan hôta
158
+ - source: ᠪᠠᠭᠠᠷᠢᠨ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # Баарин баруун хошуу
159
+ expected: bagarin baragûn hôsigû
160
+ - source: ᠪᠠᠭᠠᠷᠢᠨ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # Баарин зүүн хошуу
161
+ expected: bagarin jegun hôsigû
162
+ - source: ᠲᠦᠩᠯᠢᠶᠣᠤ ᠬᠣᠲᠠ # Байшинт хот
163
+ expected: tungliyôû hôta
164
+ - source: ᠰᠢᠯᠢ ᠶᠢᠨ ᠬᠣᠲᠠ # Шилийн хот
165
+ expected: sili-yin hôta
166
+ - source: ᠬᠣᠷᠢᠨ ᠭᠡᠷ ᠰᠢᠶᠠᠨ # Horinger County
167
+ expected: hôrin ger siyan
168
+ - source: ᠤᠳᠠ ᠲᠣᠭᠣᠷᠢᠭ # Уда тойрог
169
+ expected: ûda tôgôrig
170
+ - source: ᠦᠬᠠᠢ ᠬᠣᠲᠠ # Үхай хот
171
+ expected: uhai hôta
172
+ - source: ᠬᠠᠶᠢᠨᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Hainan District
173
+ expected: hayinan tôgôrig
174
+ - source: ᠬᠠᠶᠢᠷᠤᠪ ᠤᠨ ᠲᠣᠬᠣᠢ ᠲᠣᠭᠣᠷᠢᠭ # Haibowan District
175
+ expected: hayirûb-ûn tôhôi tôgôrig
176
+ - source: ᠤᠯᠠᠭᠠᠨᠴᠠᠪ ᠬᠣᠲᠠ # Улаанцав хот
177
+ expected: ûlaganqab hôta
178
+ - source: ᠵᠢᠨᠢᠩ ᠲᠣᠭᠣᠷᠢᠭ # Жинин тойрог
179
+ expected: jining tôgôrig
180
+ - source: ᠹᠸᠩᠵᠸᠡ ᠬᠣᠲᠠ # Фенжень хот
181
+ expected: fwngjwe hôta
182
+ - source: ᠵᠦᠸᠧᠽᠢ ᠰᠢᠶᠠᠨ # Zhuozi County
183
+ expected: juwezi siyan
184
+ - source: ᠬᠤᠸᠠᠳᠧ ᠰᠢᠶᠠᠨ # Huade County
185
+ expected: hûwade siyan
186
+ - source: ᠱᠠᠩᠳᠤ ᠰᠢᠶᠠᠨ # Шанду шянь
187
+ expected: xangdû siyan
188
+ - source: ᠰᠢᠩᠾᠧ ᠰᠢᠶᠠᠨ # Шинхэ шянь
189
+ expected: singhe siyan
190
+ - source: ᠯᠢᠶᠠᠩᠴᠠᠩ ᠰᠢᠶᠠᠨ # Liangcheng County
191
+ expected: liyangqang siyan
192
+ - source: ᠴᠠᠬᠠᠷ ᠪᠠᠷᠠᠭᠤᠨ ᠭᠠᠷᠤᠨ ᠡᠮᠦᠨᠡᠳᠦ ᠬᠣᠰᠢᠭᠤ # Цахар баруун гарын өмнөд хошуу
193
+ expected: qahar baragûn garûn emunedu hôsigû
194
+ - source: ᠴᠠᠬᠠᠷ ᠪᠠᠷᠠᠭᠤᠨ ᠭᠠᠷᠤᠨ ᠳᠤᠮᠳᠠᠳᠤ ᠬᠣᠰᠢᠭᠤ # Цахар баруун гарын дундад хошуу
195
+ expected: qahar baragûn garûn dûmdadû hôsigû
196
+ - source: ᠴᠠᠬᠠᠷ ᠪᠠᠷᠠᠭᠤᠨ ᠭᠠᠷᠤᠨ ᠬᠣᠶᠢᠲᠤ ᠬᠣᠰᠢᠭᠤ # Цахар баруун гарын хойд хошуу
197
+ expected: qahar baragûn garûn hôyitû hôsigû
198
+ - source: ᠳᠥᠷᠪᠡᠳ ᠬᠣᠰᠢᠭᠤ # Дөрвөд хошуу
199
+ expected: dorbed hôsigû
200
+ - source: ᠪᠤᠭᠤᠲᠤ ᠬᠣᠲᠠ # Бугaт хот
201
+ expected: bûgûtû hôta
202
+ - source: ᠬᠥᠨᠳᠡᠯᠡᠨ ᠲᠣᠭᠣᠷᠢᠭ # Hondlon District
203
+ expected: hondelen tôgôrig
204
+ - source: ᠳᠦᠩᠾᠧ ᠲᠣᠭᠣᠷᠢᠭ # Donghe District
205
+ expected: dunghe tôgôrig
206
+ - source: ᠴᠢᠩᠱᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Qingshan District
207
+ expected: qingxan tôgôrig
208
+ - source: ᠰᠢᠭᠤᠶᠢᠲᠤ ᠲᠣᠭᠣᠷᠢᠭ # Шигуай тойрог
209
+ expected: sigûyitû tôgôrig
210
+ - source: ᠵᠢᠦ ᠶᠤᠸᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Jiuyuan District
211
+ expected: jiu yûwan tôgôrig
212
+ - source: ᠭᠦᠶᠠᠩ ᠰᠢᠶᠠᠨ # Guyang County
213
+ expected: guyang siyan
214
+ - source: ᠲᠦᠮᠡᠳ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # Түмэд Зүүн хошуу
215
+ expected: tumed jegun hôsigû
216
+ - source: ᠲᠦᠮᠡᠳ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # Түмэд Баруун хошуу
217
+ expected: tumed baragûn hôsigû
218
+ - source: ᠳᠠᠷᠬᠠᠨ ᠮᠤᠤᠮᠢᠩᠭ᠋ᠠᠨ ᠬᠣᠯᠪᠣᠭᠠᠲᠤ ᠬᠣᠰᠢᠭᠤ # Darhan Muminggan United Banner
219
+ expected: darhan mûûmingg᠋an hôlbôgatû hôsigû
220
+ - source: ᠬᠡᠰᠢᠭᠲᠡᠨ ᠬᠣᠰᠢᠭᠤ # Hexigten Banner
221
+ expected: hesigten hôsigû
222
+ - source: ᠰᠢᠨ᠎ᠡ ᠪᠠᠷᠭᠤ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # New Barag Left Banner
223
+ expected: sin-e bargû jegun hôsigû
224
+ - source: ᠰᠢᠨ᠎ᠡ ᠪᠠᠷᠭᠤ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # New Barag Right Banner
225
+ expected: sin-e bargû baragûn hôsigû
226
+ - source: ᠣᠲᠣᠭ ᠬᠣᠰᠢᠭᠤ # Otog Banner
227
+ expected: ôtôg hôsigû
228
+ - source: ᠳ᠋ᠦᠩᠱᠧᠩ ᠲᠣᠭᠣᠷᠢᠭ # Dongsheng District
229
+ expected: d᠋ungxeng tôgôrig
230
+ - source: ᠳᠠᠯᠠᠳ ᠬᠣᠰᠢᠭᠤ # Dalad Banner
231
+ expected: dalad hôsigû
232
+ - source: ᠵᠡᠭᠦᠨᠭᠠᠷ ᠬᠣᠰᠢᠭᠤ # Jungar Banner
233
+ expected: jegungar hôsigû
234
+ - source: ᠣᠲᠣᠭ ᠤᠨ ᠡᠮᠦᠨᠡᠳᠦ ᠬᠣᠰᠢᠭᠤ # Otog Front Banner
235
+ expected: ôtôg-ûn emunedu hôsigû
236
+ - source: ᠬᠠᠩᠭᠢᠨ ᠬᠣᠰᠢᠭᠤ # Hanggin Banner
237
+ expected: hanggin hôsigû
238
+ - source: ᠦᠦᠰᠢᠨ ᠬᠣᠰᠢᠭᠤ # Uxin Banner
239
+ expected: uusin hôsigû
240
+ - source: ᠡᠵᠢᠨ ᠬᠣᠷᠣᠭ᠎ᠠ ᠬᠣᠰᠢᠭᠤ # Эзэн Хороо хошуу
241
+ expected: ejin hôrôg-a hôsigû
242
+ - source: ᠵᠠᠯᠠᠨ ᠠᠢ᠌ᠯ ᠬᠣᠲᠠ # Жалан-Айл хот
243
+ expected: jalan ai᠌l hôta
244
+ - source: ᠶᠠᠭᠰᠢ ᠬᠣᠲᠠ # Ягши хот
245
+ expected: yagsi hôta
246
+ - source: ᠮᠠᠨᠵᠤᠤᠷ ᠬᠣᠲᠠ # Манжуур хот
247
+ expected: manjûûr hôta
248
+ - source: ᠬᠠᠶᠢᠯᠠᠷ ᠲᠣᠭᠣᠷᠢᠭ # Хайлаар тойрог
249
+ expected: hayilar tôgôrig
250
+ - source: ᠬᠣᠷᠴᠢᠨ ᠲᠣᠭᠣᠷᠢᠭ # Horqin District
251
+ expected: hôrqin tôgôrig
252
+ - source: ᠺᠠᠶᠢᠯᠦ ᠰᠢᠶᠠᠨ # Kailu County
253
+ expected: kayilu siyan
254
+ - source: ᠬᠦᠷᠢᠶ᠎ᠡ ᠬᠣᠰᠢᠭᠤ # Hure Banner
255
+ expected: huriy-e hôsigû
256
+ - source: ᠨᠠᠢᠮᠠᠨ ᠬᠣᠰᠢᠭᠤ # Naiman Banner
257
+ expected: naiman hôsigû
258
+ - source: ᠵᠠᠷᠤᠳ ᠬᠣᠰᠢᠭᠤ # Jarud Banner
259
+ expected: jarûd hôsigû
260
+ - source: ᠬᠣᠷᠴᠢᠨ ᠪᠠᠷᠠᠭᠤᠨ ᠭᠠᠷᠤᠨ ᠳᠤᠮᠳᠠᠳᠤ ᠬᠣᠰᠢᠭᠤ # Хорчин Баруун Гарын Дундад Хошуу
261
+ expected: hôrqin baragûn garûn dûmdadû hôsigû
262
+ - source: ᠬᠣᠷᠴᠢᠨ ᠵᠡᠭᠦᠨ ᠭᠠᠷᠤᠨ ᠳᠤᠮᠳᠠᠳᠤ ᠬᠣᠰᠢᠭᠤ # Horqin Left Middle Banner
263
+ expected: hôrqin jegun garûn dûmdadû hôsigû
264
+ - source: ᠬᠣᠷᠴᠢᠨ ᠵᠡᠭᠦᠨ ᠭᠠᠷᠤᠨ ᠬᠣᠶᠢᠲᠤ ᠬᠣᠰᠢᠭᠤ # Horqin Left Rear Banner
265
+ expected: hôrqin jegun garûn hôyitû hôsigû
266
+ - source: ᠤᠯᠠᠭᠠᠨᠬᠠᠳᠠ ᠬᠣᠲᠠ # Улаанхад хот
267
+ expected: ûlaganhada hôta
268
+ - source: ᠰᠡᠷᠡᠴᠢ # Salaqi
269
+ expected: sereqi
270
+ - source: ᠭᠡᠭᠡᠨ ᠭᠣᠤᠯ ᠬᠣᠲᠠ # Гэгээнгол хот
271
+ expected: gegen gôûl hôta
272
+ - source: ᠠᠯᠠᠱᠠ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # Alxa Left Banner
273
+ expected: alaxa jegun hôsigû
274
+ - source: ᠠᠯᠠᠱᠠ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # Alxa Right Banner
275
+ expected: alaxa baragûn hôsigû
276
+ - source: ᠡᠵᠡᠨ᠎ᠡ ᠬᠣᠰᠢᠭᠤ # Ejin Banner
277
+ expected: ejen-e hôsigû
278
+ - source: ᠬᠥᠪᠡᠭᠡᠲᠦ ᠰᠢᠷ᠎ᠠ ᠬᠣᠰᠢᠭᠤ # Хөвөөт Шар хошуу
279
+ expected: hobegetu sir-a hôsigû
280
+ - source: ᠦᠶᠤᠸᠠᠨ ᠰᠢᠶᠠᠨ # Үюань шянь
281
+ expected: uyûwan siyan
282
+ - source: ᠦᠴᠤᠸᠠᠨ ᠰᠢᠶᠠᠨ # Wuchuan County
283
+ expected: uqûwan siyan
284
+ - source: ᠲᠦᠴᠢᠤᠸᠠᠨ ᠰᠢᠶᠠᠨ # Тучуань шянь
285
+ expected: tuqiûwan siyan
286
+ - source: ᠨᠢᠩᠴᠧᠩ ᠰᠢᠶᠠᠨ # Ningcheng County
287
+ expected: ningqeng siyan
288
+ - source: ᠯᠢᠨᠰᠢ ᠰᠢᠶᠠᠨ # Linxi County
289
+ expected: linsi siyan
290
+ - source: ᠯᠢᠨᠾᠧ ᠲᠣᠭᠣᠷᠢᠭ # Linhe
291
+ expected: linhe tôgôrig
292
+ - source: ᠬᠠᠷᠠᠴᠢᠨ ᠬᠣᠰᠢᠭᠤ # Harqin Banner
293
+ expected: haraqin hôsigû
294
+ - source: ᠳ᠋ᠧᠩᠺᠧᠦ ᠰᠢᠶᠠᠨ # Dengkou County
295
+ expected: d᠋engkeu siyan
296
+ - source: ᠠᠤᠬᠠᠨ ᠬᠣᠰᠢᠭᠤ # Aohan Banner
297
+ expected: aûhan hôsigû
298
+ - source: ᠴᠢᠩ ᠱᠦᠢ ᠾᠧ ᠰᠢᠶᠠᠨ # Qingshuihe County
299
+ expected: qing xui he siyan
300
+ - source: ᠬᠣᠳᠣᠩ ᠠᠷᠠᠳ ᠤᠨ ᠲᠣᠭᠣᠷᠢᠭ # Huimin District
301
+ expected: hôdông arad-ûn tôgôrig
302
+ - source: ᠰᠠᠶᠢᠬᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Saihan District
303
+ expected: sayihan tôgôrig
304
+ - source: ᠰᠢᠨ᠎ᠡ ᠬᠣᠲᠠ ᠲᠣᠭᠣᠷᠢᠭ # Xincheng District
305
+ expected: sin-e hôta tôgôrig
306
+ - source: ᠬᠠᠶᠢᠷᠤᠪ ᠤᠨ ᠲᠣᠬᠣᠢ ᠲᠣᠭᠣᠷᠢᠭ # Haibowan (Hairibin Tohoi) District
307
+ expected: hayirûb-ûn tôhôi tôgôrig
308
+ - source: ᠰᠦᠩ ᠱᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Songshan District
309
+ expected: sung xan tôgôrig
310
+ - source: ᠬᠦᠩ ᠱᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Hongshan District
311
+ expected: hung xan tôgôrig
312
+ - source: ᠠᠷᠤᠨ ᠬᠣᠰᠢᠭᠤ # Арун хошуу
313
+ expected: arûn hôsigû
314
+ - source: ᠶᠤᠸᠠᠨ ᠪᠣᠣ ᠱᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Юаньбаошань тойрог
315
+ expected: yûwan bôô xan tôgôrig
316
+ - source: ᠰᠢᠯᠤᠭᠤᠨ ᠬᠥᠪᠡᠭᠡᠲᠦ ᠴᠠᠭᠠᠨ ᠬᠣᠰᠢᠭᠤ # Шулуун Хөвөөт Цагаан хошуу
317
+ expected: silûgûn hobegetu qagan hôsigû
318
+ - source: ᠰᠢᠯᠤᠭᠤᠨ ᠬᠥᠬᠡ ᠬᠣᠰᠢᠭᠤ # Шулуун хөх хошуу
319
+ expected: silûgûn hohe hôsigû
320
+ - source: ᠤᠷᠠᠳ ᠤᠨ ᠳᠤᠮᠳᠠᠳᠤ ᠬᠣᠰᠢᠭᠤ # Урадын Дундад Хошуу
321
+ expected: ûrad-ûn dûmdadû hôsigû
322
+ - source: ᠤᠷᠠᠳ ᠤᠨ ᠡᠮᠦᠨᠡᠳᠦ ᠬᠣᠰᠢᠭᠤ # Урадын Өмнөд Хошуу
323
+ expected: ûrad-ûn emunedu hôsigû
324
+ - source: ᠲᠣᠭᠲᠠᠬᠤ ᠰᠢᠶᠠᠨ # Тогтох шянь
325
+ expected: tôgtahû siyan
326
+ - source: ᠲᠠᠶᠢᠫᠤᠰᠧ ᠬᠣᠰᠢᠭᠤ # Тайвас хошуу
327
+ expected: tayipûse hôsigû
328
+ - source: ᠰᠥᠨᠡᠳ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # Sonid Left Banner
329
+ expected: soned jegun hôsigû
330
+ - source: ᠰᠥᠨᠡᠳ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # Sonid Right Banner
331
+ expected: soned baragûn hôsigû
332
+ - source: ᠣᠩᠨᠢᠭᠤᠳ ᠬᠣᠰᠢᠭᠤ # Ongniud Banner
333
+ expected: ôngnigûd hôsigû
334
+ - source: ᠵᠠᠯᠠᠢᠳ ᠬᠣᠰᠢᠭᠤ # Jalaid Banner
335
+ expected: jalaid hôsigû
336
+ - source: ᠬᠠᠩᠭᠢᠨ ᠬᠣᠶᠢᠲᠤ ᠬᠣᠰᠢᠭᠤ # Hanggin Rear Banner
337
+ expected: hanggin hôyitû hôsigû
338
+ - source: ᠵᠡᠭᠦᠨ ᠤᠵᠤᠮᠤᠴᠢᠨ ᠬᠣᠰᠢᠭᠤ # East Ujimqin Banner
339
+ expected: jegun ûjûmûqin hôsigû
340
+ - source: ᠠᠷᠤ ᠬᠣᠷᠴᠢᠨ ᠬᠣᠰᠢᠭᠤ # Ar Horqin Banner
341
+ expected: arû hôrqin hôsigû
342
+ - source: ᠠᠪᠠᠭ᠎ᠠ ᠬᠣᠰᠢᠭᠤ # Abag Banner
343
+ expected: abag-a hôsigû
344
+ - source: ᠪᠤᠷᠢᠶᠠᠳ # Буриад
345
+ expected: bûriyad
346
+ - source: ᠤᠯᠠᠭᠠᠨᠪᠠᠭᠠᠲᠤᠷ # Улаанбаатар
347
+ expected: ûlaganbagatûr
348
+
349
+ map:
350
+ inherit: sasm-mon-Mong-Latn-general-1978
351
+
352
+ characters:
353
+ "ᠣ": "ô" # For place names
354
+ "ᠤ": "û" # For place names
@@ -0,0 +1,283 @@
1
+ ---
2
+ authority_id: ungegn
3
+ id: 1930
4
+ language: iso-639-2:ara
5
+ source_script: Arab
6
+ destination_script: Latn
7
+ alias:
8
+ ogc11122:
9
+ code: ara_Arab2Latn_SES_1930
10
+ description: Arabic Survey of Egypt System
11
+ name: ROMANIZATION OF ARABIC -- UNGEGN 2017 System
12
+ url: http://www.eki.ee/wgrs/rom1_ar.pdf
13
+ creation_date: 1930
14
+ confirmation date: 2018-06
15
+ description: |
16
+ The current United Nations recommended romanization
17
+ system was approved in 2017 (resolution XI/3), based on
18
+ the system adopted by Arabic experts at the conference
19
+ held in Beirut in 2007, the Unified Arabic
20
+ Transliteration System, taking into account the
21
+ practical amendments and corrections carried out and
22
+ agreed upon by the representatives of the Arabic-
23
+ speaking countries at the Fourth Arab Conference on
24
+ Geographical Names, held in Beirut in 2008, and some
25
+ clarifications and amendments agreed in Riyadh in 2017.
26
+ Previously, the United Nations had approved a
27
+ romanization system in 1972 (resolution II/8), based on the
28
+ system adopted by Arabic experts at the conference
29
+ held at Beirut in 1971 with the practical amendments carried out
30
+ and agreed upon by the representatives of the Arabic-speaking
31
+ countries at their conference. The table was published in volume
32
+ II of the conference report.
33
+ In UN resolution XI/3 it is specifically stated that the
34
+ system was recommended for the “romanization of the
35
+ geographical names within those Arabic-speaking countries
36
+ where this system is officially adopted”. There is
37
+ evidence of its partial implementation in Jordan, Oman and
38
+ Saudi Arabia. The UNGEGN Working Group on Romanization
39
+ Systems intends to continue monitoring the UN system’s
40
+ implementation across Arabic-speaking countries.
41
+ In some countries there exist local romanization schemes
42
+ or practices. The geographical names of Algeria, Djibouti,
43
+ Mauritania, Morocco and Tunisia are generally rendered in
44
+ the traditional manner which conforms to the principles of
45
+ the French orthography.
46
+ The previous UN-approved system is still found in
47
+ considerable international usage.
48
+ Arabic is written from right to left. The Arabic script
49
+ usually omits vowel points and diacritical marks from
50
+ writing which makes it difficult to obtain uniform results
51
+ in the romanization of Arabic. It is essential to identify
52
+ correctly the words which appear in any particular name
53
+ and to know the standard Arabic-script spelling including
54
+ the relevant vowels. One must also take into account
55
+ dialectal and idiosyncratic deviations. The romanization
56
+ is generally reversible though there may be some ambiguous
57
+ letter sequences (dh, kh, sh, th) which may also point to
58
+ combinations of Arabic characters in addition to the
59
+ respective single characters.
60
+ notes:
61
+ - |
62
+ The Survey of Egypt System (SES) of romanization has the following correspondences with
63
+ the UN system:
64
+ á = a # ـَى fatha followed by ى which is ا not ي
65
+ ā = â (a) # ـَا fatha followed by alef // آ
66
+ -ah (ة-) = a # ة ta' marboota at the end of a sentence
67
+ aw = ô (au) # ـَوْ
68
+ ay = ei (ai) # ـَيْ
69
+ ḏ = ḍ # ض
70
+ dh = dh (z) # ذ
71
+ d͟h = ẓ (d) # ظ
72
+ ẖ = ḥ # ح
73
+ ī = î
74
+ j = g (j)
75
+ q = q (k)
76
+ s = s (c)
77
+ s̱ = ṣ
78
+ ṯ = ṭ
79
+ th = th (t)
80
+ ū = û
81
+ ‘ = ‛
82
+ - |
83
+ The variants in parentheses are used depending on pronunciation and tradition. Not all the
84
+ variations have been given above. The article is always written el- (El-Kafr el-Qadîm, Sharm
85
+ el-Sheikh).
86
+ tests:
87
+
88
+ # Examples taken from:
89
+ # https://unstats.un.org/unsd/geoinfo/geonames/
90
+
91
+ - source: شَرم الشَيْخ
92
+ expected: Sharm el-Sheikh
93
+
94
+ - source: الكَفر القَدِيم
95
+ expected: El-Kafr el-Qadîm
96
+ map:
97
+ inherit: "un-ara-Arab-Latn-2017"
98
+ postrules:
99
+ - pattern : ' El-' # article preceded by a space (not phrase-initial) is lowercased
100
+ result: ' el-'
101
+
102
+ characters:
103
+
104
+
105
+ # special pointed letters
106
+ '\u0639\u064e' : '‛a' # عَ
107
+ '\u0639\u0650' : '‛i' # عِ
108
+ '\u0639\u064f' : '‛û' # عُ
109
+ # handle MacOS regex difference
110
+ '\u0639\u064f\u0648' : '‛û' # عُو damma followed by و
111
+ '\u0650\u064a' : 'î' # ـِي kasra followed by ي
112
+ '\u0650\u064a\u0651\u064e' : 'îy' # ـِيَّ
113
+ '\u064f\u0648' : 'û' # ـُو damma followed by و
114
+ '\u064e\u0627' : # ـَا fatha followed by ا
115
+ - 'â'
116
+ - 'a'
117
+ '\u064e\u0649' : 'a' # ـَى fatha followed by ى which is ا not ي
118
+ '\u064e\u0648\u0652' : # ـَوْ
119
+ - 'ô'
120
+ - 'au'
121
+ '\u064e\u064a\u0652' : # ـَيْ
122
+ - 'ei'
123
+ - 'ai'
124
+ '\u0622' : # آ
125
+ - 'â'
126
+ - 'a'
127
+
128
+ # ta' marboota in iso-233-1984 is all the same `a`
129
+ '\u0629$' : 'a'
130
+ '(?<=\b\u0627\u0644[\u0600-\u06ff]{2})\u0629' : 'a'
131
+ '(?<=\b\u0627\u0644[\u0600-\u06ff]{3})\u0629' : 'a'
132
+ '(?<=\b\u0627\u0644[\u0600-\u06ff]{4})\u0629' : 'a'
133
+ '(?<=\b\u0627\u0644[\u0600-\u06ff]{5})\u0629' : 'a'
134
+ '(?<=\b\u0627\u0644[\u0600-\u06ff]{6})\u0629' : 'a'
135
+ '(?<=\b\u0627\u0644[\u0600-\u06ff]{7})\u0629' : 'a'
136
+ '(?<=\b\u0627\u0644[\u0600-\u06ff]{8})\u0629' : 'a'
137
+ '(?<=\b\u0627\u0644[\u0600-\u06ff]{9})\u0629' : 'a'
138
+ '(?<=\b\u0627\u0644[\u0600-\u06ff]{10})\u0629' : 'a'
139
+ '(?<=\b\u0627\u0644[\u0600-\u06ff]{11})\u0629' : 'a'
140
+ '(?<=\b\u0627\u0644[\u0600-\u06ff]{12})\u0629' : 'a'
141
+ '(?<=\b\u0627\u0644[\u0600-\u06ff]{13})\u0629' : 'a'
142
+
143
+
144
+ # Sun letters
145
+ '\b\u0627\u0644\u062a' : 'el-t' # الت
146
+ '\b\u0627\u0644\u062b' : # الث
147
+ - 'el-th'
148
+ - 'el-t'
149
+ '\b\u0627\u0644\u062f' : 'el-d' # الد
150
+ '\b\u0627\u0644\u0630' : # الذ
151
+ - 'el-dh'
152
+ - 'el-z'
153
+ '\b\u0627\u0644\u0631' : 'el-r' # الر
154
+ '\b\u0627\u0644\u0632' : 'el-z' # الز
155
+ '\b\u0627\u0644\u0633' : # الس
156
+ - 'el-s'
157
+ - 'el-c'
158
+ '\b\u0627\u0644\u0634' : 'el-sh' # الش
159
+ '\b\u0627\u0644\u0635' : 'el-ṣ' # الص
160
+ '\b\u0627\u0644\u0636' : 'el-ḍ' # الض
161
+ '\b\u0627\u0644\u0637' : 'el-ṭ' # الط
162
+ '\b\u0627\u0644\u0638' : # الظ
163
+ - 'el-ẓ'
164
+ - 'el-d'
165
+ '\b\u0627\u0644\u0644' : 'el-l' # الل
166
+ '\b\u0627\u0644\u0646' : 'el-n' # الن
167
+
168
+
169
+ # shadda
170
+ '\u062b\u0651' : # ث
171
+ - 'thth'
172
+ - 'tt'
173
+ '\u062c\u0651' : # ج
174
+ - 'gg'
175
+ - 'jj'
176
+ '\u062d\u0651' : 'ḥḥ' # ح
177
+ '\u062e\u0651' : 'khkh' # خ
178
+
179
+ '\u0633\u0651' : # س
180
+ - 'ss'
181
+ - 'cc'
182
+ '\u0635\u0651' : 'ṣṣ' # ص
183
+ '\u0636\u0651' : 'ḍḍ' # ض
184
+ '\u0637\u0651' : 'ṭṭ' # ط
185
+ '\u0638\u0651' : # ظ
186
+ - 'ẓẓ'
187
+ - 'dd'
188
+ '\u0642\u0651' : # ق
189
+ - 'qq'
190
+ - 'kk'
191
+
192
+ '\b\u0627\u0644' : 'el-' # ال
193
+
194
+ # normal letters
195
+ '\u062c' : # ج
196
+ - 'g'
197
+ - 'j'
198
+ '\ufe9f' : # ﺟ
199
+ - 'g'
200
+ - 'j'
201
+ '\ufea0' : # ﺠ
202
+ - 'g'
203
+ - 'j'
204
+ '\ufe9e' : # ﺞ
205
+ - 'g'
206
+ - 'j'
207
+
208
+ '\u062d' : 'ḥ' # ح
209
+ '\ufea3' : 'ḥ' # ﺣ
210
+ '\ufea4' : 'ḥ' # ﺤ
211
+ '\ufea2' : 'ḥ' # ﺢ
212
+
213
+ '\u062e' : 'kh' # خ
214
+ '\ufea7' : 'kh' # ﺧ
215
+ '\ufea8' : 'kh' # ﺨ
216
+ '\ufea6' : 'kh' # ﺦ
217
+
218
+ '\u0630' : # ذ
219
+ - 'dh'
220
+ - 'z'
221
+ '\ufeac' : # ﺬ
222
+ - 'dh'
223
+ - 'z'
224
+
225
+
226
+ '\u0633' : # س
227
+ - 's'
228
+ - 'c'
229
+ '\ufeb3' : # ﺳ
230
+ - 's'
231
+ - 'c'
232
+ '\ufeb4' : # ﺴ
233
+ - 's'
234
+ - 'c'
235
+ '\ufeb2' : # ﺲ
236
+ - 's'
237
+ - 'c'
238
+
239
+ '\u0635' : 'ṣ' # ص
240
+ '\ufebb' : 'ṣ' # ﺻ
241
+ '\ufebc' : 'ṣ' # ﺼ
242
+ '\ufeba' : 'ṣ' # ﺺ
243
+
244
+ '\u0636' : 'ḍ' # ض
245
+ '\ufebf' : 'ḍ' # ﺿ
246
+ '\ufec0' : 'ḍ' # ﻀ
247
+ '\ufebe' : 'ḍ' # ﺾ
248
+
249
+ '\u0637' : 'ṭ' # ط
250
+ '\ufec3' : 'ṭ' # ﻃ
251
+ '\ufec4' : 'ṭ' # ﻄ
252
+ '\ufec2' : 'ṭ' # ﻂ
253
+
254
+ '\u0639' : '‛' # ع
255
+ '\ufecb' : '‛' # ﻋ
256
+ '\ufecc' : '‛' # ﻌ
257
+ '\ufeca' : '‛' # ﻊ
258
+
259
+ '\u0638' : # ظ
260
+ - 'ẓ'
261
+ - 'd'
262
+ '\ufec7' : # ﻇ
263
+ - 'ẓ'
264
+ - 'd'
265
+ '\ufec8' : # ﻈ
266
+ - 'ẓ'
267
+ - 'd'
268
+ '\ufec6' : # ﻆ
269
+ - 'ẓ'
270
+ - 'd'
271
+
272
+ '\u0642' : # ق
273
+ - 'q'
274
+ - 'k'
275
+ '\ufed7' : # ﻗ
276
+ - 'q'
277
+ - 'k'
278
+ '\ufed8' : # ﻘ
279
+ - 'q'
280
+ - 'k'
281
+ '\ufed6' : # ﻖ
282
+ - 'q'
283
+ - 'k'