interscript 0.1.3 → 0.1.9

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (294) hide show
  1. checksums.yaml +4 -4
  2. data/README.adoc +10 -11
  3. data/aliases.json +1 -0
  4. data/lib/interscript.rb +62 -59
  5. data/lib/interscript/command.rb +3 -2
  6. data/lib/interscript/fs.rb +96 -0
  7. data/lib/interscript/mapping.rb +36 -17
  8. data/lib/interscript/opal.rb +196 -0
  9. data/lib/interscript/opal/entrypoint.rb +20 -0
  10. data/lib/interscript/opal/exports.rb +11 -0
  11. data/lib/interscript/opal/maps.js.erb +8 -0
  12. data/lib/interscript/version.rb +1 -1
  13. data/maps/acadsin-zho-Hani-Latn-2002.yaml +6 -2
  14. data/maps/alalc-amh-Ethi-Latn-1997.yaml +513 -0
  15. data/maps/alalc-amh-Ethi-Latn-2011.yaml +138 -0
  16. data/maps/alalc-ara-Arab-Latn-1997.yaml +1287 -0
  17. data/maps/alalc-asm-Deva-Latn-1997.yaml +259 -0
  18. data/maps/alalc-asm-Deva-Latn-2012.yaml +55 -0
  19. data/maps/alalc-aze-Arab-Latn-1997.yaml +376 -0
  20. data/maps/alalc-aze-Cyrl-Latn-1997.yaml +145 -0
  21. data/maps/{alalc-bel-cyrl-latn-1997.yaml → alalc-bel-Cyrl-Latn-1997.yaml} +7 -3
  22. data/maps/alalc-ben-Beng-Latn-1997.yaml +291 -0
  23. data/maps/alalc-ben-Beng-Latn-2017.yaml +1 -1
  24. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +5 -1
  25. data/maps/alalc-div-Thaa-Latn-1997.yaml +211 -0
  26. data/maps/alalc-ell-Grek-Latn-1997.yaml +7 -4
  27. data/maps/alalc-ell-Grek-Latn-2010.yaml +3 -5
  28. data/maps/alalc-guj-Gujr-Latn-1997.yaml +266 -0
  29. data/maps/alalc-guj-Gujr-Latn-2011.yaml +64 -0
  30. data/maps/alalc-hin-Deva-Latn-1997.yaml +303 -0
  31. data/maps/alalc-hin-Deva-Latn-2011.yaml +65 -0
  32. data/maps/alalc-kan-Kana-Latn-1997.yaml +274 -0
  33. data/maps/alalc-kan-Kana-Latn-2011.yaml +63 -0
  34. data/maps/alalc-kat-Geok-Latn-1997.yaml +2 -3
  35. data/maps/alalc-kat-Geor-Latn-1997.yaml +5 -1
  36. data/maps/alalc-kor-Hang-Latn-1997.yaml +6 -2
  37. data/maps/alalc-mal-Mlym-Latn-1997.yaml +303 -0
  38. data/maps/alalc-mal-Mlym-Latn-2012.yaml +73 -0
  39. data/maps/alalc-mar-Deva-Latn-1997.yaml +189 -0
  40. data/maps/alalc-mar-Deva-Latn-2011.yaml +45 -0
  41. data/maps/{alalc-mkd-cyrl-latn-1997.yaml → alalc-mkd-Cyrl-Latn-1997.yaml} +1 -1
  42. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +1 -1
  43. data/maps/alalc-mon-Cyrl-Latn-1997.yaml +220 -0
  44. data/maps/alalc-ori-Orya-Latn-1997.yaml +284 -0
  45. data/maps/alalc-ori-Orya-Latn-2011.yaml +67 -0
  46. data/maps/alalc-pan-Guru-Latn-1997.yaml +256 -0
  47. data/maps/alalc-pan-Guru-Latn-2011.yaml +78 -0
  48. data/maps/alalc-per-Arab-Latn-1997.yaml +375 -0
  49. data/maps/alalc-pli-Deva-Latn-2012.yaml +144 -0
  50. data/maps/alalc-pra-Deva-Latn-2012.yaml +47 -0
  51. data/maps/alalc-rus-Cyrl-Latn-1997.yaml +225 -0
  52. data/maps/alalc-rus-Cyrl-Latn-2012.yaml +162 -0
  53. data/maps/alalc-san-Deva-Latn-2012.yaml +241 -0
  54. data/maps/alalc-sin-Sinh-Latn-1997.yaml +292 -0
  55. data/maps/alalc-sin-Sinh-Latn-2011.yaml +71 -0
  56. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +5 -1
  57. data/maps/{alalc-srp-cyrl-latn-2013.yaml → alalc-srp-Cyrl-Latn-2013.yaml} +1 -1
  58. data/maps/alalc-tam-Taml-Latn-1997.yaml +62 -0
  59. data/maps/alalc-tam-Taml-Latn-2011.yaml +58 -0
  60. data/maps/alalc-tel-Telu-Latn-1997.yaml +284 -0
  61. data/maps/alalc-tel-Telu-Latn-2011.yaml +64 -0
  62. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +5 -1
  63. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +1 -1
  64. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +1 -1
  65. data/maps/az-aze-Cyrl-Latn-1939.yaml +105 -0
  66. data/maps/az-aze-Cyrl-Latn-1958.yaml +45 -0
  67. data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +1 -2
  68. data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +1 -1
  69. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +1 -3
  70. data/maps/bgn-kor-Hang-Latn-1943.yaml +8 -4
  71. data/maps/bgn-kor-Kore-Latn-1943.yaml +4 -4
  72. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +1 -1
  73. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +1 -1
  74. data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +532 -0
  75. data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +598 -0
  76. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +1 -1
  77. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +111 -104
  78. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +188 -0
  79. data/maps/bgnpcgn-bal-Arab-Latn-2008.yaml +329 -0
  80. data/maps/{bgnpcgn-bel-cyrl-latn-1979.yaml → bgnpcgn-bel-Cyrl-Latn-1979.yaml} +5 -1
  81. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +14 -10
  82. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +5 -1
  83. data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +184 -0
  84. data/maps/bgnpcgn-div-Thaa-Latn-1988.yaml +75 -0
  85. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +8 -5
  86. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +5 -2
  87. data/maps/bgnpcgn-far-Latn-Latn-1964.yaml +28 -0
  88. data/maps/{bgnpcgn-per-Arab-Latn-1956.yaml → bgnpcgn-fas-Arab-Latn-1956.yaml} +5 -2
  89. data/maps/bgnpcgn-isl-Latn-Latn-1964.yaml +37 -0
  90. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +1 -1
  91. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +5 -1
  92. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +1 -2
  93. data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.yaml +247 -0
  94. data/maps/bgnpcgn-kir-Cyrl-Latn-1979.yaml +218 -0
  95. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +18 -18
  96. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +3 -3
  97. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +3 -3
  98. data/maps/bgnpcgn-kur-Arab-Latn-2007.yaml +249 -0
  99. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +5 -1
  100. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +2 -2
  101. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +223 -0
  102. data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +230 -0
  103. data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +338 -0
  104. data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +673 -0
  105. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +459 -0
  106. data/maps/bgnpcgn-pus-Arab-Latn-1968.yaml +377 -0
  107. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +168 -0
  108. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +5 -1
  109. data/maps/bgnpcgn-srp-Cyrl-Latn-1962.yaml +73 -0
  110. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +5 -1
  111. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +220 -0
  112. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +240 -0
  113. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +5 -2
  114. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +3 -92
  115. data/maps/bgnpcgn-urd-Arab-Latn-2007.yaml +459 -0
  116. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +127 -0
  117. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +82 -0
  118. data/maps/{bgnpcgn-chn-Hans-Latn-1979.yaml → bgnpcgn-zho-Hans-Latn-1979.yaml} +1 -1
  119. data/maps/bis-asm-Beng-Latn-13194-1991.yaml +159 -0
  120. data/maps/bis-ben-Beng-Latn-13194-1991.yaml +156 -0
  121. data/maps/bis-dev-Deva-Latn-13194-1991.yaml +184 -0
  122. data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +181 -0
  123. data/maps/bis-kan-Kana-Latn-13194-1991.yaml +173 -0
  124. data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +176 -0
  125. data/maps/bis-ori-Orya-Latn-13194-1991.yaml +175 -0
  126. data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +175 -0
  127. data/maps/bis-tel-Telu-Latn-13194-1991.yaml +170 -0
  128. data/maps/bis-tml-Taml-Latn-13194-1991.yaml +155 -0
  129. data/maps/by-bel-Cyrl-Latn-1998.yaml +9 -5
  130. data/maps/by-bel-Cyrl-Latn-2007.yaml +4 -4
  131. data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +899 -0
  132. data/maps/din-hin-Deva-Latn-33904-2018.yaml +100 -0
  133. data/maps/din-kat-Geor-Latn-32707-2010.yaml +145 -0
  134. data/maps/din-mar-Deva-Latn-33904-2018.yaml +84 -0
  135. data/maps/din-nep-Deva-Latn-33904-2018.yaml +119 -0
  136. data/maps/din-pli-Deva-Latn-33904-2018.yaml +75 -0
  137. data/maps/din-pra-Deva-Latn-33904-2018.yaml +63 -0
  138. data/maps/din-san-Deva-Latn-33904-2018.yaml +338 -0
  139. data/maps/din-tam-Taml-Latn-33903-2016.yaml +213 -0
  140. data/maps/dos-nep-Deva-Latn-1997.yaml +47 -0
  141. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +7 -8
  142. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +6 -7
  143. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +2 -3
  144. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +2 -3
  145. data/maps/ggg-kat-Geor-Latn-2002.yaml +5 -2
  146. data/maps/{gki-bel-cyrl-latn-1992.yaml → gki-bel-Cyrl-Latn-1992.yaml} +2 -2
  147. data/maps/{gki-bel-cyrl-latn-2000.yaml → gki-bel-Cyrl-Latn-2000.yaml} +2 -2
  148. data/maps/{gost-rus-cyrl-latn-16876-71-1983.yaml → gost-rus-Cyrl-Latn-16876-71-1983.yaml} +8 -4
  149. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +157 -0
  150. data/maps/hk-yue-Hani-Latn-1888.yaml +1 -1
  151. data/maps/icao-bel-Cyrl-Latn-9303.yaml +1 -6
  152. data/maps/icao-bul-Cyrl-Latn-9303.yaml +1 -5
  153. data/maps/{icao-per-Arab-Latn-9303.yaml → icao-fas-Arab-Latn-9303.yaml} +1 -2
  154. data/maps/icao-heb-Hebr-Latn-9303.yaml +1 -1
  155. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +1 -1
  156. data/maps/icao-rus-Cyrl-Latn-9303.yaml +1 -2
  157. data/maps/icao-srp-Cyrl-Latn-9303.yaml +1 -1
  158. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +1 -2
  159. data/maps/iso-ara-Arab-Latn-233-1984.yaml +323 -0
  160. data/maps/iso-asm-Beng-Latn-15919-2001.yaml +75 -0
  161. data/maps/iso-ben-Beng-Latn-15919-2001.yaml +175 -0
  162. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +11 -8
  163. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +8 -5
  164. data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +220 -0
  165. data/maps/iso-hin-Deva-Latn-15919-2001.yaml +87 -0
  166. data/maps/iso-inc-Deva-Latn-15919-2001.yaml +61 -0
  167. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +10 -6
  168. data/maps/iso-kan-Kana-Latn-15919-2001.yaml +220 -0
  169. data/maps/iso-kat-Geor-Latn-9984-1996.yaml +145 -0
  170. data/maps/iso-kor-Hang-Latn-1996-method1.yaml +240 -0
  171. data/maps/iso-kor-Hang-Latn-1996-method2.yaml +226 -0
  172. data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +281 -0
  173. data/maps/iso-mar-Deva-Latn-15919-2001.yaml +75 -0
  174. data/maps/iso-nep-Deva-Latn-15919-2001.yaml +87 -0
  175. data/maps/iso-ori-Orya-Latn-15919-2001.yaml +193 -0
  176. data/maps/iso-pan-Guru-Latn-15919-2001.yaml +222 -0
  177. data/maps/iso-pli-Beng-Latn-15919-2001.yaml +73 -0
  178. data/maps/iso-pli-Deva-Latn-15919-2001.yaml +74 -0
  179. data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +219 -0
  180. data/maps/iso-pli-Thai-Latn-15919-2001.yaml +55 -0
  181. data/maps/iso-pra-Deva-Latn-15919-2001.yaml +59 -0
  182. data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +366 -0
  183. data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +3 -4
  184. data/maps/iso-san-Deva-Latn-15919-2001.yaml +220 -0
  185. data/maps/iso-tam-Taml-Latn-15919-2001.yaml +159 -0
  186. data/maps/iso-tel-Telu-Latn-15919-2001.yaml +220 -0
  187. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +2 -2
  188. data/maps/kp-kor-Hang-Latn-2002.yaml +29 -21
  189. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +3 -3
  190. data/maps/masm-mon-Cyrl-Latn-5217-2012.yaml +163 -0
  191. data/maps/masm-mon-Latn-Cyrl-5217-2012.yaml +200 -0
  192. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +1 -1
  193. data/maps/moct-kor-Hang-Latn-2000.yaml +6 -2
  194. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +1 -1
  195. data/maps/mv-div-Thaa-Latn-1987.yaml +200 -0
  196. data/maps/mvd-bel-Cyrl-Latn-2008.yaml +225 -0
  197. data/maps/mvd-bel-Cyrl-Latn-2010.yaml +63 -0
  198. data/maps/mvd-rus-Cyrl-Latn-2008.yaml +109 -0
  199. data/maps/mvd-rus-Cyrl-Latn-2010.yaml +37 -0
  200. data/maps/odni-ara-Arab-Latn-2004.yaml +137 -0
  201. data/maps/odni-ara-Arab-Latn-2015.yaml +315 -0
  202. data/maps/odni-aze-Cyrl-Latn-2015.yaml +144 -0
  203. data/maps/odni-bel-Cyrl-Latn-2015.yaml +148 -0
  204. data/maps/odni-bul-Cyrl-Latn-2005.yaml +90 -0
  205. data/maps/odni-bul-Cyrl-Latn-2015.yaml +96 -0
  206. data/maps/odni-che-Cyrl-Latn-2015.yaml +169 -0
  207. data/maps/odni-fas-Arab-Latn-2004.yaml +276 -0
  208. data/maps/odni-fas-Arab-Latn-2015.yaml +406 -0
  209. data/maps/odni-hin-Deva-Latn-2004.yaml +182 -0
  210. data/maps/odni-hin-Deva-Latn-2015.yaml +258 -0
  211. data/maps/odni-kat-Geor-Latn-2015.yaml +2 -3
  212. data/maps/odni-kaz-Cyrl-Latn-2015.yaml +148 -0
  213. data/maps/odni-kir-Cyrl-Latn-2015.yaml +136 -0
  214. data/maps/odni-kor-Hang-Latn-2015.yaml +375 -0
  215. data/maps/odni-mkd-Cyrl-Latn-2005.yaml +21 -0
  216. data/maps/odni-mkd-Cyrl-Latn-2015.yaml +122 -0
  217. data/maps/odni-prs-Arab-Latn-2004.yaml +123 -0
  218. data/maps/odni-prs-Arab-Latn-2015.yaml +228 -0
  219. data/maps/odni-rus-Cyrl-Latn-2015.yaml +77 -0
  220. data/maps/odni-srp-Cyrl-Latn-2005.yaml +36 -0
  221. data/maps/odni-srp-Cyrl-Latn-2015.yaml +129 -0
  222. data/maps/odni-tat-Cyrl-Latn-2015.yaml +142 -0
  223. data/maps/odni-tgk-Cyrl-Latn-2015.yaml +148 -0
  224. data/maps/odni-tuk-Cyrl-Latn-2015.yaml +170 -0
  225. data/maps/odni-uig-Cyrl-Latn-2015.yaml +138 -0
  226. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +6 -2
  227. data/maps/odni-urd-Arab-Latn-2015.yaml +221 -0
  228. data/maps/odni-uzb-Cyrl-Latn-2015.yaml +166 -0
  229. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +5 -5
  230. data/maps/royin-tha-Thai-Latn-1968.yaml +9 -5
  231. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +5 -5
  232. data/maps/royin-tha-Thai-Latn-1999.yaml +8 -4
  233. data/maps/sac-zho-Hans-Latn-1979.yaml +5 -1
  234. data/maps/sasm-mon-Mong-Latn-general-1978.yaml +389 -0
  235. data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +354 -0
  236. data/maps/ses-ara-Arab-Latn-1930.yaml +283 -0
  237. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +1 -1
  238. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +6 -2
  239. data/maps/ua-ukr-Cyrl-Latn-2007.yaml +75 -0
  240. data/maps/ua-ukr-Cyrl-Latn-2010.yaml +192 -0
  241. data/maps/un-amh-Ethi-Latn-2016.yaml +602 -0
  242. data/maps/un-ara-Arab-Latn-1971.yaml +139 -0
  243. data/maps/un-ara-Arab-Latn-1972.yaml +159 -0
  244. data/maps/un-ara-Arab-Latn-2017.yaml +420 -0
  245. data/maps/un-asm-Beng-Latn-1972.yaml +223 -0
  246. data/maps/un-bel-Cyrl-Latn-2007.yaml +4 -4
  247. data/maps/un-ben-Beng-Latn-2016.yaml +1 -1
  248. data/maps/{un-ell-Grek-Latn-phonetic-1987.yaml → un-ell-Grek-Latn-1987-phonetic.yaml} +44 -44
  249. data/maps/un-ell-Grek-Latn-1987-tl.yaml +3 -4
  250. data/maps/un-ell-Grek-Latn-1987-ts.yaml +3 -4
  251. data/maps/un-guj-Gujr-Latn-1972.yaml +229 -0
  252. data/maps/un-hin-Deva-Latn-2016.yaml +316 -0
  253. data/maps/un-kan-Kana-Latn-2016.yaml +254 -0
  254. data/maps/un-mal-Mlym-Latn-1972.yaml +251 -0
  255. data/maps/un-mar-Deva-Latn-2016.yaml +102 -0
  256. data/maps/un-mon-Mong-Latn-general-2013.yaml +264 -0
  257. data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +264 -0
  258. data/maps/un-nep-Deva-Latn-1972.yaml +269 -0
  259. data/maps/un-nep-Deva-Latn-2013.yaml +74 -0
  260. data/maps/un-ori-Orya-Latn-1972.yaml +247 -0
  261. data/maps/un-pan-Guru-Latn-1972.yaml +402 -0
  262. data/maps/un-prs-Arab-Latn-1967.yaml +236 -0
  263. data/maps/un-rus-Cyrl-Latn-1987.yaml +2 -2
  264. data/maps/un-tam-Taml-Latn-1972.yaml +194 -0
  265. data/maps/un-tel-Telu-Latn-1972.yaml +270 -0
  266. data/maps/un-ukr-Cyrl-Latn-1998.yaml +53 -0
  267. data/maps/un-ukr-Cyrl-Latn-2012.yaml +162 -0
  268. data/maps/un-urd-Arab-Latn-1972.yaml +405 -0
  269. data/maps/var-amh-Ethi-Latn-eae-2003.yaml +466 -0
  270. data/maps/var-gez-Ethi-Latn-eae-2003.yaml +76 -0
  271. data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +221 -0
  272. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +1 -1
  273. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +1 -1
  274. data/maps/{nil-kor-Hang-Hang-jamo.yaml → var-kor-Hang-Hang-jamo.yaml} +4 -4
  275. data/maps/var-kor-Hang-Latn-mr-1939.yaml +4 -4
  276. data/maps/var-kor-Kore-Hang-2013.yaml +2 -2
  277. data/maps/var-kor-Kore-Latn-mr-1939.yaml +2 -3
  278. data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +43 -0
  279. data/maps/var-mon-Mong-Latn-1930.yaml +102 -0
  280. data/maps/var-mon-Mong-Latn-lessing.yaml +272 -0
  281. data/maps/var-mon-Mong-Latn-vpmc.yaml +274 -0
  282. data/maps/var-pra-Deva-Latn-iast-1912.yaml +30 -0
  283. data/maps/var-san-Deva-Latn-iast-1912.yaml +149 -0
  284. data/maps/var-tha-Thai-Thai-phonemic.yaml +6 -6
  285. data/maps/var-tha-Thai-Zsym-ipa.yaml +13 -13
  286. data/maps/{var-zho-Hani-Latn-1979.yaml → var-zho-Hani-Latn-wd-1979.yaml} +13 -9
  287. data/spec/interscript/filenames_spec.rb +21 -0
  288. data/spec/interscript_spec.rb +16 -5
  289. metadata +275 -27
  290. data/bin/interscript +0 -41
  291. data/bin/rspec +0 -29
  292. data/bin/setup +0 -8
  293. data/maps/un-mon-Mong-Latn-2013.yaml +0 -93
  294. data/maps/un-ukr-cyrl-latn-1998.yaml +0 -30
@@ -0,0 +1,166 @@
1
+ ---
2
+ authority_id: odni
3
+ id: 2015
4
+ language: iso-639-2:uzb
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: Office of the Director Of National Intelligence Uzbek Personal Names 2015, ICS-630-01 Annex V
8
+ # url:
9
+ source: ICS-630-01 Annex V
10
+ creation_date: 2015
11
+ confirmation_date: 2015
12
+ description: |
13
+ This system is the Intelligence Community standard for the transliteration of Uzbek person names
14
+ that will be applied to all final written reports and products for IC consumers. It is not intended to
15
+ eliminate variations of a name that can contribute forensic information. Rather, it is to provide an
16
+ IC standard Romanized (English) transliteration from Uzbek that can then be linked to forensic
17
+ information in ways that will help identify the referent of the name.
18
+
19
+ In cases where an individual’s name has already been transliterated in a variant spelling, the IC
20
+ Standard spelling should appear first, followed by the variant spelling(s) in parentheses at the first
21
+ usage. In addition, if the original Cyrillic-script spelling is known, that spelling should also
22
+ appear in parentheses following the name, if possible, following best practices of the issuing
23
+ organization and taking into consideration information system capabilities. For example:
24
+ Farkhod Tojiev (also seen as Farhod Tadjiyev, Фарход Тожиев). This convention is designed to
25
+ ensure that vital forensic information is not lost.
26
+
27
+ For names of persons who are known to not be part of the Uzbek-speaking community, use the
28
+ relevant IC transliteration standard for names from that language (e.g., Yitzhak). A translator’s
29
+ note may be used to clarify the known origin of the person. Spell names of individuals from
30
+ languages that are written in Roman letters as they are spelled in those languages (e.g., George
31
+ Clooney, Jorge Garcia, Georges Pompidou).
32
+
33
+ In the case of active senior government officials in the on-line CIA World Factbook and the online directory of Chiefs of State and Cabinet Members of Foreign Governments, the spellings
34
+ given in these on-line reference works should be used in place of the IC Standard. For any
35
+ individual who has at one time been listed in the Factbook or Chiefs of State directory but who no
36
+ longer appears in those resources (i.e. is no longer a government official), the IC Standard
37
+ spelling should appear first, with the spelling, if known, as it previously appeared in those
38
+ resources listed within parentheses at the first usage.
39
+
40
+ The primary goal is to produce a consistent Romanized transcription of names that is specifically
41
+ readable to the English-speaking non-specialist. The system uses the 26 letters of the standard
42
+ (English) Roman alphabet. Some ambiguities in the Romanized form will occur without the use
43
+ of diacritics. However, within the context of a report, where additional information about the
44
+ individual is provided, the referent will be clearly identified. This system will be used in
45
+ conjunction with on-line tools, name dictionaries, and lists containing conventional spellings of
46
+ names of well-known individuals.
47
+
48
+ notes:
49
+ - Transliterate double digraphs as a single digraph, i.e. шш -> sh, not shsh
50
+ - In the Roman, no distinction is made between digraphs such as 'sh' and single contiguous letters, (e.g. 's' followed by 'h').
51
+ - The Cyrillic ъ and ь are not transliterated, but instead are left out of the transliteration.
52
+
53
+ tests:
54
+ - source: Фарход Тожиев
55
+ expected: Farkhod Tojiev
56
+ - source: Барча одамлар эркин, қадр-қиммат в ҳуқуқлард тенг бўлиб туғиладилар. Улар ақл в виждон соҳибидирлар в бир-бирлари ила биродарларча муомал қилишларь зарур.
57
+ expected: Barcha odamlar erkin, qadr-qimat v huquqlard teng bolib tughiladilar. Ular aql v vijdon sohibidirlar v bir-birlari ila birodarlarcha muomal qilishlar zarur.
58
+ - source: Тутук белгись
59
+ expected: Tutuk belgis
60
+ - source: Янги юл
61
+ expected: Yangi iul
62
+ - source: Ўзбек ёзуви
63
+ expected: Ozbek yozuvi
64
+ - source: Чиғатай гурунги
65
+ expected: Chighatay gurungi
66
+ - source: ъ
67
+ expected: ''
68
+ - source: шш
69
+ expected: sh
70
+ - source: ччччч
71
+ expected: ch
72
+
73
+ map:
74
+ rules:
75
+ # note[1]
76
+ - pattern: "(.)\\1{1,}"
77
+ result: "\\1"
78
+
79
+ characters:
80
+ '\u0410': 'A' # А
81
+ '\u0411': 'B' # Б
82
+ '\u0412': 'V' # В
83
+ '\u0413': 'G' # Г
84
+ '\u0492': 'Gh' # Ғ
85
+ '\u0414': 'D' # Д
86
+ '\u0415': 'E' # Е
87
+ '\u0401': 'Yo' # Ё
88
+ '\u0416': 'J' # Ж
89
+ '\u0417': 'Z' # З
90
+ '\u0418': 'I' # И
91
+ '\u0419': 'Y' # Й
92
+ '\u041A': 'K' # К
93
+ '\u049A': 'Q' # Қ
94
+ '\u041B': 'L' # Л
95
+ '\u041C': 'M' # М
96
+ '\u041D': 'N' # Н
97
+ '\u041E': 'O' # О
98
+ '\u041F': 'P' # П
99
+ '\u0420': 'R' # Р
100
+ '\u0421': 'S' # С
101
+ '\u0422': 'T' # Т
102
+ '\u0423': 'U' # У
103
+ '\u040E': 'O' # Ў
104
+ '\u0424': 'F' # Ф
105
+ '\u0425': 'Kh' # Х
106
+ '\u04B2': 'H' # Ҳ
107
+ '\u0426': 'Ts' # Ц
108
+ '\u0427': 'Ch' # Ч
109
+ '\u0428': 'Sh' # Ш
110
+ '\u042D': 'E' # Э
111
+ '\u042E': 'Yu' # Ю
112
+ '\u042F': 'Ya' # Я
113
+
114
+ '\u0430': 'a' # а
115
+ '\u0431': 'b' # б
116
+ '\u0432': 'v' # в
117
+ '\u0433': 'g' # г
118
+ '\u0493': 'gh' # ғ
119
+ '\u0434': 'd' # д
120
+ '\u0435': 'e' # e
121
+ '\u0451': 'yo' # ё
122
+ '\u0436': 'j' # ж
123
+ '\u0437': 'z' # з
124
+ '\u0438': 'i' # и
125
+ '\u0439': 'y' # й
126
+ '\u043A': 'k' # к
127
+ '\u049B': 'q' # қ
128
+ '\u043B': 'l' # л
129
+ '\u043C': 'm' # м
130
+ '\u043D': 'n' # н
131
+ '\u043E': 'o' # о
132
+ '\u043F': 'p' # п
133
+ '\u0440': 'r' # р
134
+ '\u0441': 's' # с
135
+ '\u0442': 't' # т
136
+ '\u0443': 'u' # у
137
+ '\u045E': 'o' # ў
138
+ '\u0444': 'f' # ф
139
+ '\u044B': 'y' # ы
140
+ '\u0447': 'ch' # ч
141
+ '\u044F': 'ia' # я
142
+ '\u044E': 'iu' # ю
143
+ '\u0445': 'kh' # х
144
+ '\u04B3': 'h' # ҳ
145
+ '\u0448': 'sh' # ш
146
+ '\u044D': 'e' # э
147
+ '\u0449': 'shch' # щ
148
+ '\u0446': 'ts' # ц
149
+ '\u0491': 'g' # ґ
150
+ '\u046B': 'u' # ѫ
151
+ '\u0452': 'd' # ђ
152
+ '\u0455': 'dz' # ѕ
153
+ '\u0458': 'j' # ј
154
+ '\u0459': 'lj' # љ
155
+ '\u045A': 'nj' # њ
156
+ '\u04BB': 'c' # һ
157
+ '\u045F': 'dz' # џ
158
+ '\u0454': 'ie' # є
159
+ '\u0457': 'i' # ї
160
+ '\u0453': 'g' # ѓ
161
+
162
+ # note[3]
163
+ '\u042a': '' # Ъ
164
+ '\u042c': '' # Ь
165
+ '\u044a': '' # ъ
166
+ '\u044c': '' # ь
@@ -1,17 +1,17 @@
1
1
  ---
2
2
  authority_id: royin
3
3
  id: 1939-generic
4
- language: tha
4
+ language: iso-639-2:tha
5
5
  source_script: Thai
6
6
  destination_script: Latn
7
7
  name: Royal Thai General System of Transcription (1939) Generic
8
8
  url: http://www.siamese-heritage.org/jsspdf/1941/JSS_033_1d_RoyalInstituteTranscriptionOfThaiIntoRomanCharacters.pdf
9
9
  creation_date: 1939
10
- adoption_date:
10
+ adoption_date:
11
11
  description: |
12
12
  This map loads two external maps to convert Thai text first into phonemic Thai,
13
13
  and then into IPA transcription.
14
-
14
+
15
15
  The IPA transcription will then be handled by this map, and converted into
16
16
  Royal Thai General System of Transcription (1939)
17
17
 
@@ -37,7 +37,7 @@ chain: ["var-tha-Thai-Thai-phonemic" ,"var-tha-Thai-Zsym-ipa"]
37
37
 
38
38
  map:
39
39
  title-case: false
40
- word_separator: " "
40
+ word_separator: " "
41
41
 
42
42
  rules:
43
43
  - pattern: '[˩˨˧˦˥]'
@@ -62,7 +62,7 @@ map:
62
62
  'ŋ': 'ng'
63
63
  'j': 'y'
64
64
  'ɔ': 'o̦'
65
- 'ɤ': 'œ'
65
+ 'ɤ': 'œ'
66
66
  'ɛ': 'æ'
67
67
  'ɯ': 'ư'
68
68
  'ʰ': 'h'
@@ -1,17 +1,21 @@
1
1
  ---
2
2
  authority_id: royin
3
3
  id: 1968-chained
4
- language: tha
4
+ language: iso-639-2:tha
5
5
  source_script: Thai
6
6
  destination_script: Latn
7
7
  name: Royal Thai General System of Transcription (1968)
8
+ alias:
9
+ ogc11122:
10
+ code: tha_Thai2Latn_RIT_1968
11
+ description: Thai Royal Institute of Thailand 1968 System (out of date)
8
12
  url: http://www.royin.go.th/wp-content/uploads/royin-ebook/276/FileUpload/758_6484.pdf
9
13
  creation_date: 1968
10
- adoption_date:
14
+ adoption_date:
11
15
  description: |
12
16
  This map loads two external maps to convert Thai text first into phonemic Thai,
13
17
  and then into IPA transcription.
14
-
18
+
15
19
  The IPA transcription will then be handled by this map, and converted into
16
20
  Royal Thai General System of Transcription (1968).
17
21
 
@@ -124,7 +128,7 @@ chain: ["var-tha-Thai-Thai-phonemic" ,"var-tha-Thai-Zsym-ipa"]
124
128
 
125
129
  map:
126
130
  title-case: false
127
- word_separator: " "
131
+ word_separator: " "
128
132
 
129
133
  rules:
130
134
  - pattern: '[˩˨˧˦˥]'
@@ -151,7 +155,7 @@ map:
151
155
  'ŋ': 'ng'
152
156
  'j': 'y'
153
157
  'ɔ': 'o'
154
- 'ɤ': 'oe'
158
+ 'ɤ': 'oe'
155
159
  'ɛ': 'ae'
156
160
  'ɯ': 'u'
157
161
  'ʰ': 'h'
@@ -1,17 +1,17 @@
1
1
  ---
2
2
  authority_id: royin
3
3
  id: 1999-chained
4
- language: tha
4
+ language: iso-639-2:tha
5
5
  source_script: Thai
6
6
  destination_script: Latn
7
7
  name: Royal Thai General System of Transcription (1999)
8
8
  url: http://www.royin.go.th/wp-content/uploads/royin-ebook/276/FileUpload/758_6484.pdf
9
9
  creation_date: 1999
10
- adoption_date:
10
+ adoption_date:
11
11
  description: |
12
12
  This map loads two external maps to convert Thai text first into phonemic Thai,
13
13
  and then into IPA transcription.
14
-
14
+
15
15
  The IPA transcription will then be handled by this map, and converted into
16
16
  Royal Thai General System of Transcription (1999)
17
17
 
@@ -125,7 +125,7 @@ chain: ["var-tha-Thai-Thai-phonemic" ,"var-tha-Thai-Zsym-ipa"]
125
125
 
126
126
  map:
127
127
  title-case: false
128
- word_separator: " "
128
+ word_separator: " "
129
129
 
130
130
  rules:
131
131
  - pattern: '[˩˨˧˦˥]'
@@ -152,7 +152,7 @@ map:
152
152
  'ŋ': 'ng'
153
153
  'j': 'y'
154
154
  'ɔ': 'o'
155
- 'ɤ': 'oe'
155
+ 'ɤ': 'oe'
156
156
  'ɛ': 'ae'
157
157
  'ɯ': 'ue' # New spelling, was u in 1968
158
158
  'ʰ': 'h'
@@ -1,13 +1,17 @@
1
1
  ---
2
2
  authority_id: royin
3
3
  id: 1999
4
- language: tha
4
+ language: iso-639-2:tha
5
5
  source_script: Thai
6
6
  destination_script: Latn
7
7
  name: Royal Thai General System of Transcription (1999)
8
+ alias:
9
+ ogc11122:
10
+ code: tir_Thai2Latn_RIT_2000
11
+ description: Thai Royal Institute of Thailand 2000 System
8
12
  url: http://www.royin.go.th/wp-content/uploads/royin-ebook/276/FileUpload/758_6484.pdf
9
13
  creation_date: 1999
10
- adoption_date:
14
+ adoption_date:
11
15
  description:
12
16
 
13
17
  notes: |
@@ -48,7 +52,7 @@ tests:
48
52
 
49
53
  map:
50
54
  title-case: false
51
- word_separator: " "
55
+ word_separator: " "
52
56
  transcription: "sequitur.pythainlp_lexicon"
53
57
 
54
58
  rules:
@@ -68,7 +72,7 @@ map:
68
72
  'j': 'i'
69
73
  'w': 'o'
70
74
  'ɔ': 'o'
71
- 'ɤ': 'oe'
75
+ 'ɤ': 'oe'
72
76
  'ɛ': 'ae'
73
77
  'ɯ': 'ue'
74
78
  'ʔ' : ''
@@ -1,10 +1,14 @@
1
1
  ---
2
2
  authority_id: sac
3
3
  id: 1979
4
- language: chn
4
+ language: iso-639-2:chn
5
5
  source_script: Hans
6
6
  destination_script: Latn
7
7
  name: Pinyin
8
+ alias:
9
+ ogc11122:
10
+ code: zho_Hani2Latn_GCH_1979
11
+ description: Chinese Hanyu Pinyin 1979 System
8
12
  url: ftp://ftp.cuhk.hk/pub/chinese/ifcss/software/data/Uni2Pinyin.gz
9
13
  creation_date: 1996-04-17
10
14
  description: |
@@ -0,0 +1,389 @@
1
+ ---
2
+ authority_id: sasm
3
+ id: general-1978
4
+ language: iso-639-2:mon
5
+ source_script: Mong
6
+ destination_script: Latn
7
+ name: Transliteration of Place Names in Minority Languages in Chinese Pinyin (Mongolian, general)
8
+ url: http://www.moe.gov.cn/ewebeditor/uploadfile/2015/01/12/20150112161436994.pdf
9
+ creation_date: 1976-06
10
+ description: |
11
+ Article 1
12
+
13
+ The main purpose of the transliteration method of Chinese pinyin
14
+ letter transliteration of place names in minority languages:
15
+
16
+ (1) As a standard for spelling place names in minority languages
17
+ with Chinese phonetic alphabet;
18
+ (2) As a phonetic tool for surveying and recording ethnic place
19
+ names in map surveying and mapping work;
20
+ (3) As the main basis for the pronunciation and selection of place
21
+ names in ethnic minority languages in Chinese character
22
+ transliteration;
23
+ (4) Provide convenient conditions for the unified compilation of my
24
+ country's place-name information and index in alphabetical order.
25
+
26
+ Article 2
27
+
28
+ The transliteration method is limited to the 26 letters of the
29
+ "Hanyu Pinyin Plan", two letters with diacritics, and a
30
+ syllable-dividing mark. To make transcription and phonetic recording
31
+ more accurate, the syllable structure need not be restricted by the
32
+ syllable forms of Mandarin Chinese. The syllable-dividing mark may be
33
+ used wherever confusion could arise. In phonetic recording,
34
+ diacritics may be added to specific letters to represent
35
+ special sounds.
36
+
37
+ Where a minority language is written in Latin letters, the
38
+ transliteration shall be based on that script. Letters with the same
39
+ or similar pronunciation and usage as in the "Hanyu Pinyin Plan"
40
+ shall be written unchanged; for different or dissimilar letters,
41
+ transliteration rules are specified individually. Where the script
42
+ is not Latin, the corresponding Hanyu Pinyin letters shall be used
43
+ according to the pronunciation of the script. Where there is no
44
+ script, the commonly used pronunciation shall be transcribed.
45
+
46
+ Article 3
47
+
48
+ Special place names are handled with reference to the following
49
+ methods:
50
+
51
+ (1) If the commonly used Chinese name is partly transliterated and
52
+ partly translated, the transliteration part is spelled according to
53
+ the transliteration method, and the free translation part is
54
+ spelled according to the pronunciation of the Chinese character.
55
+
56
+ (2) If the commonly used Chinese character translation is a section
57
+ translation, the actual situation may be considered. Some are
58
+ transliterated according to the full name of the original name, and
59
+ some are spelled according to the Hanyu pronunciation of the
60
+ section translation.
61
+
62
+ (3) If the translated name of a Chinese character originally came
63
+ from a minority language, but later became a Chinese form and has
64
+ been commonly used, it can be spelled according to the
65
+ pronunciation of the Chinese character, including the original name
66
+ transliterated if necessary.
67
+
68
+ (4) Other special circumstances shall be dealt with according to
69
+ specific discretion.
70
+
71
+ original_description: |
72
+ 第一条
73
+
74
+ 少数民族语地名汉语拼音字母音译转写法的主要用途:
75
+
76
+ (1) 作为用汉语拼音字母拼写少数民族语地名的标准;
77
+ (2)作为地图测绘工作中调査记录少数民族语地名的记音工具;
78
+ (3) 作为汉字音译少数民族语地名定音和选字的主要依据;
79
+ (4)为按照字母顺序统一编排我国地名资料和索引提供便利条件。
80
+
81
+ 第二条
82
+
83
+ 音译转写法限用《汉语拼音方案》中的26个字母,两个有附加符号的字母和一
84
+ 个隔音符号,为了使转写和记音比较准确,音节结构可以不受汉语普通话音节
85
+ 形式的限制,隔音符号可以在各种
86
+ 容易混淆的场合应用,记音的时候附加符号可以加在特定的字母上面代表特殊
87
+ 语音。
88
+
89
+
90
+ 少数民族文字用拉丁字母的,音译转写以其文字为依据。跟《汉语拼音方案》
91
+ 中读音和用法相同或相近的字母,一律照写;不同或不相近的字母分别规定转
92
+ 写方式,文字不用拉丁字母的,根据文字的读音采用相应的汉语拼音字母表示
93
+ 。没有文字的,根据通用语音标记。
94
+
95
+ 第三条
96
+
97
+ 特殊的地名参照下列办法处理:
98
+
99
+
100
+ (1)惯用的汉字译名如果是一部分音译,一部分意译,其音译部分根据音译转
101
+ 写法拼写,意译部分按照汉字读音拼写。
102
+
103
+
104
+ (2)惯用的汉字译名如果是节译,可以斟酌具体情况,有的按照原名全称音
105
+ 译转写,有的按照节译的汉字读音拼写。
106
+
107
+ (3) 汉字译名如果原先来自少数民族语,后来变成汉语形式并且已经通用,可以按
108
+ 照汉字读音拼写,必要时括注音译转写的原名。
109
+
110
+ (4) 其他特殊情况具体斟酌处理。
111
+
112
+ notes:
113
+ - The transliteration of Mongolian place names is based on the
114
+ customary pronunciation combining written and spoken languages.
115
+ - Vowel length in Mongolian is generally not distinguished in
116
+ ordinary spelling. In phonetic recording of place names, long
117
+ vowels are represented by double letters.
118
+ - Where the Hanyu Pinyin letters used for transliteration are listed
119
+ in both a plain form and a form with diacritics, ordinary spelling
120
+ uses the plain letters, and phonetic recording of place names uses
121
+ the letters with diacritics.
122
+
123
+ original_notes:
124
+ (1) 蒙古语地名的音译转写,以书面语和口语通用相结合的习惯读法为依据。
125
+ (2) 蒙古语元音的长短,一般拼写不分,地名记音中长元音用双字母表示。
126
+ (3) 音译转写的汉语拼音字母有无符和加符并列的,一般拼写用无符字母,地名记音用加符字母。
127
+
128
+ implementation_notes:
129
+ - A separated final form of vowels a or e is common, and can appear at the end
130
+ of a word, word stem, or suffix. This form requires a final-shaped preceding
131
+ consonant and an inter-word gap in between. The vowels themselves appear as ᠎ᠠ,
132
+ and with consonants as ‍ᠬ᠎ᠠ q‑a, ‍ᠷ᠎ᠠ r‑a/r‑e, etc. This gap can be transliterated
133
+ with a hyphen. In digital typesetting, these forms are triggered by inserting
134
+ a U+180E ᠎ MONGOLIAN VOWEL SEPARATOR (HTML ᠎ · MVS) between the consonant
135
+ and vowel.
136
+ - All case suffixes, as well as any plural suffixes consisting of one or two
137
+ syllables are likewise separated by a preceding and hyphen-transliterated gap.
138
+ In digital typesetting, this gap is represented by a U+202F   NARROW NO-BREAK SPACE
139
+ (HTML   · NNBSP). A maximum of two case suffixes can be added to a stem.
140
+ Single-letter vowel suffixes appear with the final-shaped forms of a/e, i, or u/ü,
141
+ as in ᠭᠠᠵᠠᠷ ᠠ γaǰar‑a 'to the country' and ᠡᠳᠦᠷ ᠡ edür‑e 'on the day', or ᠤᠯᠤᠰ ᠢ ulus‑i
142
+ 'the state' etc. Multi-letter suffixes most often start with an initial- (consonants),
143
+ medial- (vowels), or variant-shaped form.
144
+
145
+ tests:
146
+ - source: ᠣᠷᠳᠣᠰ ᠬᠣᠲᠠ # Ордос хот
147
+ expected: ordos hota
148
+ - source: ᠪᠠᠶᠠᠨᠨᠠᠭᠤᠷ ᠬᠣᠲᠠ # Баяннуур хот
149
+ expected: bayannagur hota
150
+ - source: ᠤᠯᠠᠭᠠᠨᠬᠣᠲᠠ # Улаан хот
151
+ expected: ulaganhota
152
+ - source: ᠬᠣᠣᠯᠢᠠ ᠭᠣᠤᠯ ᠬᠣᠲᠠ # Хоолингол хот
153
+ expected: hoolia goul hota
154
+ - source: ᠡᠷᠢᠶᠡᠨ ᠬᠣᠲᠠ # Эрээн хот
155
+ expected: eriyen hota
156
+ - source: ᠷᠠᠰᠢᠶᠠᠨ ᠬᠣᠲᠠ # Рашаан хот
157
+ expected: rasiyan hota
158
+ - source: ᠪᠠᠭᠠᠷᠢᠨ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # Баарин баруун хошуу
159
+ expected: bagarin baragun hosigu
160
+ - source: ᠪᠠᠭᠠᠷᠢᠨ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # Баарин зүүн хошуу
161
+ expected: bagarin jegun hosigu
162
+ - source: ᠲᠦᠩᠯᠢᠶᠣᠤ ᠬᠣᠲᠠ # Байшинт хот
163
+ expected: tungliyou hota
164
+ - source: ᠰᠢᠯᠢ ᠶᠢᠨ ᠬᠣᠲᠠ # Шилийн хот
165
+ expected: sili-yin hota
166
+ - source: ᠬᠣᠷᠢᠨ ᠭᠡᠷ ᠰᠢᠶᠠᠨ # Horinger County
167
+ expected: horin ger siyan
168
+ - source: ᠤᠳᠠ ᠲᠣᠭᠣᠷᠢᠭ # Уда тойрог
169
+ expected: uda togorig
170
+ - source: ᠦᠬᠠᠢ ᠬᠣᠲᠠ # Үхай хот
171
+ expected: uhai hota
172
+ - source: ᠬᠠᠶᠢᠨᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Hainan District
173
+ expected: hayinan togorig
174
+ - source: ᠬᠠᠶᠢᠷᠤᠪ ᠤᠨ ᠲᠣᠬᠣᠢ ᠲᠣᠭᠣᠷᠢᠭ # Haibowan District
175
+ expected: hayirub-un tohoi togorig
176
+ - source: ᠤᠯᠠᠭᠠᠨᠴᠠᠪ ᠬᠣᠲᠠ # Улаанцав хот
177
+ expected: ulaganqab hota
178
+ - source: ᠵᠢᠨᠢᠩ ᠲᠣᠭᠣᠷᠢᠭ # Жинин тойрог
179
+ expected: jining togorig
180
+ - source: ᠹᠸᠩᠵᠸᠡ ᠬᠣᠲᠠ # Фенжень хот
181
+ expected: fwngjwe hota
182
+ - source: ᠵᠦᠸᠧᠽᠢ ᠰᠢᠶᠠᠨ # Zhuozi County
183
+ expected: juwezi siyan
184
+ - source: ᠬᠤᠸᠠᠳᠧ ᠰᠢᠶᠠᠨ # Huade County
185
+ expected: huwade siyan
186
+ - source: ᠱᠠᠩᠳᠤ ᠰᠢᠶᠠᠨ # Шанду шянь
187
+ expected: xangdu siyan
188
+ - source: ᠰᠢᠩᠾᠧ ᠰᠢᠶᠠᠨ # Шинхэ шянь
189
+ expected: singhe siyan
190
+ - source: ᠯᠢᠶᠠᠩᠴᠠᠩ ᠰᠢᠶᠠᠨ # Liangcheng County
191
+ expected: liyangqang siyan
192
+ - source: ᠴᠠᠬᠠᠷ ᠪᠠᠷᠠᠭᠤᠨ ᠭᠠᠷᠤᠨ ᠡᠮᠦᠨᠡᠳᠦ ᠬᠣᠰᠢᠭᠤ # Цахар баруун гарын өмнөд хошуу
193
+ expected: qahar baragun garun emunedu hosigu
194
+ - source: ᠴᠠᠬᠠᠷ ᠪᠠᠷᠠᠭᠤᠨ ᠭᠠᠷᠤᠨ ᠳᠤᠮᠳᠠᠳᠤ ᠬᠣᠰᠢᠭᠤ # Цахар баруун гарын дундад хошуу
195
+ expected: qahar baragun garun dumdadu hosigu
196
+ - source: ᠴᠠᠬᠠᠷ ᠪᠠᠷᠠᠭᠤᠨ ᠭᠠᠷᠤᠨ ᠬᠣᠶᠢᠲᠤ ᠬᠣᠰᠢᠭᠤ # Цахар баруун гарын хойд хошуу
197
+ expected: qahar baragun garun hoyitu hosigu
198
+ - source: ᠳᠥᠷᠪᠡᠳ ᠬᠣᠰᠢᠭᠤ # Дөрвөд хошуу
199
+ expected: dorbed hosigu
200
+ - source: ᠪᠤᠭᠤᠲᠤ ᠬᠣᠲᠠ # Бугaт хот
201
+ expected: bugutu hota
202
+ - source: ᠬᠥᠨᠳᠡᠯᠡᠨ ᠲᠣᠭᠣᠷᠢᠭ # Hondlon District
203
+ expected: hondelen togorig
204
+ - source: ᠳᠦᠩᠾᠧ ᠲᠣᠭᠣᠷᠢᠭ # Donghe District
205
+ expected: dunghe togorig
206
+ - source: ᠴᠢᠩᠱᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Qingshan District
207
+ expected: qingxan togorig
208
+ - source: ᠰᠢᠭᠤᠶᠢᠲᠤ ᠲᠣᠭᠣᠷᠢᠭ # Шигуай тойрог
209
+ expected: siguyitu togorig
210
+ - source: ᠵᠢᠦ ᠶᠤᠸᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Jiuyuan District
211
+ expected: jiu yuwan togorig
212
+ - source: ᠭᠦᠶᠠᠩ ᠰᠢᠶᠠᠨ # Guyang County
213
+ expected: guyang siyan
214
+ - source: ᠲᠦᠮᠡᠳ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # Түмэд Зүүн хошуу
215
+ expected: tumed jegun hosigu
216
+ - source: ᠲᠦᠮᠡᠳ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # Түмэд Баруун хошуу
217
+ expected: tumed baragun hosigu
218
+ - source: ᠳᠠᠷᠬᠠᠨ ᠮᠤᠤᠮᠢᠩᠭ᠋ᠠᠨ ᠬᠣᠯᠪᠣᠭᠠᠲᠤ ᠬᠣᠰᠢᠭᠤ # Darhan Muminggan United Banner
219
+ expected: darhan muumingg᠋an holbogatu hosigu
220
+ - source: ᠬᠡᠰᠢᠭᠲᠡᠨ ᠬᠣᠰᠢᠭᠤ # Hexigten Banner
221
+ expected: hesigten hosigu
222
+ - source: ᠰᠢᠨ᠎ᠡ ᠪᠠᠷᠭᠤ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # New Barag Left Banner
223
+ expected: sin-e bargu jegun hosigu
224
+ - source: ᠰᠢᠨ᠎ᠡ ᠪᠠᠷᠭᠤ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # New Barag Right Banner
225
+ expected: sin-e bargu baragun hosigu
226
+ - source: ᠣᠲᠣᠭ ᠬᠣᠰᠢᠭᠤ # Otog Banner
227
+ expected: otog hosigu
228
+ - source: ᠳ᠋ᠦᠩᠱᠧᠩ ᠲᠣᠭᠣᠷᠢᠭ # Dongsheng District
229
+ expected: d᠋ungxeng togorig
230
+ - source: ᠳᠠᠯᠠᠳ ᠬᠣᠰᠢᠭᠤ # Dalad Banner
231
+ expected: dalad hosigu
232
+ - source: ᠵᠡᠭᠦᠨᠭᠠᠷ ᠬᠣᠰᠢᠭᠤ # Jungar Banner
233
+ expected: jegungar hosigu
234
+ - source: ᠣᠲᠣᠭ ᠤᠨ ᠡᠮᠦᠨᠡᠳᠦ ᠬᠣᠰᠢᠭᠤ # Otog Front Banner
235
+ expected: otog-un emunedu hosigu
236
+ - source: ᠬᠠᠩᠭᠢᠨ ᠬᠣᠰᠢᠭᠤ # Hanggin Banner
237
+ expected: hanggin hosigu
238
+ - source: ᠦᠦᠰᠢᠨ ᠬᠣᠰᠢᠭᠤ # Uxin Banner
239
+ expected: uusin hosigu
240
+ - source: ᠡᠵᠢᠨ ᠬᠣᠷᠣᠭ᠎ᠠ ᠬᠣᠰᠢᠭᠤ # Эзэн Хороо хошуу
241
+ expected: ejin horog-a hosigu
242
+ - source: ᠵᠠᠯᠠᠨ ᠠᠢ᠌ᠯ ᠬᠣᠲᠠ # Жалан-Айл хот
243
+ expected: jalan ai᠌l hota
244
+ - source: ᠶᠠᠭᠰᠢ ᠬᠣᠲᠠ # Ягши хот
245
+ expected: yagsi hota
246
+ - source: ᠮᠠᠨᠵᠤᠤᠷ ᠬᠣᠲᠠ # Манжуур хот
247
+ expected: manjuur hota
248
+ - source: ᠬᠠᠶᠢᠯᠠᠷ ᠲᠣᠭᠣᠷᠢᠭ # Хайлаар тойрог
249
+ expected: hayilar togorig
250
+ - source: ᠬᠣᠷᠴᠢᠨ ᠲᠣᠭᠣᠷᠢᠭ # Horqin District
251
+ expected: horqin togorig
252
+ - source: ᠺᠠᠶᠢᠯᠦ ᠰᠢᠶᠠᠨ # Kailu County
253
+ expected: kayilu siyan
254
+ - source: ᠬᠦᠷᠢᠶ᠎ᠡ ᠬᠣᠰᠢᠭᠤ # Hure Banner
255
+ expected: huriy-e hosigu
256
+ - source: ᠨᠠᠢᠮᠠᠨ ᠬᠣᠰᠢᠭᠤ # Naiman Banner
257
+ expected: naiman hosigu
258
+ - source: ᠵᠠᠷᠤᠳ ᠬᠣᠰᠢᠭᠤ # Jarud Banner
259
+ expected: jarud hosigu
260
+ - source: ᠬᠣᠷᠴᠢᠨ ᠪᠠᠷᠠᠭᠤᠨ ᠭᠠᠷᠤᠨ ᠳᠤᠮᠳᠠᠳᠤ ᠬᠣᠰᠢᠭᠤ # Хорчин Баруун Гарын Дундад Хошуу
261
+ expected: horqin baragun garun dumdadu hosigu
262
+ - source: ᠬᠣᠷᠴᠢᠨ ᠵᠡᠭᠦᠨ ᠭᠠᠷᠤᠨ ᠳᠤᠮᠳᠠᠳᠤ ᠬᠣᠰᠢᠭᠤ # Horqin Left Middle Banner
263
+ expected: horqin jegun garun dumdadu hosigu
264
+ - source: ᠬᠣᠷᠴᠢᠨ ᠵᠡᠭᠦᠨ ᠭᠠᠷᠤᠨ ᠬᠣᠶᠢᠲᠤ ᠬᠣᠰᠢᠭᠤ # Horqin Left Rear Banner
265
+ expected: horqin jegun garun hoyitu hosigu
266
+ - source: ᠤᠯᠠᠭᠠᠨᠬᠠᠳᠠ ᠬᠣᠲᠠ # Улаанхад хот
267
+ expected: ulaganhada hota
268
+ - source: ᠰᠡᠷᠡᠴᠢ # Salaqi
269
+ expected: sereqi
270
+ - source: ᠭᠡᠭᠡᠨ ᠭᠣᠤᠯ ᠬᠣᠲᠠ # Гэгээнгол хот
271
+ expected: gegen goul hota
272
+ - source: ᠠᠯᠠᠱᠠ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # Alxa Left Banner
273
+ expected: alaxa jegun hosigu
274
+ - source: ᠠᠯᠠᠱᠠ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # Alxa Right Banner
275
+ expected: alaxa baragun hosigu
276
+ - source: ᠡᠵᠡᠨ᠎ᠡ ᠬᠣᠰᠢᠭᠤ # Ejin Banner
277
+ expected: ejen-e hosigu
278
+ - source: ᠬᠥᠪᠡᠭᠡᠲᠦ ᠰᠢᠷ᠎ᠠ ᠬᠣᠰᠢᠭᠤ # Хөвөөт Шар хошуу
279
+ expected: hobegetu sir-a hosigu
280
+ - source: ᠦᠶᠤᠸᠠᠨ ᠰᠢᠶᠠᠨ # Үюань шянь
281
+ expected: uyuwan siyan
282
+ - source: ᠦᠴᠤᠸᠠᠨ ᠰᠢᠶᠠᠨ # Wuchuan County
283
+ expected: uquwan siyan
284
+ - source: ᠲᠦᠴᠢᠤᠸᠠᠨ ᠰᠢᠶᠠᠨ # Тучуань шянь
285
+ expected: tuqiuwan siyan
286
+ - source: ᠨᠢᠩᠴᠧᠩ ᠰᠢᠶᠠᠨ # Ningcheng County
287
+ expected: ningqeng siyan
288
+ - source: ᠯᠢᠨᠰᠢ ᠰᠢᠶᠠᠨ # Linxi County
289
+ expected: linsi siyan
290
+ - source: ᠯᠢᠨᠾᠧ ᠲᠣᠭᠣᠷᠢᠭ # Linhe
291
+ expected: linhe togorig
292
+ - source: ᠬᠠᠷᠠᠴᠢᠨ ᠬᠣᠰᠢᠭᠤ # Harqin Banner
293
+ expected: haraqin hosigu
294
+ - source: ᠳ᠋ᠧᠩᠺᠧᠦ ᠰᠢᠶᠠᠨ # Dengkou County
295
+ expected: d᠋engkeu siyan
296
+ - source: ᠠᠤᠬᠠᠨ ᠬᠣᠰᠢᠭᠤ # Aohan Banner
297
+ expected: auhan hosigu
298
+ - source: ᠴᠢᠩ ᠱᠦᠢ ᠾᠧ ᠰᠢᠶᠠᠨ # Qingshuihe County
299
+ expected: qing xui he siyan
300
+ - source: ᠬᠣᠳᠣᠩ ᠠᠷᠠᠳ ᠤᠨ ᠲᠣᠭᠣᠷᠢᠭ # Huimin District
301
+ expected: hodong arad-un togorig
302
+ - source: ᠰᠠᠶᠢᠬᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Saihan District
303
+ expected: sayihan togorig
304
+ - source: ᠰᠢᠨ᠎ᠡ ᠬᠣᠲᠠ ᠲᠣᠭᠣᠷᠢᠭ # Xincheng District
305
+ expected: sin-e hota togorig
306
+ - source: ᠬᠠᠶᠢᠷᠤᠪ ᠤᠨ ᠲᠣᠬᠣᠢ ᠲᠣᠭᠣᠷᠢᠭ # Haibowan (Hairibin Tohoi) District
307
+ expected: hayirub-un tohoi togorig
308
+ - source: ᠰᠦᠩ ᠱᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Songshan District
309
+ expected: sung xan togorig
310
+ - source: ᠬᠦᠩ ᠱᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Hongshan District
311
+ expected: hung xan togorig
312
+ - source: ᠠᠷᠤᠨ ᠬᠣᠰᠢᠭᠤ # Арун хошуу
313
+ expected: arun hosigu
314
+ - source: ᠶᠤᠸᠠᠨ ᠪᠣᠣ ᠱᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Юаньбаошань тойрог
315
+ expected: yuwan boo xan togorig
316
+ - source: ᠰᠢᠯᠤᠭᠤᠨ ᠬᠥᠪᠡᠭᠡᠲᠦ ᠴᠠᠭᠠᠨ ᠬᠣᠰᠢᠭᠤ # Шулуун Хөвөөт Цагаан хошуу
317
+ expected: silugun hobegetu qagan hosigu
318
+ - source: ᠰᠢᠯᠤᠭᠤᠨ ᠬᠥᠬᠡ ᠬᠣᠰᠢᠭᠤ # Шулуун хөх хошуу
319
+ expected: silugun hohe hosigu
320
+ - source: ᠤᠷᠠᠳ ᠤᠨ ᠳᠤᠮᠳᠠᠳᠤ ᠬᠣᠰᠢᠭᠤ # Урадын Дундад Хошуу
321
+ expected: urad-un dumdadu hosigu
322
+ - source: ᠤᠷᠠᠳ ᠤᠨ ᠡᠮᠦᠨᠡᠳᠦ ᠬᠣᠰᠢᠭᠤ # Урадын Өмнөд Хошуу
323
+ expected: urad-un emunedu hosigu
324
+ - source: ᠲᠣᠭᠲᠠᠬᠤ ᠰᠢᠶᠠᠨ # Тогтох шянь
325
+ expected: togtahu siyan
326
+ - source: ᠲᠠᠶᠢᠫᠤᠰᠧ ᠬᠣᠰᠢᠭᠤ # Тайвас хошуу
327
+ expected: tayipuse hosigu
328
+ - source: ᠰᠥᠨᠡᠳ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # Sonid Left Banner
329
+ expected: soned jegun hosigu
330
+ - source: ᠰᠥᠨᠡᠳ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # Sonid Right Banner
331
+ expected: soned baragun hosigu
332
+ - source: ᠣᠩᠨᠢᠭᠤᠳ ᠬᠣᠰᠢᠭᠤ # Ongniud Banner
333
+ expected: ongnigud hosigu
334
+ - source: ᠵᠠᠯᠠᠢᠳ ᠬᠣᠰᠢᠭᠤ # Jalaid Banner
335
+ expected: jalaid hosigu
336
+ - source: ᠬᠠᠩᠭᠢᠨ ᠬᠣᠶᠢᠲᠤ ᠬᠣᠰᠢᠭᠤ # Hanggin Rear Banner
337
+ expected: hanggin hoyitu hosigu
338
+ - source: ᠵᠡᠭᠦᠨ ᠤᠵᠤᠮᠤᠴᠢᠨ ᠬᠣᠰᠢᠭᠤ # East Ujimqin Banner
339
+ expected: jegun ujumuqin hosigu
340
+ - source: ᠠᠷᠤ ᠬᠣᠷᠴᠢᠨ ᠬᠣᠰᠢᠭᠤ # Ar Horqin Banner
341
+ expected: aru horqin hosigu
342
+ - source: ᠠᠪᠠᠭ᠎ᠠ ᠬᠣᠰᠢᠭᠤ # Abag Banner
343
+ expected: abag-a hosigu
344
+ - source: ᠪᠤᠷᠢᠶᠠᠳ # Буриад
345
+ expected: buriyad
346
+ - source: ᠤᠯᠠᠭᠠᠨᠪᠠᠭᠠᠲᠤᠷ # Улаанбаатар
347
+ expected: ulaganbagatur
348
+
349
+ map:
350
+
351
+ characters:
352
+ "ᠠ": "a" # \u1820
353
+ "ᠪ": "b" # \u182a
354
+ "ᠼ": "c" # \u183c
355
+ "ᠲ": "d" # \u1832
356
+ "ᠳ": "d" # \u1833
357
+ "ᠡ": "e" # \u1821
358
+ "ᠹ": "f" # \u1839
359
+ "ᠭ": "g" # \u182d
360
+ "ᠺ": "g" # \u183a
361
+ "ᠬ": "h" # \u182c
362
+ "ᠾ": "h" # \u183e
363
+ "ᠢ": "i" # \u1822
364
+ "ᠵ": "j" # \u1835
365
+ "ᠺ": "k" # \u183a
366
+ "ᠯ": "l" # \u182f
367
+ "ᠮ": "m" # \u182e
368
+ "ᠨ": "n" # \u1828
369
+ "ᠥ": "o" # \u1825
370
+ "ᠫ": "p" # \u182b
371
+ "ᠴ": "q" # \u1834
372
+ "ᠷ": "r" # \u1837
373
+ "ᠰ": "s" # \u1830
374
+ "ᠲ": "t" # \u1832
375
+ "ᠦ": "u" # \u1826
376
+ "ᠸ": "w" # \u1838
377
+ "ᠱ": "x" # \u1831
378
+ "ᠶ": "y" # \u1836
379
+ "ᠽ": "z" # \u183d
380
+ "ᠣ": "o" # \u1823
381
+ # - "o" # General use
382
+ # - "ô" # For place names
383
+ "ᠤ": "u" # \u1824
384
+ # - "u" # General use
385
+ # - "û" # For place names
386
+ "ᠧ": "e" # \u1827
387
+ "ᠩ": "ng" # \u1829
388
+ "\u180e": "-" # MVS
389
+ "\u202f": "-" # NNBSP