interscript 0.1.7 → 2.1.0b1

Sign up to get free protection for your applications and to get access to all the features.
Files changed (314) hide show
  1. checksums.yaml +4 -4
  2. data/.gitignore +11 -0
  3. data/.rspec +3 -0
  4. data/Gemfile +29 -0
  5. data/LICENSE.adoc +31 -0
  6. data/README.md +3 -0
  7. data/Rakefile +116 -0
  8. data/bin/console +14 -0
  9. data/bin/interscript +5 -0
  10. data/bin/maps_analyze_staging +168 -0
  11. data/bin/maps_debug_compilers +58 -0
  12. data/bin/maps_debug_ordering +88 -0
  13. data/bin/maps_debug_ruby_compile +24 -0
  14. data/bin/maps_debug_step_by_step +44 -0
  15. data/bin/maps_optimize_order +112 -0
  16. data/bin/maps_v1_analyze_regexps +45 -0
  17. data/bin/maps_v1_to_v2 +426 -0
  18. data/bin/setup +8 -0
  19. data/exe/interscript +6 -0
  20. data/interscript.gemspec +31 -0
  21. data/lib/interscript.rb +83 -133
  22. data/lib/interscript/command.rb +5 -5
  23. data/lib/interscript/compiler.rb +22 -0
  24. data/lib/interscript/compiler/javascript.rb +292 -0
  25. data/lib/interscript/compiler/ruby.rb +262 -0
  26. data/lib/interscript/dsl.rb +68 -0
  27. data/lib/interscript/dsl/aliases.rb +23 -0
  28. data/lib/interscript/dsl/document.rb +46 -0
  29. data/lib/interscript/dsl/group.rb +45 -0
  30. data/lib/interscript/dsl/group/parallel.rb +6 -0
  31. data/lib/interscript/dsl/items.rb +89 -0
  32. data/lib/interscript/dsl/metadata.rb +68 -0
  33. data/lib/interscript/dsl/stage.rb +6 -0
  34. data/lib/interscript/dsl/symbol_mm.rb +11 -0
  35. data/lib/interscript/dsl/tests.rb +12 -0
  36. data/lib/interscript/interpreter.rb +251 -0
  37. data/lib/interscript/node.rb +25 -0
  38. data/lib/interscript/node/alias_def.rb +15 -0
  39. data/lib/interscript/node/dependency.rb +13 -0
  40. data/lib/interscript/node/document.rb +45 -0
  41. data/lib/interscript/node/group.rb +34 -0
  42. data/lib/interscript/node/group/parallel.rb +9 -0
  43. data/lib/interscript/node/group/sequential.rb +2 -0
  44. data/lib/interscript/node/item.rb +52 -0
  45. data/lib/interscript/node/item/alias.rb +42 -0
  46. data/lib/interscript/node/item/any.rb +76 -0
  47. data/lib/interscript/node/item/capture.rb +50 -0
  48. data/lib/interscript/node/item/group.rb +51 -0
  49. data/lib/interscript/node/item/repeat.rb +40 -0
  50. data/lib/interscript/node/item/stage.rb +23 -0
  51. data/lib/interscript/node/item/string.rb +51 -0
  52. data/lib/interscript/node/metadata.rb +18 -0
  53. data/lib/interscript/node/rule.rb +6 -0
  54. data/lib/interscript/node/rule/funcall.rb +18 -0
  55. data/lib/interscript/node/rule/run.rb +15 -0
  56. data/lib/interscript/node/rule/sub.rb +68 -0
  57. data/lib/interscript/node/stage.rb +19 -0
  58. data/lib/interscript/node/tests.rb +15 -0
  59. data/lib/interscript/stdlib.rb +211 -0
  60. data/lib/interscript/utils/regexp_converter.rb +283 -0
  61. data/lib/interscript/version.rb +1 -1
  62. data/lib/interscript/visualize.rb +61 -0
  63. data/lib/interscript/visualize/group.html.erb +59 -0
  64. data/lib/interscript/visualize/json.rb +57 -0
  65. data/lib/interscript/visualize/map.html.erb +46 -0
  66. data/lib/interscript/visualize/nodes.rb +89 -0
  67. data/requirements.txt +1 -0
  68. metadata +78 -416
  69. data/README.adoc +0 -298
  70. data/lib/g2pwrapper.py +0 -34
  71. data/lib/interscript/fs.rb +0 -69
  72. data/lib/interscript/mapping.rb +0 -142
  73. data/lib/interscript/opal.rb +0 -57
  74. data/lib/interscript/opal/entrypoint.rb +0 -12
  75. data/lib/interscript/opal/map_translate.rb +0 -7
  76. data/lib/interscript/opal/maps.js.erb +0 -10
  77. data/lib/model-7 +0 -0
  78. data/lib/tha-pt-b-7 +0 -0
  79. data/maps/acadsin-zho-Hani-Latn-2002.yaml +0 -38916
  80. data/maps/alalc-amh-Ethi-Latn-1997.yaml +0 -513
  81. data/maps/alalc-amh-Ethi-Latn-2011.yaml +0 -138
  82. data/maps/alalc-ara-Arab-Latn-1997.yaml +0 -1287
  83. data/maps/alalc-asm-Deva-Latn-1997.yaml +0 -165
  84. data/maps/alalc-asm-Deva-Latn-2012.yaml +0 -40
  85. data/maps/alalc-aze-Cyrl-Latn-1997.yaml +0 -145
  86. data/maps/alalc-bel-Cyrl-Latn-1997.yaml +0 -129
  87. data/maps/alalc-ben-Beng-Latn-2017.yaml +0 -130
  88. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +0 -98
  89. data/maps/alalc-ell-Grek-Latn-1997.yaml +0 -628
  90. data/maps/alalc-ell-Grek-Latn-2010.yaml +0 -626
  91. data/maps/alalc-guj-Gujr-Latn-1997.yaml +0 -266
  92. data/maps/alalc-guj-Gujr-Latn-2011.yaml +0 -64
  93. data/maps/alalc-hin-Deva-Latn-1997.yaml +0 -211
  94. data/maps/alalc-hin-Deva-Latn-2011.yaml +0 -47
  95. data/maps/alalc-kat-Geok-Latn-1997.yaml +0 -111
  96. data/maps/alalc-kat-Geor-Latn-1997.yaml +0 -150
  97. data/maps/alalc-kor-Hang-Latn-1997.yaml +0 -98
  98. data/maps/alalc-mal-Mlym-Latn-1997.yaml +0 -303
  99. data/maps/alalc-mal-Mlym-Latn-2012.yaml +0 -73
  100. data/maps/alalc-mar-Deva-Latn-1997.yaml +0 -189
  101. data/maps/alalc-mar-Deva-Latn-2011.yaml +0 -45
  102. data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +0 -114
  103. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +0 -103
  104. data/maps/alalc-mon-Cyrl-Latn-1997.yaml +0 -220
  105. data/maps/alalc-pan-Guru-Latn-1997.yaml +0 -256
  106. data/maps/alalc-pan-Guru-Latn-2011.yaml +0 -78
  107. data/maps/alalc-per-Arab-Latn-1997.yaml +0 -375
  108. data/maps/alalc-pli-Deva-Latn-2012.yaml +0 -144
  109. data/maps/alalc-pra-Deva-Latn-2012.yaml +0 -47
  110. data/maps/alalc-rus-Cyrl-Latn-1997.yaml +0 -225
  111. data/maps/alalc-rus-Cyrl-Latn-2012.yaml +0 -162
  112. data/maps/alalc-san-Deva-Latn-2012.yaml +0 -172
  113. data/maps/alalc-sin-Sinh-Latn-1997.yaml +0 -292
  114. data/maps/alalc-sin-Sinh-Latn-2011.yaml +0 -71
  115. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +0 -118
  116. data/maps/alalc-srp-Cyrl-Latn-2013.yaml +0 -135
  117. data/maps/alalc-tam-Taml-Latn-1997.yaml +0 -62
  118. data/maps/alalc-tam-Taml-Latn-2011.yaml +0 -58
  119. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +0 -145
  120. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +0 -16
  121. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +0 -283
  122. data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +0 -174
  123. data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +0 -169
  124. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +0 -292
  125. data/maps/bgn-kor-Hang-Latn-1943.yaml +0 -35
  126. data/maps/bgn-kor-Kore-Latn-1943.yaml +0 -31
  127. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +0 -208
  128. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +0 -208
  129. data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +0 -532
  130. data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +0 -596
  131. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +0 -108
  132. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +0 -104
  133. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +0 -188
  134. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +0 -289
  135. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +0 -119
  136. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +0 -42
  137. data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +0 -184
  138. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +0 -705
  139. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +0 -23
  140. data/maps/bgnpcgn-fas-Arab-Latn-1956.yaml +0 -96
  141. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +0 -257
  142. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +0 -131
  143. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +0 -42
  144. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +0 -253
  145. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +0 -48
  146. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +0 -48
  147. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +0 -163
  148. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +0 -190
  149. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +0 -223
  150. data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +0 -230
  151. data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +0 -336
  152. data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +0 -639
  153. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +0 -459
  154. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +0 -168
  155. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +0 -318
  156. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +0 -170
  157. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +0 -220
  158. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +0 -240
  159. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +0 -166
  160. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +0 -119
  161. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +0 -127
  162. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +0 -82
  163. data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +0 -7456
  164. data/maps/bis-asm-Beng-Latn-13194-1991.yaml +0 -159
  165. data/maps/bis-ben-Beng-Latn-13194-1991.yaml +0 -156
  166. data/maps/bis-dev-Deva-Latn-13194-1991.yaml +0 -184
  167. data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +0 -181
  168. data/maps/bis-knd-Knda-Latn-13194-1991.yaml +0 -173
  169. data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +0 -176
  170. data/maps/bis-ori-Orya-Latn-13194-1991.yaml +0 -160
  171. data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +0 -175
  172. data/maps/bis-tel-Telu-Latn-13194-1991.yaml +0 -170
  173. data/maps/bis-tml-Taml-Latn-13194-1991.yaml +0 -155
  174. data/maps/by-bel-Cyrl-Latn-1998.yaml +0 -172
  175. data/maps/by-bel-Cyrl-Latn-2007.yaml +0 -115
  176. data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +0 -899
  177. data/maps/din-hin-Deva-Latn-33904-2018.yaml +0 -100
  178. data/maps/din-kat-Geor-Latn-32707-2010.yaml +0 -145
  179. data/maps/din-mar-Deva-Latn-33904-2018.yaml +0 -84
  180. data/maps/din-nep-Deva-Latn-33904-2018.yaml +0 -119
  181. data/maps/din-pli-Deva-Latn-33904-2018.yaml +0 -75
  182. data/maps/din-pra-Deva-Latn-33904-2018.yaml +0 -63
  183. data/maps/din-san-Deva-Latn-33904-2018.yaml +0 -338
  184. data/maps/din-tam-Taml-Latn-33903-2016.yaml +0 -213
  185. data/maps/dos-nep-Deva-Latn-1997.yaml +0 -47
  186. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +0 -684
  187. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +0 -680
  188. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +0 -19
  189. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +0 -31
  190. data/maps/ggg-kat-Geor-Latn-2002.yaml +0 -92
  191. data/maps/gki-bel-Cyrl-Latn-1992.yaml +0 -33
  192. data/maps/gki-bel-Cyrl-Latn-2000.yaml +0 -201
  193. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +0 -190
  194. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +0 -157
  195. data/maps/hk-yue-Hani-Latn-1888.yaml +0 -38497
  196. data/maps/icao-bel-Cyrl-Latn-9303.yaml +0 -136
  197. data/maps/icao-bul-Cyrl-Latn-9303.yaml +0 -118
  198. data/maps/icao-fas-Arab-Latn-9303.yaml +0 -103
  199. data/maps/icao-heb-Hebr-Latn-9303.yaml +0 -151
  200. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +0 -117
  201. data/maps/icao-rus-Cyrl-Latn-9303.yaml +0 -117
  202. data/maps/icao-srp-Cyrl-Latn-9303.yaml +0 -117
  203. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +0 -119
  204. data/maps/iso-ara-Arab-Latn-233-1984.yaml +0 -323
  205. data/maps/iso-asm-Beng-Latn-15919-2001.yaml +0 -75
  206. data/maps/iso-ben-Beng-Latn-15919-2001.yaml +0 -175
  207. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +0 -613
  208. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +0 -44
  209. data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +0 -220
  210. data/maps/iso-hin-Deva-Latn-15919-2001.yaml +0 -87
  211. data/maps/iso-inc-Deva-Latn-15919-2001.yaml +0 -61
  212. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +0 -66
  213. data/maps/iso-kan-Knda-Latn-15919-2001.yaml +0 -220
  214. data/maps/iso-kat-Geor-Latn-9984-1996.yaml +0 -145
  215. data/maps/iso-kor-Hang-Latn-1996-method1.yaml +0 -240
  216. data/maps/iso-kor-Hang-Latn-1996-method2.yaml +0 -226
  217. data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +0 -281
  218. data/maps/iso-mar-Deva-Latn-15919-2001.yaml +0 -75
  219. data/maps/iso-nep-Deva-Latn-15919-2001.yaml +0 -87
  220. data/maps/iso-ori-Orya-Latn-15919-2001.yaml +0 -193
  221. data/maps/iso-pan-Guru-Latn-15919-2001.yaml +0 -222
  222. data/maps/iso-pli-Beng-Latn-15919-2001.yaml +0 -73
  223. data/maps/iso-pli-Deva-Latn-15919-2001.yaml +0 -74
  224. data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +0 -219
  225. data/maps/iso-pli-Thai-Latn-15919-2001.yaml +0 -55
  226. data/maps/iso-pra-Deva-Latn-15919-2001.yaml +0 -59
  227. data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +0 -366
  228. data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +0 -271
  229. data/maps/iso-san-Deva-Latn-15919-2001.yaml +0 -220
  230. data/maps/iso-tam-Taml-Latn-15919-2001.yaml +0 -159
  231. data/maps/iso-tel-Telu-Latn-15919-2001.yaml +0 -220
  232. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +0 -109
  233. data/maps/kp-kor-Hang-Latn-2002.yaml +0 -909
  234. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +0 -44820
  235. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +0 -411
  236. data/maps/mns-mon-Cyrl-Latn-5217-2012.yaml +0 -163
  237. data/maps/mns-mon-Latn-Cyrl-5217-2012.yaml +0 -200
  238. data/maps/moct-kor-Hang-Latn-2000.yaml +0 -807
  239. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +0 -541
  240. data/maps/mvd-bel-Cyrl-Latn-2008.yaml +0 -225
  241. data/maps/mvd-bel-Cyrl-Latn-2010.yaml +0 -63
  242. data/maps/mvd-rus-Cyrl-Latn-2008.yaml +0 -109
  243. data/maps/mvd-rus-Cyrl-Latn-2010.yaml +0 -37
  244. data/maps/odni-ara-Arab-Latn-2015.yaml +0 -425
  245. data/maps/odni-aze-Cyrl-Latn-2015.yaml +0 -144
  246. data/maps/odni-bel-Cyrl-Latn-2015.yaml +0 -148
  247. data/maps/odni-bul-Cyrl-Latn-2015.yaml +0 -96
  248. data/maps/odni-che-Cyrl-Latn-2015.yaml +0 -169
  249. data/maps/odni-fas-Arab-Latn-2015.yaml +0 -406
  250. data/maps/odni-hin-Deva-Latn-2015.yaml +0 -258
  251. data/maps/odni-kat-Geor-Latn-2015.yaml +0 -87
  252. data/maps/odni-kaz-Cyrl-Latn-2015.yaml +0 -148
  253. data/maps/odni-kir-Cyrl-Latn-2015.yaml +0 -136
  254. data/maps/odni-kor-Hang-Latn-2015.yaml +0 -375
  255. data/maps/odni-mkd-Cyrl-Latn-2015.yaml +0 -122
  256. data/maps/odni-per-Arab-Latn-2015.yaml +0 -228
  257. data/maps/odni-rus-Cyrl-Latn-2015.yaml +0 -77
  258. data/maps/odni-srp-Cyrl-Latn-2015.yaml +0 -129
  259. data/maps/odni-tat-Cyrl-Latn-2015.yaml +0 -142
  260. data/maps/odni-tgk-Cyrl-Latn-2015.yaml +0 -148
  261. data/maps/odni-uig-Cyrl-Latn-2015.yaml +0 -138
  262. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +0 -157
  263. data/maps/odni-urd-Arab-Latn-2015.yaml +0 -221
  264. data/maps/odni-uzb-Cyrl-Latn-2015.yaml +0 -166
  265. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +0 -90
  266. data/maps/royin-tha-Thai-Latn-1968.yaml +0 -183
  267. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +0 -180
  268. data/maps/royin-tha-Thai-Latn-1999.yaml +0 -80
  269. data/maps/sac-zho-Hans-Latn-1979.yaml +0 -24763
  270. data/maps/sasm-mon-Mong-Latn-general-1978.yaml +0 -389
  271. data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +0 -354
  272. data/maps/ses-ara-Arab-Latn-1930.yaml +0 -283
  273. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +0 -222
  274. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +0 -197
  275. data/maps/ua-ukr-Cyrl-Latn-2007.yaml +0 -75
  276. data/maps/ua-ukr-Cyrl-Latn-2010.yaml +0 -192
  277. data/maps/un-amh-Ethi-Latn-2016.yaml +0 -602
  278. data/maps/un-ara-Arab-Latn-1971.yaml +0 -139
  279. data/maps/un-ara-Arab-Latn-1972.yaml +0 -159
  280. data/maps/un-ara-Arab-Latn-2017.yaml +0 -420
  281. data/maps/un-bel-Cyrl-Latn-2007.yaml +0 -114
  282. data/maps/un-ben-Beng-Latn-2016.yaml +0 -534
  283. data/maps/un-ell-Grek-Latn-1987-phonetic.yaml +0 -780
  284. data/maps/un-ell-Grek-Latn-1987-tl.yaml +0 -31
  285. data/maps/un-ell-Grek-Latn-1987-ts.yaml +0 -19
  286. data/maps/un-hin-Deva-Latn-2016.yaml +0 -222
  287. data/maps/un-mar-Deva-Latn-2016.yaml +0 -91
  288. data/maps/un-mon-Mong-Latn-general-2013.yaml +0 -264
  289. data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +0 -264
  290. data/maps/un-nep-Deva-Latn-1972.yaml +0 -350
  291. data/maps/un-nep-Deva-Latn-2013.yaml +0 -74
  292. data/maps/un-rus-Cyrl-Latn-1987.yaml +0 -166
  293. data/maps/un-ukr-Cyrl-Latn-1998.yaml +0 -53
  294. data/maps/un-ukr-Cyrl-Latn-2012.yaml +0 -162
  295. data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +0 -221
  296. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +0 -406
  297. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +0 -386
  298. data/maps/var-kor-Hang-Hang-jamo.yaml +0 -11193
  299. data/maps/var-kor-Hang-Latn-mr-1939.yaml +0 -1054
  300. data/maps/var-kor-Kore-Hang-2013.yaml +0 -59754
  301. data/maps/var-kor-Kore-Latn-mr-1939.yaml +0 -36
  302. data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +0 -43
  303. data/maps/var-mon-Mong-Latn-1930.yaml +0 -102
  304. data/maps/var-mon-Mong-Latn-lessing.yaml +0 -272
  305. data/maps/var-mon-Mong-Latn-vpmc.yaml +0 -274
  306. data/maps/var-pra-Deva-Latn-iast-1912.yaml +0 -30
  307. data/maps/var-san-Deva-Latn-iast-1912.yaml +0 -149
  308. data/maps/var-tha-Thai-Thai-phonemic.yaml +0 -59
  309. data/maps/var-tha-Thai-Zsym-ipa.yaml +0 -301
  310. data/maps/var-zho-Hani-Latn-wd-1979.yaml +0 -38912
  311. data/spec/interscript/filenames_spec.rb +0 -384
  312. data/spec/interscript/mapping_spec.rb +0 -42
  313. data/spec/interscript_spec.rb +0 -29
  314. data/spec/spec_helper.rb +0 -3
@@ -1,31 +0,0 @@
1
- ---
2
- authority_id: un
3
- id: 1987-tl
4
- language: iso-639-2:ell
5
- source_script: Grek
6
- destination_script: Latn
7
- name: UNGEGN Greek v4.0
8
- url: http://www.eki.ee/wgrs/rom1_el.htm
9
- creation_date: 1987
10
- description: |
11
- UNGEGN Romanization table for Greek
12
-
13
- note:
14
- - Transliteration version (reversible). Also appears in annex B of ISO 843:1997. Originates in v1.0 of UNGEGN transliteration, 1987. This likely was the intended system in ELOT 743:1982 for transliteration, but the reversible character diacritics are missing from the document, and the document does not indicate what they were supposed to be.
15
-
16
- tests:
17
-
18
- - source: |
19
- Ένα πράμα μόνον με παρακίνησε κι εμένα να γράψω ότι τούτην την πατρίδα την έχομεν όλοι μαζί, και σοφοί κι αμαθείς και πλούσιοι και φτωχοί και πολιτικοί και στρατιωτικοί και οι πλέον μικρότεροι άνθρωποι· όσοι αγωνιστήκαμεν, αναλόγως ο καθείς, έχομεν να ζήσομεν εδώ. Το λοιπόν δουλέψαμεν όλοι μαζί, να την φυλάμεν κι όλοι μαζί και να μην λέγει ούτε ο δυνατός «εγώ» ούτε ο αδύνατος. Ξέρετε πότε να λέγει ο καθείς «εγώ»; Όταν αγωνιστεί μόνος του και φκιάσει ή χαλάσει, να λέγει «εγώ»· όταν όμως αγωνίζονται πολλοί και φκιάνουν, τότε να λένε «εμείς». Είμαστε εις το «εμείς» κι όχι εις το «εγώ». Και εις το εξής να μάθομεν γνώση, αν θέλομεν να φκιάσομεν χωριόν, να ζήσομεν όλοι μαζί.
20
-
21
- Γιάννης Μακρυγιάννης.
22
-
23
- expected: |
24
- Éna práma mónon me parakíni̱se ki eména na grápso̱ óti toúti̱n ti̱n patrída ti̱n échomen óloi mazí, kai sofoí ki amatheís kai ploúsioi kai fto̱choí kai politikoí kai stratio̱tikoí kai oi pléon mikróteroi ánthro̱poi; ósoi ago̱nistí̱kamen, analógo̱s o katheís, échomen na zí̱somen edó̱. To loipón doulépsamen óloi mazí, na ti̱n fylámen ki óloi mazí kai na mi̱n légei oúte o dynatós «egó̱» oúte o adýnatos. Xérete póte na légei o katheís «egó̱»? Ótan ago̱nisteí mónos tou kai fkiásei í̱ chalásei, na légei «egó̱»; ótan ómo̱s ago̱nízontai polloí kai fkiánoun, tóte na léne «emeís». Eímaste eis to «emeís» ki óchi eis to «egó̱». Kai eis to exí̱s na máthomen gnó̱si̱, an thélomen na fkiásomen cho̱rión, na zí̱somen óloi mazí.
25
-
26
- Giánni̱s Makrygiánni̱s.
27
-
28
- map:
29
- character_separator: ""
30
- word_separator: " "
31
- inherit: "elot-ell-Grek-Latn-743-1982-tl"
@@ -1,19 +0,0 @@
1
- ---
2
- authority_id: un
3
- id: 1987-tl
4
- language: iso-639-2:ell
5
- source_script: Grek
6
- destination_script: Latn
7
- name: UNGEGN Greek v4.0
8
- url: http://www.eki.ee/wgrs/rom1_el.htm
9
- creation_date: 1987
10
- description: |
11
- UNGEGN Romanization table for Greek
12
-
13
- note:
14
- - Transcription version
15
-
16
- map:
17
- character_separator: ""
18
- word_separator: " "
19
- inherit: "elot-ell-Grek-Latn-743-1982-ts"
@@ -1,222 +0,0 @@
1
- ---
2
- authority_id: ungegn
3
- id: 2016
4
- language: iso-639-2:hin
5
- source_script: Deva
6
- destination_script: Latn
7
- name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Hindi Romanization, 1972
8
- url: https://www.eki.ee/wgrs/rom1_hi.pdf
9
- creation_date: 1972
10
- confirmation_date: 2016
11
- description: |
12
- The United Nations recommended system was approved in 1972 (II/11) and amended in 1977
13
- (III/12), based on a report prepared by D. N. Sharma. The tables and their corrections were
14
- published in volume II of the conference reports.
15
-
16
- There is no evidence of the use of the system either in India or in international cartographic
17
- products. It was stated in 1987 that the appropriate resolution had not been implemented in
18
- India and the Hunterian system was still in use in large-scale mapping.
19
-
20
- Hindi uses the alphasyllabic script Devanāgarī whereby each character represents a syllable
21
- rather than one sound. Vowels and diphthongs are marked in two ways: as independent
22
- characters (used syllable-initially) and in an abbreviated form, to denote vowels after
23
- consonants. The romanization table is unambiguous but the user would have to recognize
24
- many ligatures not given in the original table (only three are given). The system is mostly
25
- reversible but there may exist some ambiguities in the romanization of vowels (independent
26
- vs. abbreviated characters) and consonants.
27
-
28
- notes:
29
- - |
30
- It is recommended that the vowel अ (a) should always be romanized except when it ends a
31
- name. If a name ends with a consonant, the consonant should carry a sub-macron. Such
32
- cases, however, will be very rare. For example, कानपुर Kānapur (not Kānapura), जगत्
33
- Jagaṯ.
34
- - |
35
- If each letter of a digraph or any two parts of a trigraph has a distinct independent sound
36
- then it should be indicated by a hyphen, thus d-h.
37
-
38
- tests:
39
- - source: "परिपक्क"
40
- expected: "paraipakka"
41
- - source: "जगत्"
42
- expected: "jagat"
43
- - source: "संख्या"
44
- expected: "saṁkhyaā"
45
- - source: "गंभीर मरीजों के मामले में भारत दूसरे नंबर पर"
46
- expected: "gaṁbhaīra maraījaoṁ kae maāmalae maeṁ bhaārata daūsarae naṁbara para"
47
- - source: "कोरोना अपडेट्स"
48
- expected: "kaoraonaā apaḍaeṭsa"
49
- - source: "सीडीसी चीफ का बयान अहम"
50
- expected: "saīḍaīsaī chaīpha kaā bayaāna ahama"
51
- - source: "गूगल प्ले स्टोर पर पेटीएम की वापसी"
52
- expected: "gaūgala plae sṭaora para paeṭaīema kaī vaāpasaī"
53
- - source: "भारत में गैंबलिंग की इजाजत नहीं"
54
- expected: "bhaārata maeṁ gaaiṁbalaiṁga kaī ijaājata nahaīṁ"
55
- - source: "कोरोना वैक्सीन मुद्दे पर घिरे राष्ट्रपति; जो बाइडेन बोले- मुझे और देश को वैज्ञानिकों पर भरोसा है, डोनाल्ड ट्रम्प पर नहीं"
56
- expected: "kaoraonaā vaaiksaīna mauddae para ghairae raāṣhṭrapatai; jao baāiḍaena baolae- maujhae aura daesha kao vaaijñaānaikaoṁ para bharaosaā haai, ḍaonaālḍa ṭrampa para nahaīṁ"
57
- - source: "गूगल की कार्रवाई पर पेटीएम ने कहा था कि ऐप को अस्थायी तौर पर प्ले-स्टोर से हटाया गया है, आपके पैसे सुरक्षित हैं"
58
- expected: "gaūgala kaī kaārravaāī para paeṭaīema nae kahaā thaā kai aipa kao asthaāyaī taaura para plae-sṭaora sae haṭaāyaā gayaā haai, āpakae paaisae saurakṣhaita haaiṁ"
59
- map:
60
-
61
- characters:
62
-
63
- # I. Independent vowel characters
64
- 'अ': 'a'
65
- 'आ': 'ā'
66
- 'इ': 'i'
67
- 'ई': 'ī'
68
- 'उ': 'u'
69
- 'ऊ': 'ū'
70
- 'ऋ': 'ṛ'
71
- 'ॠ': 'ṝ'
72
- 'ऌ': 'l̤'
73
- 'ए': 'e'
74
- 'ऐ': 'ai'
75
- 'ओ': 'o'
76
- 'औ': 'au'
77
-
78
- # II. Abbreviated vowel characters
79
-
80
- 'ा': "ā" # का
81
- 'ॉ': "ā̆ " # additional mark: कॉ
82
- 'ि': "i" # कि i
83
- 'ी': "ī" # की
84
- 'ु': "u" # कु
85
- 'ू': "ū" # कू
86
- 'ृ': "ṛ" # कृ
87
- 'े': "e" # के
88
- 'ै': "ai" # कै
89
- 'ो': "o" # को
90
- 'ौ': "au" # कौ
91
-
92
-
93
- # Consonants (see Note 1)
94
-
95
- # Gutturals
96
- 'क': 'ka'
97
- 'ख': 'kha'
98
- 'ग': 'ga'
99
- 'घ': 'gha'
100
- 'ङ': 'ṅa'
101
-
102
- # Palatals
103
- 'च': 'cha'
104
- 'छ': 'chha'
105
- 'ज': 'ja'
106
- 'झ': 'jha'
107
- 'ञ': 'ña'
108
-
109
- # Cerebrals
110
- 'ट': 'ṭa'
111
- 'ठ': 'ṭha'
112
- 'ड': 'ḍa'
113
- 'ढ': 'ḍha'
114
- 'ण': 'ṇa'
115
-
116
- # Dentals
117
- 'त': 'ta'
118
- 'थ': 'tha'
119
- 'द': 'da'
120
- 'ध': 'dha'
121
- 'न': 'na'
122
-
123
- # Labials
124
- 'प': 'pa'
125
- 'फ': 'pha'
126
- 'ब': 'ba'
127
- 'भ': 'bha'
128
- 'म': 'ma'
129
-
130
- # Semivowels
131
- 'य': 'ya'
132
- 'र': 'ra'
133
- 'ल': 'la'
134
- 'व': 'va'
135
-
136
- # Sibilants
137
- 'श': 'sha'
138
- 'ष': 'ṣha'
139
- 'स': 'sa'
140
-
141
- # Dotted variants
142
- 'क़': 'qa'
143
- 'ख़': 'ḳha'
144
- 'ग़': 'ġa'
145
- 'ज़': 'za'
146
- 'ड़': 'ṙa'
147
- 'ढ़': 'ṙha'
148
- 'फ़': 'fa'
149
-
150
-
151
- # Aspirate
152
- 'ह': 'ha'
153
-
154
- # Anusvāra
155
- 'ं': 'ṁ'
156
-
157
- # Anunāsika
158
- 'ँ': 'm̐'
159
-
160
- # halanta
161
- '्': ''
162
-
163
- # bisharga
164
- 'ः' : 'ḥ'
165
-
166
- # V. Ligatures (to cover all ligatures in Unicode)
167
- # Implementing pronunciation without a vowel: क् k.
168
-
169
- # Gutturals
170
- 'क्': 'k'
171
- 'ख्': 'kh'
172
- 'ग्': 'g'
173
- 'घ्': 'gh'
174
- 'ङ्': 'ṅ'
175
-
176
- # Palatals
177
- 'च्': 'ch'
178
- 'छ्': 'chh'
179
- 'ज्': 'j'
180
- 'झ्': 'jh'
181
- 'ञ्': 'ñ'
182
-
183
- # Cerebrals
184
- 'ट्': 'ṭ'
185
- 'ठ्': 'ṭh'
186
- 'ड्': 'ḍ'
187
- 'ढ्': 'ḍh'
188
- 'ण्': 'ṇ'
189
-
190
- # Dentals
191
- 'त्': 't'
192
- 'थ्': 'th'
193
- 'द्': 'd'
194
- 'ध्': 'dh'
195
- 'न्': 'n'
196
-
197
- # Labials
198
- 'प्': 'p'
199
- 'फ्': 'ph'
200
- 'ब्': 'b'
201
- 'भ्': 'bh'
202
- 'म्': 'm'
203
-
204
- # Semivowels
205
- 'य्': 'y'
206
- 'र्': 'r'
207
- 'ल्': 'l'
208
- 'व्': 'v'
209
-
210
- # Sibilants
211
- 'श्': 'sh'
212
- 'ष्': 'ṣh'
213
- 'स्': 's'
214
-
215
- # Dotted variants
216
- 'क़्': 'q'
217
- 'ख़्': 'ḳh'
218
- 'ग़्': 'ġ'
219
- 'ज़्': 'z'
220
- 'ड़्': 'ṙ'
221
- 'ढ़्': 'ṙh'
222
- 'फ़्': 'f'
@@ -1,91 +0,0 @@
1
- ---
2
- authority_id: ungegn
3
- id: 2016
4
- language: iso-639-2:hin
5
- source_script: Deva
6
- destination_script: Latn
7
- name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Marathi Romanization, 1972
8
- url: https://www.eki.ee/wgrs/rom1_mr.pdf
9
- creation_date: 1972
10
- confirmation_date: 2016
11
- description: |
12
- The United Nations recommended system was approved in 1972 (II/11) and amended in 1977
13
- (III/12), based on a report prepared by D. N. Sharma. The tables and their corrections were
14
- published in volume II of the conference reports.
15
-
16
- There is no evidence of the use of the system either in India or in international cartographic
17
- products.
18
-
19
- Marathi (Marāṭhī) uses the alphasyllabic script Devanāgarī.
20
-
21
- notes:
22
- - |
23
- Additional characters (absent in Hindi):
24
- ळ ḷa
25
- ऍ ă (abbreviated: कॅ kă)
26
-
27
- - |
28
- Ligatures may be formed with r as the first component: 'ऱ्य': 'rya' 'ऱ्ह': 'rha'
29
- - |
30
- Typical are ligatures ending in h: न्ह nh, म्ह mh, ल्ह lh, व्ह vh.
31
- - |
32
- The following independent characters are sometimes used: अि i, अी ī, अु u, अू ū, अे e, अै ai.
33
-
34
- tests:
35
- - source: "परिपक्क"
36
- expected: "paraipakka"
37
- - source: "ठाणे - जिल्ह्यात बुधवारी एक हजार रुग्णांची वाढ, तर जणांच्या मृत्यूची नोंद"
38
- expected: "ṭhaāṇae - jailhayaāta baudhavaāraī eka hajaāra raugṇaāṁchaī vaāḍha, tara jaṇaāṁchyaā maṛtyaūchaī naoṁda"
39
- - source: "एकता कपूर पुन्हा अडकली वादात, वेबसीरिजमधल्या 'त्या' सीनमुळे जमावाची घरावर दगडफेक"
40
- expected: "ekataā kapaūra paunhaā aḍakalaī vaādaāta, vaebasaīraijamadhalyaā 'tyaā' saīnamauḷae jamaāvaāchaī gharaāvara dagaḍaphaeka"
41
- - source: "जाणून घ्या, बीएमसीच्या अधिकाऱ्यांनी कंगना राणौतच्या ऑफिसमधले नक्की काय- काय तोडलं"
42
- expected: "jaāṇaūna ghyaā, baīemasaīchyaā adhaikaāryaāṁnaī kaṁganaā raāṇaautachyaā ôphaisamadhalae nakkaī kaāya- kaāya taoḍalaṁ"
43
- - source: "कंगना मुंबईत दाखल होण्यापूर्वी 'मातोश्री'वरून फर्मान सुटले; प्रवक्त्यांना सक्त आदेश"
44
- expected: "kaṁganaā mauṁbaīta daākhala haoṇyaāpaūrvaī 'maātaoshraī'varaūna pharmaāna sauṭalae; pravaktyaāṁnaā sakta ādaesha"
45
- - source: "मराठा आरक्षणास तात्पुरती स्थगिती; सर्वोच्च न्यायालयाचा निर्णय"
46
- expected: "maraāṭhaā ārakṣhaṇaāsa taātpaurataī sthagaitaī; sarvaochcha nyaāyaālayaāchaā nairṇaya"
47
- - source: "भारताच्या तिन्ही लशींचा पहिला टप्पा यशस्वी, वाचा कधी येणार बाजारात"
48
- expected: "bhaārataāchyaā tainhaī lashaīṁchaā pahailaā ṭappaā yashasvaī, vaāchaā kadhaī yaeṇaāra baājaāraāta"
49
- - source: "रुग्णवाढीमुळे खाटांची चणचण"
50
- expected: "raugṇavaāḍhaīmauḷae khaāṭaāṁchaī chaṇachaṇa"
51
- - source: "पीएम स्वनिधी कर्ज योजनेला मुंबईतून अल्प प्रतिसाद"
52
- expected: "paīema svanaidhaī karja yaojanaelaā mauṁbaītaūna alpa prataisaāda"
53
- - source: "सांताक्रूझ-चेंबूर लिंक रोडवरील उन्नत मार्गाला स्थगिती"
54
- expected: "saāṁtaākraūjha-chaeṁbaūra laiṁka raoḍavaraīla unnata maārgaālaā sthagaitaī"
55
- - source: "संपादक अर्णब गोस्वामी यांच्याविरूद्ध खडक पोलिस ठाण्यात तक्रार"
56
- expected: "saṁpaādaka arṇaba gaosvaāmaī yaāṁchyaāvairaūddha khaḍaka paolaisa ṭhaāṇyaāta takraāra"
57
- - source: "करणाऱ्या मुलांना अनुक्रमे प्ले ग्रूप"
58
- expected: "karaṇaāryaā maulaāṁnaā anaukramae plae graūpa"
59
- - source: "राज्यातील शाळा दिवाळीपर्यंत बंद, मंत्र्यांच्या बैठकीत निर्णय, शिक्षकांची जबाबदारी वाढली"
60
- expected: "raājyaātaīla shaāḷaā daivaāḷaīparyaṁta baṁda, maṁtryaāṁchyaā baaiṭhakaīta nairṇaya, shaikṣhakaāṁchaī jabaābadaāraī vaāḍhalaī"
61
-
62
- map:
63
- inherit: "un-hin-Deva-Latn-2016"
64
-
65
- rules:
66
- # note[3]
67
- - pattern: (?<=)\U+0939(?=\b)
68
- result: "h"
69
-
70
- characters:
71
-
72
- # Note 1
73
- 'ळ': 'ḷa'
74
- 'ऍ': 'ă'
75
-
76
- # Note 2
77
- 'ऱ': 'r' # used for making Ligatures 'ऱ्य': 'rya' 'ऱ्ह': 'rha'
78
-
79
- # Note 4
80
- 'अि': 'i'
81
- 'अी': 'ī'
82
- 'अु': 'u'
83
- 'अू': 'ū'
84
- 'अे': 'e'
85
- 'अै': 'ai'
86
-
87
- 'ॲ': 'ê'
88
- 'ऑ': 'ô'
89
-
90
-
91
-
@@ -1,264 +0,0 @@
1
- ---
2
- authority_id: un
3
- id: general-2013
4
- language: iso-639-2:mon
5
- source_script: Mong
6
- destination_script: Latn
7
- name: Mongolian Romanization in China, Version 4.0 (general)
8
- url: http://www.eki.ee/wgrs/rom1_mnc.htm
9
- creation_date: 2013-09
10
- description: |
11
- The United Nations resolution III/8 in 1977 recognized the Scheme for
12
- a Chinese Phonetic Alphabet (Pinyin) as China’s official Roman alphabet
13
- scheme and recommended the alphabet as the international system for the
14
- romanization of Chinese geographical names. In China Mongolian
15
- geographical names are transcribed directly from the Mongolian script
16
- into Pinyin. The scheme was published in Toponymic Guidelines for Map
17
- and Other Editors: China, 1982.
18
-
19
- The system is used in China and in international cartographic
20
- products.
21
-
22
- Mongolian uses a vertical script. Transcription of Mongolian names is
23
- made from their proper pronunciation based on the written form of the
24
- Mongolian language and Qahar vernacular, with Zhenglan as its
25
- representative pronunciation. Due to the complex nature of the script
26
- the romanization scheme is not reversible, e.g. the name of the city
27
- Hohhot is written ᠬᠥᠬᠡᠬᠣᠲᠠ but may be transliterated as kökeqota.
28
-
29
- notes:
30
- - The long and short Mongolian vowels are not distinguished in the
31
- spelling for general use, but in recording the pronunciation of
32
- place-names, the long vowel is represented by duplication.
33
- - Where two Roman equivalents are given, the second (in brackets) is
34
- used for recording the pronunciation of place-names while the first
35
- form is for general use.
36
- - In the table only word-initial character variants are shown.
37
- Depending on the position in the word many variants of the characters
38
- are used as well as some ligatures. These features are not covered here.
39
- - For technical reasons the characters of the Mongolian script are
40
- turned 90˚ anti-clockwise.
41
-
42
- implementation_notes:
43
- - A separated final form of vowels a or e is common, and can appear at the end
44
- of a word, word stem, or suffix. This form requires a final-shaped preceding
45
- consonant and an inter-word gap in between. The vowels themselves appear as ᠎ᠠ,
46
- and with consonants as ‍ᠬ᠎ᠠ q‑a, ‍ᠷ᠎ᠠ r‑a/r‑e, etc. This gap can be transliterated
47
- with a hyphen. In digital typesetting, these forms are triggered by inserting
48
- a U+180E ᠎ MONGOLIAN VOWEL SEPARATOR (HTML &#6158; · MVS) between the consonant
49
- and vowel.
50
- - All case suffixes, as well as any plural suffixes consisting of one or two
51
- syllables are likewise separated by a preceding and hyphen-transliterated gap.
52
- In digital typesetting, this gap is represented by a U+202F   NARROW NO-BREAK SPACE
53
- (HTML &#8239; · NNBSP). A maximum of two case suffixes can be added to a stem.
54
- Single-letter vowel suffixes appear with the final-shaped forms of a/e, i, or u/ü,
55
- as in ᠭᠠᠵᠠᠷ ᠠ γaǰar‑a 'to the country' and ᠡᠳᠦᠷ ᠡ edür‑e 'on the day', or ᠤᠯᠤᠰ ᠢ ulus‑i
56
- 'the state' etc. Multi-letter suffixes most often start with an initial- (consonants),
57
- medial- (vowels), or variant-shaped form.
58
-
59
- tests:
60
- - source: ᠣᠷᠳᠣᠰ ᠬᠣᠲᠠ # Ордос хот
61
- expected: ordos hota
62
- - source: ᠪᠠᠶᠠᠨᠨᠠᠭᠤᠷ ᠬᠣᠲᠠ # Баяннуур хот
63
- expected: bayannagur hota
64
- - source: ᠤᠯᠠᠭᠠᠨᠬᠣᠲᠠ # Улаан хот
65
- expected: ulaganhota
66
- - source: ᠬᠣᠣᠯᠢᠠ ᠭᠣᠤᠯ ᠬᠣᠲᠠ # Хоолингол хот
67
- expected: hoolia goul hota
68
- - source: ᠡᠷᠢᠶᠡᠨ ᠬᠣᠲᠠ # Эрээн хот
69
- expected: eriyen hota
70
- - source: ᠷᠠᠰᠢᠶᠠᠨ ᠬᠣᠲᠠ # Рашаан хот
71
- expected: rasiyan hota
72
- - source: ᠪᠠᠭᠠᠷᠢᠨ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # Баарин баруун хошуу
73
- expected: bagarin baragun hosigu
74
- - source: ᠪᠠᠭᠠᠷᠢᠨ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # Баарин зүүн хошуу
75
- expected: bagarin jegun hosigu
76
- - source: ᠲᠦᠩᠯᠢᠶᠣᠤ ᠬᠣᠲᠠ # Байшинт хот
77
- expected: tungliyou hota
78
- - source: ᠰᠢᠯᠢ ᠶᠢᠨ ᠬᠣᠲᠠ # Шилийн хот
79
- expected: sili-yin hota
80
- - source: ᠬᠣᠷᠢᠨ ᠭᠡᠷ ᠰᠢᠶᠠᠨ # Horinger County
81
- expected: horin ger siyan
82
- - source: ᠤᠳᠠ ᠲᠣᠭᠣᠷᠢᠭ # Уда тойрог
83
- expected: uda togorig
84
- - source: ᠦᠬᠠᠢ ᠬᠣᠲᠠ # Үхай хот
85
- expected: uhai hota
86
- - source: ᠬᠠᠶᠢᠨᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Hainan District
87
- expected: hayinan togorig
88
- - source: ᠬᠠᠶᠢᠷᠤᠪ ᠤᠨ ᠲᠣᠬᠣᠢ ᠲᠣᠭᠣᠷᠢᠭ # Haibowan District
89
- expected: hayirub-un tohoi togorig
90
- - source: ᠤᠯᠠᠭᠠᠨᠴᠠᠪ ᠬᠣᠲᠠ # Улаанцав хот
91
- expected: ulaganqab hota
92
- - source: ᠵᠢᠨᠢᠩ ᠲᠣᠭᠣᠷᠢᠭ # Жинин тойрог
93
- expected: jining togorig
94
- - source: ᠹᠸᠩᠵᠸᠡ ᠬᠣᠲᠠ # Фенжень хот
95
- expected: fwngjwe hota
96
- - source: ᠵᠦᠸᠧᠽᠢ ᠰᠢᠶᠠᠨ # Zhuozi County
97
- expected: juwezi siyan
98
- - source: ᠬᠤᠸᠠᠳᠧ ᠰᠢᠶᠠᠨ # Huade County
99
- expected: huwade siyan
100
- - source: ᠱᠠᠩᠳᠤ ᠰᠢᠶᠠᠨ # Шанду шянь
101
- expected: xangdu siyan
102
- - source: ᠰᠢᠩᠾᠧ ᠰᠢᠶᠠᠨ # Шинхэ шянь
103
- expected: singhe siyan
104
- - source: ᠯᠢᠶᠠᠩᠴᠠᠩ ᠰᠢᠶᠠᠨ # Liangcheng County
105
- expected: liyangqang siyan
106
- - source: ᠴᠠᠬᠠᠷ ᠪᠠᠷᠠᠭᠤᠨ ᠭᠠᠷᠤᠨ ᠡᠮᠦᠨᠡᠳᠦ ᠬᠣᠰᠢᠭᠤ # Цахар баруун гарын өмнөд хошуу
107
- expected: qahar baragun garun emunedu hosigu
108
- - source: ᠴᠠᠬᠠᠷ ᠪᠠᠷᠠᠭᠤᠨ ᠭᠠᠷᠤᠨ ᠳᠤᠮᠳᠠᠳᠤ ᠬᠣᠰᠢᠭᠤ # Цахар баруун гарын дундад хошуу
109
- expected: qahar baragun garun dumdadu hosigu
110
- - source: ᠴᠠᠬᠠᠷ ᠪᠠᠷᠠᠭᠤᠨ ᠭᠠᠷᠤᠨ ᠬᠣᠶᠢᠲᠤ ᠬᠣᠰᠢᠭᠤ # Цахар баруун гарын хойд хошуу
111
- expected: qahar baragun garun hoyitu hosigu
112
- - source: ᠳᠥᠷᠪᠡᠳ ᠬᠣᠰᠢᠭᠤ # Дөрвөд хошуу
113
- expected: dorbed hosigu
114
- - source: ᠪᠤᠭᠤᠲᠤ ᠬᠣᠲᠠ # Бугaт хот
115
- expected: bugutu hota
116
- - source: ᠬᠥᠨᠳᠡᠯᠡᠨ ᠲᠣᠭᠣᠷᠢᠭ # Hondlon District
117
- expected: hondelen togorig
118
- - source: ᠳᠦᠩᠾᠧ ᠲᠣᠭᠣᠷᠢᠭ # Donghe District
119
- expected: dunghe togorig
120
- - source: ᠴᠢᠩᠱᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Qingshan District
121
- expected: qingxan togorig
122
- - source: ᠰᠢᠭᠤᠶᠢᠲᠤ ᠲᠣᠭᠣᠷᠢᠭ # Шигуай тойрог
123
- expected: siguyitu togorig
124
- - source: ᠵᠢᠦ ᠶᠤᠸᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Jiuyuan District
125
- expected: jiu yuwan togorig
126
- - source: ᠭᠦᠶᠠᠩ ᠰᠢᠶᠠᠨ # Guyang County
127
- expected: guyang siyan
128
- - source: ᠲᠦᠮᠡᠳ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # Түмэд Зүүн хошуу
129
- expected: tumed jegun hosigu
130
- - source: ᠲᠦᠮᠡᠳ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # Түмэд Баруун хошуу
131
- expected: tumed baragun hosigu
132
- - source: ᠳᠠᠷᠬᠠᠨ ᠮᠤᠤᠮᠢᠩᠭ᠋ᠠᠨ ᠬᠣᠯᠪᠣᠭᠠᠲᠤ ᠬᠣᠰᠢᠭᠤ # Darhan Muminggan United Banner
133
- expected: darhan muumingg᠋an holbogatu hosigu
134
- - source: ᠬᠡᠰᠢᠭᠲᠡᠨ ᠬᠣᠰᠢᠭᠤ # Hexigten Banner
135
- expected: hesigten hosigu
136
- - source: ᠰᠢᠨ᠎ᠡ ᠪᠠᠷᠭᠤ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # New Barag Left Banner
137
- expected: sin-e bargu jegun hosigu
138
- - source: ᠰᠢᠨ᠎ᠡ ᠪᠠᠷᠭᠤ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # New Barag Right Banner
139
- expected: sin-e bargu baragun hosigu
140
- - source: ᠣᠲᠣᠭ ᠬᠣᠰᠢᠭᠤ # Otog Banner
141
- expected: otog hosigu
142
- - source: ᠳ᠋ᠦᠩᠱᠧᠩ ᠲᠣᠭᠣᠷᠢᠭ # Dongsheng District
143
- expected: d᠋ungxeng togorig
144
- - source: ᠳᠠᠯᠠᠳ ᠬᠣᠰᠢᠭᠤ # Dalad Banner
145
- expected: dalad hosigu
146
- - source: ᠵᠡᠭᠦᠨᠭᠠᠷ ᠬᠣᠰᠢᠭᠤ # Jungar Banner
147
- expected: jegungar hosigu
148
- - source: ᠣᠲᠣᠭ ᠤᠨ ᠡᠮᠦᠨᠡᠳᠦ ᠬᠣᠰᠢᠭᠤ # Otog Front Banner
149
- expected: otog-un emunedu hosigu
150
- - source: ᠬᠠᠩᠭᠢᠨ ᠬᠣᠰᠢᠭᠤ # Hanggin Banner
151
- expected: hanggin hosigu
152
- - source: ᠦᠦᠰᠢᠨ ᠬᠣᠰᠢᠭᠤ # Uxin Banner
153
- expected: uusin hosigu
154
- - source: ᠡᠵᠢᠨ ᠬᠣᠷᠣᠭ᠎ᠠ ᠬᠣᠰᠢᠭᠤ # Эзэн Хороо хошуу
155
- expected: ejin horog-a hosigu
156
- - source: ᠵᠠᠯᠠᠨ ᠠᠢ᠌ᠯ ᠬᠣᠲᠠ # Жалан-Айл хот
157
- expected: jalan ai᠌l hota
158
- - source: ᠶᠠᠭᠰᠢ ᠬᠣᠲᠠ # Ягши хот
159
- expected: yagsi hota
160
- - source: ᠮᠠᠨᠵᠤᠤᠷ ᠬᠣᠲᠠ # Манжуур хот
161
- expected: manjuur hota
162
- - source: ᠬᠠᠶᠢᠯᠠᠷ ᠲᠣᠭᠣᠷᠢᠭ # Хайлаар тойрог
163
- expected: hayilar togorig
164
- - source: ᠬᠣᠷᠴᠢᠨ ᠲᠣᠭᠣᠷᠢᠭ # Horqin District
165
- expected: horqin togorig
166
- - source: ᠺᠠᠶᠢᠯᠦ ᠰᠢᠶᠠᠨ # Kailu County
167
- expected: kayilu siyan
168
- - source: ᠬᠦᠷᠢᠶ᠎ᠡ ᠬᠣᠰᠢᠭᠤ # Hure Banner
169
- expected: huriy-e hosigu
170
- - source: ᠨᠠᠢᠮᠠᠨ ᠬᠣᠰᠢᠭᠤ # Naiman Banner
171
- expected: naiman hosigu
172
- - source: ᠵᠠᠷᠤᠳ ᠬᠣᠰᠢᠭᠤ # Jarud Banner
173
- expected: jarud hosigu
174
- - source: ᠬᠣᠷᠴᠢᠨ ᠪᠠᠷᠠᠭᠤᠨ ᠭᠠᠷᠤᠨ ᠳᠤᠮᠳᠠᠳᠤ ᠬᠣᠰᠢᠭᠤ # Хорчин Баруун Гарын Дундад Хошуу
175
- expected: horqin baragun garun dumdadu hosigu
176
- - source: ᠬᠣᠷᠴᠢᠨ ᠵᠡᠭᠦᠨ ᠭᠠᠷᠤᠨ ᠳᠤᠮᠳᠠᠳᠤ ᠬᠣᠰᠢᠭᠤ # Horqin Left Middle Banner
177
- expected: horqin jegun garun dumdadu hosigu
178
- - source: ᠬᠣᠷᠴᠢᠨ ᠵᠡᠭᠦᠨ ᠭᠠᠷᠤᠨ ᠬᠣᠶᠢᠲᠤ ᠬᠣᠰᠢᠭᠤ # Horqin Left Rear Banner
179
- expected: horqin jegun garun hoyitu hosigu
180
- - source: ᠤᠯᠠᠭᠠᠨᠬᠠᠳᠠ ᠬᠣᠲᠠ # Улаанхад хот
181
- expected: ulaganhada hota
182
- - source: ᠰᠡᠷᠡᠴᠢ # Salaqi
183
- expected: sereqi
184
- - source: ᠭᠡᠭᠡᠨ ᠭᠣᠤᠯ ᠬᠣᠲᠠ # Гэгээнгол хот
185
- expected: gegen goul hota
186
- - source: ᠠᠯᠠᠱᠠ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # Alxa Left Banner
187
- expected: alaxa jegun hosigu
188
- - source: ᠠᠯᠠᠱᠠ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # Alxa Right Banner
189
- expected: alaxa baragun hosigu
190
- - source: ᠡᠵᠡᠨ᠎ᠡ ᠬᠣᠰᠢᠭᠤ # Ejin Banner
191
- expected: ejen-e hosigu
192
- - source: ᠬᠥᠪᠡᠭᠡᠲᠦ ᠰᠢᠷ᠎ᠠ ᠬᠣᠰᠢᠭᠤ # Хөвөөт Шар хошуу
193
- expected: hobegetu sir-a hosigu
194
- - source: ᠦᠶᠤᠸᠠᠨ ᠰᠢᠶᠠᠨ # Үюань шянь
195
- expected: uyuwan siyan
196
- - source: ᠦᠴᠤᠸᠠᠨ ᠰᠢᠶᠠᠨ # Wuchuan County
197
- expected: uquwan siyan
198
- - source: ᠲᠦᠴᠢᠤᠸᠠᠨ ᠰᠢᠶᠠᠨ # Тучуань шянь
199
- expected: tuqiuwan siyan
200
- - source: ᠨᠢᠩᠴᠧᠩ ᠰᠢᠶᠠᠨ # Ningcheng County
201
- expected: ningqeng siyan
202
- - source: ᠯᠢᠨᠰᠢ ᠰᠢᠶᠠᠨ # Linxi County
203
- expected: linsi siyan
204
- - source: ᠯᠢᠨᠾᠧ ᠲᠣᠭᠣᠷᠢᠭ # Linhe
205
- expected: linhe togorig
206
- - source: ᠬᠠᠷᠠᠴᠢᠨ ᠬᠣᠰᠢᠭᠤ # Harqin Banner
207
- expected: haraqin hosigu
208
- - source: ᠳ᠋ᠧᠩᠺᠧᠦ ᠰᠢᠶᠠᠨ # Dengkou County
209
- expected: d᠋engkeu siyan
210
- - source: ᠠᠤᠬᠠᠨ ᠬᠣᠰᠢᠭᠤ # Aohan Banner
211
- expected: auhan hosigu
212
- - source: ᠴᠢᠩ ᠱᠦᠢ ᠾᠧ ᠰᠢᠶᠠᠨ # Qingshuihe County
213
- expected: qing xui he siyan
214
- - source: ᠬᠣᠳᠣᠩ ᠠᠷᠠᠳ ᠤᠨ ᠲᠣᠭᠣᠷᠢᠭ # Huimin District
215
- expected: hodong arad-un togorig
216
- - source: ᠰᠠᠶᠢᠬᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Saihan District
217
- expected: sayihan togorig
218
- - source: ᠰᠢᠨ᠎ᠡ ᠬᠣᠲᠠ ᠲᠣᠭᠣᠷᠢᠭ # Xincheng District
219
- expected: sin-e hota togorig
220
- - source: ᠬᠠᠶᠢᠷᠤᠪ ᠤᠨ ᠲᠣᠬᠣᠢ ᠲᠣᠭᠣᠷᠢᠭ # Haibowan (Hairibin Tohoi) District
221
- expected: hayirub-un tohoi togorig
222
- - source: ᠰᠦᠩ ᠱᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Songshan District
223
- expected: sung xan togorig
224
- - source: ᠬᠦᠩ ᠱᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Hongshan District
225
- expected: hung xan togorig
226
- - source: ᠠᠷᠤᠨ ᠬᠣᠰᠢᠭᠤ # Арун хошуу
227
- expected: arun hosigu
228
- - source: ᠶᠤᠸᠠᠨ ᠪᠣᠣ ᠱᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Юаньбаошань тойрог
229
- expected: yuwan boo xan togorig
230
- - source: ᠰᠢᠯᠤᠭᠤᠨ ᠬᠥᠪᠡᠭᠡᠲᠦ ᠴᠠᠭᠠᠨ ᠬᠣᠰᠢᠭᠤ # Шулуун Хөвөөт Цагаан хошуу
231
- expected: silugun hobegetu qagan hosigu
232
- - source: ᠰᠢᠯᠤᠭᠤᠨ ᠬᠥᠬᠡ ᠬᠣᠰᠢᠭᠤ # Шулуун хөх хошуу
233
- expected: silugun hohe hosigu
234
- - source: ᠤᠷᠠᠳ ᠤᠨ ᠳᠤᠮᠳᠠᠳᠤ ᠬᠣᠰᠢᠭᠤ # Урадын Дундад Хошуу
235
- expected: urad-un dumdadu hosigu
236
- - source: ᠤᠷᠠᠳ ᠤᠨ ᠡᠮᠦᠨᠡᠳᠦ ᠬᠣᠰᠢᠭᠤ # Урадын Өмнөд Хошуу
237
- expected: urad-un emunedu hosigu
238
- - source: ᠲᠣᠭᠲᠠᠬᠤ ᠰᠢᠶᠠᠨ # Тогтох шянь
239
- expected: togtahu siyan
240
- - source: ᠲᠠᠶᠢᠫᠤᠰᠧ ᠬᠣᠰᠢᠭᠤ # Тайвас хошуу
241
- expected: tayipuse hosigu
242
- - source: ᠰᠥᠨᠡᠳ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # Sonid Left Banner
243
- expected: soned jegun hosigu
244
- - source: ᠰᠥᠨᠡᠳ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # Sonid Right Banner
245
- expected: soned baragun hosigu
246
- - source: ᠣᠩᠨᠢᠭᠤᠳ ᠬᠣᠰᠢᠭᠤ # Ongniud Banner
247
- expected: ongnigud hosigu
248
- - source: ᠵᠠᠯᠠᠢᠳ ᠬᠣᠰᠢᠭᠤ # Jalaid Banner
249
- expected: jalaid hosigu
250
- - source: ᠬᠠᠩᠭᠢᠨ ᠬᠣᠶᠢᠲᠤ ᠬᠣᠰᠢᠭᠤ # Hanggin Rear Banner
251
- expected: hanggin hoyitu hosigu
252
- - source: ᠵᠡᠭᠦᠨ ᠤᠵᠤᠮᠤᠴᠢᠨ ᠬᠣᠰᠢᠭᠤ # East Ujimqin Banner
253
- expected: jegun ujumuqin hosigu
254
- - source: ᠠᠷᠤ ᠬᠣᠷᠴᠢᠨ ᠬᠣᠰᠢᠭᠤ # Ar Horqin Banner
255
- expected: aru horqin hosigu
256
- - source: ᠠᠪᠠᠭ᠎ᠠ ᠬᠣᠰᠢᠭᠤ # Abag Banner
257
- expected: abag-a hosigu
258
- - source: ᠪᠤᠷᠢᠶᠠᠳ # Буриад
259
- expected: buriyad
260
- - source: ᠤᠯᠠᠭᠠᠨᠪᠠᠭᠠᠲᠤᠷ # Улаанбаатар
261
- expected: ulaganbagatur
262
-
263
- map:
264
- inherit: sasm-mon-Mong-Latn-general-1978