interscript 0.1.9 → 2.0.5

Sign up to get free protection for your applications and to get access to all the features.
Files changed (352) hide show
  1. checksums.yaml +4 -4
  2. data/.gitignore +11 -0
  3. data/.rspec +3 -0
  4. data/Gemfile +29 -0
  5. data/LICENSE.adoc +31 -0
  6. data/README.md +3 -0
  7. data/Rakefile +53 -0
  8. data/bin/console +14 -0
  9. data/bin/interscript +5 -0
  10. data/bin/maps_analyze_staging +168 -0
  11. data/bin/maps_debug_compilers +58 -0
  12. data/bin/maps_debug_ordering +88 -0
  13. data/bin/maps_debug_ruby_compile +24 -0
  14. data/bin/maps_debug_step_by_step +44 -0
  15. data/bin/maps_optimize_order +112 -0
  16. data/bin/maps_v1_analyze_regexps +45 -0
  17. data/bin/maps_v1_to_v2 +426 -0
  18. data/bin/setup +8 -0
  19. data/exe/interscript +6 -0
  20. data/interscript.gemspec +31 -0
  21. data/lib/interscript.rb +80 -135
  22. data/lib/interscript/command.rb +5 -5
  23. data/lib/interscript/compiler.rb +22 -0
  24. data/lib/interscript/compiler/javascript.rb +292 -0
  25. data/lib/interscript/compiler/ruby.rb +262 -0
  26. data/lib/interscript/dsl.rb +67 -0
  27. data/lib/interscript/dsl/aliases.rb +23 -0
  28. data/lib/interscript/dsl/document.rb +46 -0
  29. data/lib/interscript/dsl/group.rb +45 -0
  30. data/lib/interscript/dsl/group/parallel.rb +6 -0
  31. data/lib/interscript/dsl/items.rb +89 -0
  32. data/lib/interscript/dsl/metadata.rb +26 -0
  33. data/lib/interscript/dsl/stage.rb +6 -0
  34. data/lib/interscript/dsl/symbol_mm.rb +11 -0
  35. data/lib/interscript/dsl/tests.rb +12 -0
  36. data/lib/interscript/interpreter.rb +251 -0
  37. data/lib/interscript/node.rb +25 -0
  38. data/lib/interscript/node/alias_def.rb +15 -0
  39. data/lib/interscript/node/dependency.rb +13 -0
  40. data/lib/interscript/node/document.rb +45 -0
  41. data/lib/interscript/node/group.rb +34 -0
  42. data/lib/interscript/node/group/parallel.rb +9 -0
  43. data/lib/interscript/node/group/sequential.rb +2 -0
  44. data/lib/interscript/node/item.rb +52 -0
  45. data/lib/interscript/node/item/alias.rb +42 -0
  46. data/lib/interscript/node/item/any.rb +61 -0
  47. data/lib/interscript/node/item/capture.rb +50 -0
  48. data/lib/interscript/node/item/group.rb +51 -0
  49. data/lib/interscript/node/item/repeat.rb +40 -0
  50. data/lib/interscript/node/item/stage.rb +23 -0
  51. data/lib/interscript/node/item/string.rb +51 -0
  52. data/lib/interscript/node/metadata.rb +18 -0
  53. data/lib/interscript/node/rule.rb +6 -0
  54. data/lib/interscript/node/rule/funcall.rb +18 -0
  55. data/lib/interscript/node/rule/run.rb +15 -0
  56. data/lib/interscript/node/rule/sub.rb +65 -0
  57. data/lib/interscript/node/stage.rb +19 -0
  58. data/lib/interscript/node/tests.rb +15 -0
  59. data/lib/interscript/stdlib.rb +211 -0
  60. data/lib/interscript/utils/regexp_converter.rb +283 -0
  61. data/lib/interscript/version.rb +1 -1
  62. data/requirements.txt +1 -0
  63. metadata +73 -458
  64. data/README.adoc +0 -296
  65. data/aliases.json +0 -1
  66. data/lib/g2pwrapper.py +0 -34
  67. data/lib/interscript/fs.rb +0 -96
  68. data/lib/interscript/mapping.rb +0 -144
  69. data/lib/interscript/opal.rb +0 -196
  70. data/lib/interscript/opal/entrypoint.rb +0 -20
  71. data/lib/interscript/opal/exports.rb +0 -11
  72. data/lib/interscript/opal/maps.js.erb +0 -8
  73. data/lib/model-7 +0 -0
  74. data/lib/tha-pt-b-7 +0 -0
  75. data/maps/acadsin-zho-Hani-Latn-2002.yaml +0 -38916
  76. data/maps/alalc-amh-Ethi-Latn-1997.yaml +0 -513
  77. data/maps/alalc-amh-Ethi-Latn-2011.yaml +0 -138
  78. data/maps/alalc-ara-Arab-Latn-1997.yaml +0 -1287
  79. data/maps/alalc-asm-Deva-Latn-1997.yaml +0 -259
  80. data/maps/alalc-asm-Deva-Latn-2012.yaml +0 -55
  81. data/maps/alalc-aze-Arab-Latn-1997.yaml +0 -376
  82. data/maps/alalc-aze-Cyrl-Latn-1997.yaml +0 -145
  83. data/maps/alalc-bel-Cyrl-Latn-1997.yaml +0 -129
  84. data/maps/alalc-ben-Beng-Latn-1997.yaml +0 -291
  85. data/maps/alalc-ben-Beng-Latn-2017.yaml +0 -130
  86. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +0 -98
  87. data/maps/alalc-div-Thaa-Latn-1997.yaml +0 -211
  88. data/maps/alalc-ell-Grek-Latn-1997.yaml +0 -628
  89. data/maps/alalc-ell-Grek-Latn-2010.yaml +0 -626
  90. data/maps/alalc-guj-Gujr-Latn-1997.yaml +0 -266
  91. data/maps/alalc-guj-Gujr-Latn-2011.yaml +0 -64
  92. data/maps/alalc-hin-Deva-Latn-1997.yaml +0 -303
  93. data/maps/alalc-hin-Deva-Latn-2011.yaml +0 -65
  94. data/maps/alalc-kan-Kana-Latn-1997.yaml +0 -274
  95. data/maps/alalc-kan-Kana-Latn-2011.yaml +0 -63
  96. data/maps/alalc-kat-Geok-Latn-1997.yaml +0 -111
  97. data/maps/alalc-kat-Geor-Latn-1997.yaml +0 -150
  98. data/maps/alalc-kor-Hang-Latn-1997.yaml +0 -98
  99. data/maps/alalc-mal-Mlym-Latn-1997.yaml +0 -303
  100. data/maps/alalc-mal-Mlym-Latn-2012.yaml +0 -73
  101. data/maps/alalc-mar-Deva-Latn-1997.yaml +0 -189
  102. data/maps/alalc-mar-Deva-Latn-2011.yaml +0 -45
  103. data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +0 -114
  104. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +0 -103
  105. data/maps/alalc-mon-Cyrl-Latn-1997.yaml +0 -220
  106. data/maps/alalc-ori-Orya-Latn-1997.yaml +0 -284
  107. data/maps/alalc-ori-Orya-Latn-2011.yaml +0 -67
  108. data/maps/alalc-pan-Guru-Latn-1997.yaml +0 -256
  109. data/maps/alalc-pan-Guru-Latn-2011.yaml +0 -78
  110. data/maps/alalc-per-Arab-Latn-1997.yaml +0 -375
  111. data/maps/alalc-pli-Deva-Latn-2012.yaml +0 -144
  112. data/maps/alalc-pra-Deva-Latn-2012.yaml +0 -47
  113. data/maps/alalc-rus-Cyrl-Latn-1997.yaml +0 -225
  114. data/maps/alalc-rus-Cyrl-Latn-2012.yaml +0 -162
  115. data/maps/alalc-san-Deva-Latn-2012.yaml +0 -241
  116. data/maps/alalc-sin-Sinh-Latn-1997.yaml +0 -292
  117. data/maps/alalc-sin-Sinh-Latn-2011.yaml +0 -71
  118. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +0 -118
  119. data/maps/alalc-srp-Cyrl-Latn-2013.yaml +0 -135
  120. data/maps/alalc-tam-Taml-Latn-1997.yaml +0 -62
  121. data/maps/alalc-tam-Taml-Latn-2011.yaml +0 -58
  122. data/maps/alalc-tel-Telu-Latn-1997.yaml +0 -284
  123. data/maps/alalc-tel-Telu-Latn-2011.yaml +0 -64
  124. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +0 -145
  125. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +0 -16
  126. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +0 -283
  127. data/maps/az-aze-Cyrl-Latn-1939.yaml +0 -105
  128. data/maps/az-aze-Cyrl-Latn-1958.yaml +0 -45
  129. data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +0 -174
  130. data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +0 -169
  131. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +0 -292
  132. data/maps/bgn-kor-Hang-Latn-1943.yaml +0 -35
  133. data/maps/bgn-kor-Kore-Latn-1943.yaml +0 -31
  134. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +0 -208
  135. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +0 -208
  136. data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +0 -532
  137. data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +0 -598
  138. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +0 -108
  139. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +0 -111
  140. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +0 -188
  141. data/maps/bgnpcgn-bal-Arab-Latn-2008.yaml +0 -329
  142. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +0 -289
  143. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +0 -119
  144. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +0 -42
  145. data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +0 -184
  146. data/maps/bgnpcgn-div-Thaa-Latn-1988.yaml +0 -75
  147. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +0 -705
  148. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +0 -23
  149. data/maps/bgnpcgn-far-Latn-Latn-1964.yaml +0 -28
  150. data/maps/bgnpcgn-fas-Arab-Latn-1956.yaml +0 -96
  151. data/maps/bgnpcgn-isl-Latn-Latn-1964.yaml +0 -37
  152. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +0 -257
  153. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +0 -131
  154. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +0 -42
  155. data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.yaml +0 -247
  156. data/maps/bgnpcgn-kir-Cyrl-Latn-1979.yaml +0 -218
  157. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +0 -253
  158. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +0 -48
  159. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +0 -48
  160. data/maps/bgnpcgn-kur-Arab-Latn-2007.yaml +0 -249
  161. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +0 -163
  162. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +0 -190
  163. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +0 -223
  164. data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +0 -230
  165. data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +0 -338
  166. data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +0 -673
  167. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +0 -459
  168. data/maps/bgnpcgn-pus-Arab-Latn-1968.yaml +0 -377
  169. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +0 -168
  170. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +0 -318
  171. data/maps/bgnpcgn-srp-Cyrl-Latn-1962.yaml +0 -73
  172. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +0 -170
  173. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +0 -220
  174. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +0 -240
  175. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +0 -166
  176. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +0 -119
  177. data/maps/bgnpcgn-urd-Arab-Latn-2007.yaml +0 -459
  178. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +0 -127
  179. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +0 -82
  180. data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +0 -7456
  181. data/maps/bis-asm-Beng-Latn-13194-1991.yaml +0 -159
  182. data/maps/bis-ben-Beng-Latn-13194-1991.yaml +0 -156
  183. data/maps/bis-dev-Deva-Latn-13194-1991.yaml +0 -184
  184. data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +0 -181
  185. data/maps/bis-kan-Kana-Latn-13194-1991.yaml +0 -173
  186. data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +0 -176
  187. data/maps/bis-ori-Orya-Latn-13194-1991.yaml +0 -175
  188. data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +0 -175
  189. data/maps/bis-tel-Telu-Latn-13194-1991.yaml +0 -170
  190. data/maps/bis-tml-Taml-Latn-13194-1991.yaml +0 -155
  191. data/maps/by-bel-Cyrl-Latn-1998.yaml +0 -172
  192. data/maps/by-bel-Cyrl-Latn-2007.yaml +0 -115
  193. data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +0 -899
  194. data/maps/din-hin-Deva-Latn-33904-2018.yaml +0 -100
  195. data/maps/din-kat-Geor-Latn-32707-2010.yaml +0 -145
  196. data/maps/din-mar-Deva-Latn-33904-2018.yaml +0 -84
  197. data/maps/din-nep-Deva-Latn-33904-2018.yaml +0 -119
  198. data/maps/din-pli-Deva-Latn-33904-2018.yaml +0 -75
  199. data/maps/din-pra-Deva-Latn-33904-2018.yaml +0 -63
  200. data/maps/din-san-Deva-Latn-33904-2018.yaml +0 -338
  201. data/maps/din-tam-Taml-Latn-33903-2016.yaml +0 -213
  202. data/maps/dos-nep-Deva-Latn-1997.yaml +0 -47
  203. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +0 -684
  204. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +0 -680
  205. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +0 -19
  206. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +0 -31
  207. data/maps/ggg-kat-Geor-Latn-2002.yaml +0 -92
  208. data/maps/gki-bel-Cyrl-Latn-1992.yaml +0 -33
  209. data/maps/gki-bel-Cyrl-Latn-2000.yaml +0 -201
  210. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +0 -190
  211. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +0 -157
  212. data/maps/hk-yue-Hani-Latn-1888.yaml +0 -38497
  213. data/maps/icao-bel-Cyrl-Latn-9303.yaml +0 -136
  214. data/maps/icao-bul-Cyrl-Latn-9303.yaml +0 -118
  215. data/maps/icao-fas-Arab-Latn-9303.yaml +0 -103
  216. data/maps/icao-heb-Hebr-Latn-9303.yaml +0 -151
  217. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +0 -117
  218. data/maps/icao-rus-Cyrl-Latn-9303.yaml +0 -117
  219. data/maps/icao-srp-Cyrl-Latn-9303.yaml +0 -117
  220. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +0 -119
  221. data/maps/iso-ara-Arab-Latn-233-1984.yaml +0 -323
  222. data/maps/iso-asm-Beng-Latn-15919-2001.yaml +0 -75
  223. data/maps/iso-ben-Beng-Latn-15919-2001.yaml +0 -175
  224. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +0 -613
  225. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +0 -44
  226. data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +0 -220
  227. data/maps/iso-hin-Deva-Latn-15919-2001.yaml +0 -87
  228. data/maps/iso-inc-Deva-Latn-15919-2001.yaml +0 -61
  229. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +0 -66
  230. data/maps/iso-kan-Kana-Latn-15919-2001.yaml +0 -220
  231. data/maps/iso-kat-Geor-Latn-9984-1996.yaml +0 -145
  232. data/maps/iso-kor-Hang-Latn-1996-method1.yaml +0 -240
  233. data/maps/iso-kor-Hang-Latn-1996-method2.yaml +0 -226
  234. data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +0 -281
  235. data/maps/iso-mar-Deva-Latn-15919-2001.yaml +0 -75
  236. data/maps/iso-nep-Deva-Latn-15919-2001.yaml +0 -87
  237. data/maps/iso-ori-Orya-Latn-15919-2001.yaml +0 -193
  238. data/maps/iso-pan-Guru-Latn-15919-2001.yaml +0 -222
  239. data/maps/iso-pli-Beng-Latn-15919-2001.yaml +0 -73
  240. data/maps/iso-pli-Deva-Latn-15919-2001.yaml +0 -74
  241. data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +0 -219
  242. data/maps/iso-pli-Thai-Latn-15919-2001.yaml +0 -55
  243. data/maps/iso-pra-Deva-Latn-15919-2001.yaml +0 -59
  244. data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +0 -366
  245. data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +0 -271
  246. data/maps/iso-san-Deva-Latn-15919-2001.yaml +0 -220
  247. data/maps/iso-tam-Taml-Latn-15919-2001.yaml +0 -159
  248. data/maps/iso-tel-Telu-Latn-15919-2001.yaml +0 -220
  249. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +0 -109
  250. data/maps/kp-kor-Hang-Latn-2002.yaml +0 -909
  251. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +0 -44820
  252. data/maps/masm-mon-Cyrl-Latn-5217-2012.yaml +0 -163
  253. data/maps/masm-mon-Latn-Cyrl-5217-2012.yaml +0 -200
  254. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +0 -411
  255. data/maps/moct-kor-Hang-Latn-2000.yaml +0 -807
  256. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +0 -541
  257. data/maps/mv-div-Thaa-Latn-1987.yaml +0 -200
  258. data/maps/mvd-bel-Cyrl-Latn-2008.yaml +0 -225
  259. data/maps/mvd-bel-Cyrl-Latn-2010.yaml +0 -63
  260. data/maps/mvd-rus-Cyrl-Latn-2008.yaml +0 -109
  261. data/maps/mvd-rus-Cyrl-Latn-2010.yaml +0 -37
  262. data/maps/odni-ara-Arab-Latn-2004.yaml +0 -137
  263. data/maps/odni-ara-Arab-Latn-2015.yaml +0 -315
  264. data/maps/odni-aze-Cyrl-Latn-2015.yaml +0 -144
  265. data/maps/odni-bel-Cyrl-Latn-2015.yaml +0 -148
  266. data/maps/odni-bul-Cyrl-Latn-2005.yaml +0 -90
  267. data/maps/odni-bul-Cyrl-Latn-2015.yaml +0 -96
  268. data/maps/odni-che-Cyrl-Latn-2015.yaml +0 -169
  269. data/maps/odni-fas-Arab-Latn-2004.yaml +0 -276
  270. data/maps/odni-fas-Arab-Latn-2015.yaml +0 -406
  271. data/maps/odni-hin-Deva-Latn-2004.yaml +0 -182
  272. data/maps/odni-hin-Deva-Latn-2015.yaml +0 -258
  273. data/maps/odni-kat-Geor-Latn-2015.yaml +0 -87
  274. data/maps/odni-kaz-Cyrl-Latn-2015.yaml +0 -148
  275. data/maps/odni-kir-Cyrl-Latn-2015.yaml +0 -136
  276. data/maps/odni-kor-Hang-Latn-2015.yaml +0 -375
  277. data/maps/odni-mkd-Cyrl-Latn-2005.yaml +0 -21
  278. data/maps/odni-mkd-Cyrl-Latn-2015.yaml +0 -122
  279. data/maps/odni-prs-Arab-Latn-2004.yaml +0 -123
  280. data/maps/odni-prs-Arab-Latn-2015.yaml +0 -228
  281. data/maps/odni-rus-Cyrl-Latn-2015.yaml +0 -77
  282. data/maps/odni-srp-Cyrl-Latn-2005.yaml +0 -36
  283. data/maps/odni-srp-Cyrl-Latn-2015.yaml +0 -129
  284. data/maps/odni-tat-Cyrl-Latn-2015.yaml +0 -142
  285. data/maps/odni-tgk-Cyrl-Latn-2015.yaml +0 -148
  286. data/maps/odni-tuk-Cyrl-Latn-2015.yaml +0 -170
  287. data/maps/odni-uig-Cyrl-Latn-2015.yaml +0 -138
  288. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +0 -161
  289. data/maps/odni-urd-Arab-Latn-2015.yaml +0 -221
  290. data/maps/odni-uzb-Cyrl-Latn-2015.yaml +0 -166
  291. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +0 -90
  292. data/maps/royin-tha-Thai-Latn-1968.yaml +0 -183
  293. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +0 -180
  294. data/maps/royin-tha-Thai-Latn-1999.yaml +0 -80
  295. data/maps/sac-zho-Hans-Latn-1979.yaml +0 -24763
  296. data/maps/sasm-mon-Mong-Latn-general-1978.yaml +0 -389
  297. data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +0 -354
  298. data/maps/ses-ara-Arab-Latn-1930.yaml +0 -283
  299. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +0 -222
  300. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +0 -197
  301. data/maps/ua-ukr-Cyrl-Latn-2007.yaml +0 -75
  302. data/maps/ua-ukr-Cyrl-Latn-2010.yaml +0 -192
  303. data/maps/un-amh-Ethi-Latn-2016.yaml +0 -602
  304. data/maps/un-ara-Arab-Latn-1971.yaml +0 -139
  305. data/maps/un-ara-Arab-Latn-1972.yaml +0 -159
  306. data/maps/un-ara-Arab-Latn-2017.yaml +0 -420
  307. data/maps/un-asm-Beng-Latn-1972.yaml +0 -223
  308. data/maps/un-bel-Cyrl-Latn-2007.yaml +0 -114
  309. data/maps/un-ben-Beng-Latn-2016.yaml +0 -534
  310. data/maps/un-ell-Grek-Latn-1987-phonetic.yaml +0 -780
  311. data/maps/un-ell-Grek-Latn-1987-tl.yaml +0 -31
  312. data/maps/un-ell-Grek-Latn-1987-ts.yaml +0 -19
  313. data/maps/un-guj-Gujr-Latn-1972.yaml +0 -229
  314. data/maps/un-hin-Deva-Latn-2016.yaml +0 -316
  315. data/maps/un-kan-Kana-Latn-2016.yaml +0 -254
  316. data/maps/un-mal-Mlym-Latn-1972.yaml +0 -251
  317. data/maps/un-mar-Deva-Latn-2016.yaml +0 -102
  318. data/maps/un-mon-Mong-Latn-general-2013.yaml +0 -264
  319. data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +0 -264
  320. data/maps/un-nep-Deva-Latn-1972.yaml +0 -269
  321. data/maps/un-nep-Deva-Latn-2013.yaml +0 -74
  322. data/maps/un-ori-Orya-Latn-1972.yaml +0 -247
  323. data/maps/un-pan-Guru-Latn-1972.yaml +0 -402
  324. data/maps/un-prs-Arab-Latn-1967.yaml +0 -236
  325. data/maps/un-rus-Cyrl-Latn-1987.yaml +0 -166
  326. data/maps/un-tam-Taml-Latn-1972.yaml +0 -194
  327. data/maps/un-tel-Telu-Latn-1972.yaml +0 -270
  328. data/maps/un-ukr-Cyrl-Latn-1998.yaml +0 -53
  329. data/maps/un-ukr-Cyrl-Latn-2012.yaml +0 -162
  330. data/maps/un-urd-Arab-Latn-1972.yaml +0 -405
  331. data/maps/var-amh-Ethi-Latn-eae-2003.yaml +0 -466
  332. data/maps/var-gez-Ethi-Latn-eae-2003.yaml +0 -76
  333. data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +0 -221
  334. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +0 -406
  335. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +0 -386
  336. data/maps/var-kor-Hang-Hang-jamo.yaml +0 -11193
  337. data/maps/var-kor-Hang-Latn-mr-1939.yaml +0 -1054
  338. data/maps/var-kor-Kore-Hang-2013.yaml +0 -59754
  339. data/maps/var-kor-Kore-Latn-mr-1939.yaml +0 -36
  340. data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +0 -43
  341. data/maps/var-mon-Mong-Latn-1930.yaml +0 -102
  342. data/maps/var-mon-Mong-Latn-lessing.yaml +0 -272
  343. data/maps/var-mon-Mong-Latn-vpmc.yaml +0 -274
  344. data/maps/var-pra-Deva-Latn-iast-1912.yaml +0 -30
  345. data/maps/var-san-Deva-Latn-iast-1912.yaml +0 -149
  346. data/maps/var-tha-Thai-Thai-phonemic.yaml +0 -59
  347. data/maps/var-tha-Thai-Zsym-ipa.yaml +0 -301
  348. data/maps/var-zho-Hani-Latn-wd-1979.yaml +0 -38912
  349. data/spec/interscript/filenames_spec.rb +0 -21
  350. data/spec/interscript/mapping_spec.rb +0 -42
  351. data/spec/interscript_spec.rb +0 -37
  352. data/spec/spec_helper.rb +0 -3
@@ -1,289 +0,0 @@
1
- ---
2
- authority_id: bgnpcgn
3
- id: 1979
4
- language: iso-639-2:bel
5
- source_script: Cyrl
6
- destination_script: Latn
7
- name: United States Board on Geographic Names Foreign Names Committee Staff, 1994. Romanization Systems and Roman-Script Spelling Conventions, p. 23.
8
- alias:
9
- ogc11122:
10
- code: bel_Cyrl2Latn_BGN_1979
11
- description: Byelorussian US Board on Geographic Names(BGN)/Permanent Committee on Geographical Names for British Official Use(PCGN) 1979 System
12
- url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/811510/ROMANIZATION_OF_BELARUSIAN.pdf
13
- creation_date: 1979
14
- description: |
15
- The BGN/PCGN system for Belarusian (formerly referred to as Byelorussian) was designed for use in
16
- romanizing names written in the Belarusian Cyrillic alphabet. The Belarusian alphabet contains three
17
- characters not present in the Russian alphabet: і, ў, and ’.
18
-
19
- notes:
20
- - The character sequences зг, кг, сг, тс and цг may be romanized z·h, k·h, s·h, t·s and ts·h in order to differentiate those romanizations from the digraphs zh, kh, sh, ts, and the letter sequence tsh, which are used to render the characters ж, х, ш, ц, and the character sequence тш.
21
- - All apostrophes appearing in romanization are Unicode encoding 2019.
22
-
23
- tests:
24
- - source: Антон
25
- expected: Anton
26
- - source: Вілейка
27
- expected: Vilyeyka
28
- - source: Брэст
29
- expected: Brest
30
- - source: Дубна
31
- expected: Dubna
32
- - source: Віцебск
33
- expected: Vitsyebsk
34
- - source: Асіповічы
35
- expected: Asipovichy
36
- - source: Гродна
37
- expected: Hrodna
38
- - source: Брагін
39
- expected: Brahin
40
- - source: Добруш
41
- expected: Dobrush
42
- - source: Ліда
43
- expected: Lida
44
- - source: Гомель
45
- expected: Homyel’
46
- - source: Беліца
47
- expected: Byelitsa
48
- - source: Ёдкавічы
49
- expected: Yodkavichy
50
- - source: Нёман
51
- expected: Nyoman
52
- - source: Жлобін
53
- expected: Zhlobin
54
- - source: Ружаны
55
- expected: Ruzhany
56
- - source: Зоя
57
- expected: Zoya
58
- - source: князь
59
- expected: knyaz’
60
- - source: Ігнат
61
- expected: Ihnat
62
- - source: Мінск
63
- expected: Minsk
64
- - source: Йосель
65
- expected: Yosyel’
66
- - source: Койданава
67
- expected: Koydanava
68
- - source: Крапіўна
69
- expected: Krapiwna
70
- - source: Менск
71
- expected: Myensk
72
- - source: Лаўна
73
- expected: Lawna
74
- - source: Лёсік
75
- expected: Lyosik
76
- - source: Купала
77
- expected: Kupala
78
- - source: Вілейка
79
- expected: Vilyeyka
80
- - source: Міхал
81
- expected: Mikhal
82
- - source: Вільня
83
- expected: Vil’nya
84
- - source: Лепель
85
- expected: Lyepyel’
86
- - source: Магілёў
87
- expected: Mahilyow
88
- - source: Няміга
89
- expected: Nyamiha
90
- - source: Наваградак
91
- expected: Navahradak
92
- - source: Баранавічы
93
- expected: Baranavichy
94
- - source: Орша
95
- expected: Orsha
96
- - source: Востраў
97
- expected: Vostraw
98
- - source: Пінск
99
- expected: Pinsk
100
- - source: Дняпро
101
- expected: Dnyapro
102
- - source: Рагачоў
103
- expected: Rahachow
104
- - source: Сураж
105
- expected: Surazh
106
- - source: Смаляны
107
- expected: Smalyany
108
- - source: Арэса
109
- expected: Aresa
110
- - source: Рось
111
- expected: Ros’
112
- - source: Талочын
113
- expected: Talochyn
114
- - source: Масты
115
- expected: Masty
116
- - source: Уладзімір
117
- expected: Uladzimir
118
- - source: Бабруйск
119
- expected: Babruysk
120
- - source: Быхаў
121
- expected: Bykhaw
122
- - source: Воўпа
123
- expected: Vowpa
124
- - source: Іўе
125
- expected: Iwye
126
- - source: Фолюш
127
- expected: Folyush
128
- - source: фортка
129
- expected: fortka
130
- - source: Хатынь
131
- expected: Khatyn’
132
- - source: Быхаў
133
- expected: Bykhaw
134
- - source: Ганцавічы
135
- expected: Hantsavichy
136
- - source: Стоўбцы
137
- expected: Stowbtsy
138
- - source: цьмяны
139
- expected: ts’myany
140
- - source: мясцовы
141
- expected: myastsovy
142
- - source: Астравец
143
- expected: Astravyets
144
- - source: Прыпяць
145
- expected: Prypyats’
146
- - source: Чэрыкаў
147
- expected: Cherykaw
148
- - source: Шчара
149
- expected: Shchara
150
- - source: Нарач
151
- expected: Narach
152
- - source: Шклоў
153
- expected: Shklow
154
- - source: Ашмяны
155
- expected: Ashmyany
156
- - source: Ыттык-Кёль
157
- expected: Yttyk-Kyol’
158
- - source: Кобрын
159
- expected: Kobryn
160
- - source: Солы
161
- expected: Soly
162
- - source: Копысь
163
- expected: Kopys’
164
- - source: рунь
165
- expected: run’
166
- - source: Эйсманты
167
- expected: Eysmanty
168
- - source: Крэва
169
- expected: Kreva
170
- - source: Юры
171
- expected: Yury
172
- - source: уюн
173
- expected: uyun
174
- - source: Язэп
175
- expected: Yazep
176
- - source: Івянец
177
- expected: Ivyanyets
178
- - source: з’езд
179
- expected: z”yezd
180
- - source: Вялiкiя Вераб’евічы
181
- expected: Vyalikiya Vyerab”yevichy
182
- - source: Дзям’янаўцы
183
- expected: Dzyam”yanawtsy
184
- - source: Задвор’е
185
- expected: Zadvor”ye
186
- - source: Гезгалы
187
- expected: Hyez·haly
188
- - source: Вадасховішча Гезгальскае
189
- expected: Vadaskhovishcha Hyez·hal’skaye
190
-
191
- map:
192
- postrules:
193
- - pattern: '\u042C' # Ь
194
- result: "\u2019"
195
- - pattern: '\u044C' # ь
196
- result: "\u2019"
197
- # Per the documentation, the rules below are optional
198
- rules:
199
- - pattern: \u0417\u0413 # ЗГ
200
- result: "Z\u00B7H" # Z·H
201
- - pattern: \u0437\u0433 # зг
202
- result: "z\u00B7h" # z·h
203
- - pattern: \u041A\u0413 # КГ
204
- result: "K\u00B7H" # K·H
205
- - pattern: \u043A\u0433 # кг
206
- result: "k\u00B7h" # k·h
207
- - pattern: \u0421\u0413 # СГ
208
- result: "S\u00B7H" # S·H
209
- - pattern: \u0441\u0433 # сг
210
- result: "s\u00B7h" # s·h
211
- - pattern: \u0422\u0421 # ТС
212
- result: "T\u00B7S" # T·S
213
- - pattern: \u0442\u0441 # тс
214
- result: "t\u00B7s" # t·s
215
- - pattern: \u0426\u0413 # ЦГ
216
- result: "TS\u00B7H" # TS·H
217
- - pattern: \u0446\u0433 # цг
218
- result: "ts\u00B7h" # ts·h
219
-
220
- characters:
221
- '\u00B4' : "\u201D" # apostrophe according to spec
222
- '\u02BC' : "\u201D" # apostrophe according to spec
223
- '\u2019' : "\u201D" # apostrophe in actual examples
224
-
225
- '\u0410' : 'A' # A
226
- '\u0411' : 'B' # Б
227
- '\u0412' : 'V' # B
228
- '\u0413' : 'H' # Г
229
- '\u0414' : 'D' # Д
230
- '\u0415' : 'Ye' # Е
231
- '\u0401' : 'Yo' # Ё
232
- '\u0416' : 'Zh' # Ж
233
- '\u0417' : 'Z' # З
234
- '\u0406' : 'I' # І
235
- '\u0419' : 'Y' # Й
236
- '\u041A' : 'K' # К
237
- '\u041B' : 'L' # Л
238
- '\u041C' : 'M' # М
239
- '\u041D' : 'N' # Н
240
- '\u041E' : 'O' # О
241
- '\u041F' : 'P' # П
242
- '\u0420' : 'R' # Р
243
- '\u0421' : 'S' # С
244
- '\u0422' : 'T' # Т
245
- '\u0423' : 'U' # У
246
- '\U040E' : 'W' # Ў
247
- '\u0424' : 'F' # Ф
248
- '\u0425' : 'Kh' # Х
249
- '\u0426' : 'Ts' # Ц
250
- '\u0427' : 'Ch' # Ч
251
- '\u0428' : 'Sh' # Ш
252
- '\u042B' : 'Y' # Ы
253
- '\u042D' : 'E' # Э
254
- '\u042E' : 'Yu' # Ю
255
- '\u042F' : 'Ya' # Я
256
- '\u0490' : 'G' # Ґ
257
-
258
- '\u0430' : 'a' # а
259
- '\u0431' : 'b' # б
260
- '\u0432' : 'v' # в
261
- '\u0433' : 'h' # г
262
- '\u0434' : 'd' # д
263
- '\u0435' : 'ye' # е
264
- '\u0451' : 'yo' # ё
265
- '\u0436' : 'zh' # ж
266
- '\u0437' : 'z' # з
267
- '\u0456' : 'i' # і
268
- '\u0439' : 'y' # й
269
- '\u043A' : 'k' # к
270
- '\u043B' : 'l' # л
271
- '\u043C' : 'm' # м
272
- '\u043D' : 'n' # н
273
- '\u043E' : 'o' # о
274
- '\u043F' : 'p' # п
275
- '\u0440' : 'r' # р
276
- '\u0441' : 's' # с
277
- '\u0442' : 't' # т
278
- '\u0443' : 'u' # у
279
- '\u045E' : 'w' # ў
280
- '\u0444' : 'f' # ф
281
- '\u0445' : 'kh' # х
282
- '\u0446' : 'ts' # ц
283
- '\u0447' : 'ch' # ч
284
- '\u0448' : 'sh' # ш
285
- '\u044B' : 'y' # ы
286
- '\u044D' : 'e' # э
287
- '\u044E' : 'yu' # ю
288
- '\u044F' : 'ya' # я
289
- '\u0491' : 'g' # ґ
@@ -1,119 +0,0 @@
1
- ---
2
- authority_id: bgnpcgn
3
- id: 1952
4
- language: iso-639-2:bul
5
- source_script: Cyrl
6
- destination_script: Latn
7
- name: ROMANIZATION SYSTEM FOR BULGARIAN BGN/PCGN of 1952
8
- alias:
9
- ogc11122:
10
- code: bul_Cyrl2Latn_BGN_1952
11
- description: Bulgarian US Board on Geographic Names(BGN)/Permanent Committee on Geographical Names for British Official Use(PCGN) Bulgarian 1952 System
12
- url: https://libraries.ucsd.edu/bib/fed/USBGN_romanization.pdf
13
- creation_date: 1945
14
- confirmation_date: 1952
15
- description: |
16
- This system was adopted by the BGN in 1949 and by the PCGN in 1952. It
17
- reflects the much simplified Bulgarian orthography as officially revised in
18
- February 1945. The Bulgarian alphabet contains all of the characters present
19
- in the Russian alphabet with the exception of ё, ы, and э. Notes 1, 2, and 3
20
- are applicable to sources predating the orthographic reform of 1945.
21
-
22
- notes:
23
- - In modern Bulgarian orthography, the character ъ does not occur in word-final position. It should be omitted in romanization when found in word-final position in older sources.
24
- - The obsolete character ѫ, which was replaced by ъ in 1945, should be romanized ŭ
25
- - The obsolete character ѣ, replaced in 1945 by е or я according to local pronunciation, should be romanized as e or ya, accordingly, if the pronunciation is known; otherwise, as ye
26
- - The character sequence тс may be romanized t·s in order to differentiate that romanization from the regularly occurring digraph ts, which represents the character ц
27
-
28
- tests:
29
- - source: София
30
- expected: Sofiya
31
- - source: София-Град
32
- expected: Sofiya-Grad
33
- - source: България
34
- expected: "Bu\u0306lgariya"
35
-
36
- map:
37
- rules:
38
- # note[1]
39
- - pattern: (?<=)\u042a(?=\b)
40
- result: ""
41
- - pattern: (?<=)\u044a(?=\b)
42
- result: ""
43
- # note[4]
44
- - pattern: "\u0422\u0421"
45
- result: T·S
46
- - pattern: "\u0422\u0441"
47
- result: T·s
48
- - pattern: "\u0442\u0441"
49
- result: t·s
50
-
51
- characters:
52
- '\u0410': 'A'
53
- '\u0411': 'B'
54
- '\u0412': 'V'
55
- '\u0413': 'G'
56
- '\u0414': 'D'
57
- '\u0415': 'E'
58
- '\u0416': 'Zh'
59
- '\u0417': 'Z'
60
- '\u0418': 'I'
61
- '\u0419': 'Y'
62
- '\u041a': 'K'
63
- '\u041b': 'L'
64
- '\u041c': 'M'
65
- '\u041d': 'N'
66
- '\u041e': 'O'
67
- '\u041f': 'P'
68
- '\u0420': 'R'
69
- '\u0421': 'S'
70
- '\u0422': 'T'
71
- '\u0423': 'U'
72
- '\u0424': 'F'
73
- '\u0425': 'Kh'
74
- '\u0426': 'Ts'
75
- '\u0427': 'Ch'
76
- '\u0428': 'Sh'
77
- '\u0429': 'Sht'
78
- '\u042a': "U\u0306"
79
- '\u042c': "\\'"
80
- '\u042e': 'Yu'
81
- '\u042f': 'Ya'
82
- '\u0430': 'a'
83
- '\u0431': 'b'
84
- '\u0432': 'v'
85
- '\u0433': 'g'
86
- '\u0434': 'd'
87
- '\u0435': 'e'
88
- '\u0436': 'zh'
89
- '\u0437': 'z'
90
- '\u0438': 'i'
91
- '\u0439': 'y'
92
- '\u043a': 'k'
93
- '\u043b': 'l'
94
- '\u043c': 'm'
95
- '\u043d': 'n'
96
- '\u043e': 'o'
97
- '\u043f': 'p'
98
- '\u0440': 'r'
99
- '\u0441': 's'
100
- '\u0442': 't'
101
- '\u0443': 'u'
102
- '\u0444': 'f'
103
- '\u0445': 'kh'
104
- '\u0446': 'ts'
105
- '\u0447': 'ch'
106
- '\u0448': 'sh'
107
- '\u0449': 'sht'
108
- '\u044a': "u\u0306"
109
- '\u044c': "\\'"
110
- '\u044e': 'yu'
111
- '\u044f': 'ya'
112
-
113
- # note[2]
114
- '\u046A': "U\u0306" # Ѫ
115
- '\u046B': "u\u0306" # ѫ
116
-
117
- # note[3]
118
- '\u0462': "Ye" # Ѣ
119
- '\u0463': "ye" # ѣ
@@ -1,42 +0,0 @@
1
- ---
2
- authority_id: bgnpcgn
3
- id: 2013
4
- language: iso-639-2:bul
5
- source_script: Cyrl
6
- destination_script: Latn
7
- name: BGN/PCGN 2013 Agreement
8
- alias:
9
- ogc11122:
10
- code: bul_Cyrl2Latn_BGN_2013
11
- description: Bulgarian US Board on Geographic Names(BGN)/Permanent Committee on Geographical Names(PCGN) Bulgarian 2013 System
12
- url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/811509/ROMANIZATION_OF_BULGARIAN.pdf
13
- creation_date: 2013
14
- confirmation date: 2019-06
15
- description: |
16
- This system reflects the Bulgarian national system officially adopted
17
- by state decree in March 2009. It was adopted by BGN and PCGN in 2013,
18
- replacing the BGN/PCGN system of 1952.
19
-
20
- notes:
21
- - When in final position, “ия” is romanized as “ia” (e.g., София = Sofia; София-Град= Sofia-Grad).
22
- - An exception to the romanization system is allowed for the name of the state. Thus, България is romanized as Bulgaria.
23
- - The Romanization column shows only lowercase forms but, when romanizing, uppercase and lowercase Roman letters as appropriate should be used.
24
-
25
- tests:
26
- - source: София
27
- expected: Sofia
28
- - source: София-Град
29
- expected: Sofia-Grad
30
- - source: България
31
- expected: Bulgaria
32
-
33
- map:
34
- inherit: bgnpcgn-bul-Cyrl-Latn-1952
35
-
36
- rules:
37
- - pattern: България
38
- result: Bulgaria
39
- - pattern: (?<=\u0418)\u042f(?=\b) # final position, “ИЯ” is romanized as “IA”
40
- result: A
41
- - pattern: (?<=\u0438)\u044f(?=\b) # final position, “ия” is romanized as “ia”
42
- result: a