interscript 0.1.7 → 2.1.0b1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (314) hide show
  1. checksums.yaml +4 -4
  2. data/.gitignore +11 -0
  3. data/.rspec +3 -0
  4. data/Gemfile +29 -0
  5. data/LICENSE.adoc +31 -0
  6. data/README.md +3 -0
  7. data/Rakefile +116 -0
  8. data/bin/console +14 -0
  9. data/bin/interscript +5 -0
  10. data/bin/maps_analyze_staging +168 -0
  11. data/bin/maps_debug_compilers +58 -0
  12. data/bin/maps_debug_ordering +88 -0
  13. data/bin/maps_debug_ruby_compile +24 -0
  14. data/bin/maps_debug_step_by_step +44 -0
  15. data/bin/maps_optimize_order +112 -0
  16. data/bin/maps_v1_analyze_regexps +45 -0
  17. data/bin/maps_v1_to_v2 +426 -0
  18. data/bin/setup +8 -0
  19. data/exe/interscript +6 -0
  20. data/interscript.gemspec +31 -0
  21. data/lib/interscript.rb +83 -133
  22. data/lib/interscript/command.rb +5 -5
  23. data/lib/interscript/compiler.rb +22 -0
  24. data/lib/interscript/compiler/javascript.rb +292 -0
  25. data/lib/interscript/compiler/ruby.rb +262 -0
  26. data/lib/interscript/dsl.rb +68 -0
  27. data/lib/interscript/dsl/aliases.rb +23 -0
  28. data/lib/interscript/dsl/document.rb +46 -0
  29. data/lib/interscript/dsl/group.rb +45 -0
  30. data/lib/interscript/dsl/group/parallel.rb +6 -0
  31. data/lib/interscript/dsl/items.rb +89 -0
  32. data/lib/interscript/dsl/metadata.rb +68 -0
  33. data/lib/interscript/dsl/stage.rb +6 -0
  34. data/lib/interscript/dsl/symbol_mm.rb +11 -0
  35. data/lib/interscript/dsl/tests.rb +12 -0
  36. data/lib/interscript/interpreter.rb +251 -0
  37. data/lib/interscript/node.rb +25 -0
  38. data/lib/interscript/node/alias_def.rb +15 -0
  39. data/lib/interscript/node/dependency.rb +13 -0
  40. data/lib/interscript/node/document.rb +45 -0
  41. data/lib/interscript/node/group.rb +34 -0
  42. data/lib/interscript/node/group/parallel.rb +9 -0
  43. data/lib/interscript/node/group/sequential.rb +2 -0
  44. data/lib/interscript/node/item.rb +52 -0
  45. data/lib/interscript/node/item/alias.rb +42 -0
  46. data/lib/interscript/node/item/any.rb +76 -0
  47. data/lib/interscript/node/item/capture.rb +50 -0
  48. data/lib/interscript/node/item/group.rb +51 -0
  49. data/lib/interscript/node/item/repeat.rb +40 -0
  50. data/lib/interscript/node/item/stage.rb +23 -0
  51. data/lib/interscript/node/item/string.rb +51 -0
  52. data/lib/interscript/node/metadata.rb +18 -0
  53. data/lib/interscript/node/rule.rb +6 -0
  54. data/lib/interscript/node/rule/funcall.rb +18 -0
  55. data/lib/interscript/node/rule/run.rb +15 -0
  56. data/lib/interscript/node/rule/sub.rb +68 -0
  57. data/lib/interscript/node/stage.rb +19 -0
  58. data/lib/interscript/node/tests.rb +15 -0
  59. data/lib/interscript/stdlib.rb +211 -0
  60. data/lib/interscript/utils/regexp_converter.rb +283 -0
  61. data/lib/interscript/version.rb +1 -1
  62. data/lib/interscript/visualize.rb +61 -0
  63. data/lib/interscript/visualize/group.html.erb +59 -0
  64. data/lib/interscript/visualize/json.rb +57 -0
  65. data/lib/interscript/visualize/map.html.erb +46 -0
  66. data/lib/interscript/visualize/nodes.rb +89 -0
  67. data/requirements.txt +1 -0
  68. metadata +78 -416
  69. data/README.adoc +0 -298
  70. data/lib/g2pwrapper.py +0 -34
  71. data/lib/interscript/fs.rb +0 -69
  72. data/lib/interscript/mapping.rb +0 -142
  73. data/lib/interscript/opal.rb +0 -57
  74. data/lib/interscript/opal/entrypoint.rb +0 -12
  75. data/lib/interscript/opal/map_translate.rb +0 -7
  76. data/lib/interscript/opal/maps.js.erb +0 -10
  77. data/lib/model-7 +0 -0
  78. data/lib/tha-pt-b-7 +0 -0
  79. data/maps/acadsin-zho-Hani-Latn-2002.yaml +0 -38916
  80. data/maps/alalc-amh-Ethi-Latn-1997.yaml +0 -513
  81. data/maps/alalc-amh-Ethi-Latn-2011.yaml +0 -138
  82. data/maps/alalc-ara-Arab-Latn-1997.yaml +0 -1287
  83. data/maps/alalc-asm-Deva-Latn-1997.yaml +0 -165
  84. data/maps/alalc-asm-Deva-Latn-2012.yaml +0 -40
  85. data/maps/alalc-aze-Cyrl-Latn-1997.yaml +0 -145
  86. data/maps/alalc-bel-Cyrl-Latn-1997.yaml +0 -129
  87. data/maps/alalc-ben-Beng-Latn-2017.yaml +0 -130
  88. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +0 -98
  89. data/maps/alalc-ell-Grek-Latn-1997.yaml +0 -628
  90. data/maps/alalc-ell-Grek-Latn-2010.yaml +0 -626
  91. data/maps/alalc-guj-Gujr-Latn-1997.yaml +0 -266
  92. data/maps/alalc-guj-Gujr-Latn-2011.yaml +0 -64
  93. data/maps/alalc-hin-Deva-Latn-1997.yaml +0 -211
  94. data/maps/alalc-hin-Deva-Latn-2011.yaml +0 -47
  95. data/maps/alalc-kat-Geok-Latn-1997.yaml +0 -111
  96. data/maps/alalc-kat-Geor-Latn-1997.yaml +0 -150
  97. data/maps/alalc-kor-Hang-Latn-1997.yaml +0 -98
  98. data/maps/alalc-mal-Mlym-Latn-1997.yaml +0 -303
  99. data/maps/alalc-mal-Mlym-Latn-2012.yaml +0 -73
  100. data/maps/alalc-mar-Deva-Latn-1997.yaml +0 -189
  101. data/maps/alalc-mar-Deva-Latn-2011.yaml +0 -45
  102. data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +0 -114
  103. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +0 -103
  104. data/maps/alalc-mon-Cyrl-Latn-1997.yaml +0 -220
  105. data/maps/alalc-pan-Guru-Latn-1997.yaml +0 -256
  106. data/maps/alalc-pan-Guru-Latn-2011.yaml +0 -78
  107. data/maps/alalc-per-Arab-Latn-1997.yaml +0 -375
  108. data/maps/alalc-pli-Deva-Latn-2012.yaml +0 -144
  109. data/maps/alalc-pra-Deva-Latn-2012.yaml +0 -47
  110. data/maps/alalc-rus-Cyrl-Latn-1997.yaml +0 -225
  111. data/maps/alalc-rus-Cyrl-Latn-2012.yaml +0 -162
  112. data/maps/alalc-san-Deva-Latn-2012.yaml +0 -172
  113. data/maps/alalc-sin-Sinh-Latn-1997.yaml +0 -292
  114. data/maps/alalc-sin-Sinh-Latn-2011.yaml +0 -71
  115. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +0 -118
  116. data/maps/alalc-srp-Cyrl-Latn-2013.yaml +0 -135
  117. data/maps/alalc-tam-Taml-Latn-1997.yaml +0 -62
  118. data/maps/alalc-tam-Taml-Latn-2011.yaml +0 -58
  119. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +0 -145
  120. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +0 -16
  121. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +0 -283
  122. data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +0 -174
  123. data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +0 -169
  124. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +0 -292
  125. data/maps/bgn-kor-Hang-Latn-1943.yaml +0 -35
  126. data/maps/bgn-kor-Kore-Latn-1943.yaml +0 -31
  127. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +0 -208
  128. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +0 -208
  129. data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +0 -532
  130. data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +0 -596
  131. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +0 -108
  132. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +0 -104
  133. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +0 -188
  134. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +0 -289
  135. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +0 -119
  136. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +0 -42
  137. data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +0 -184
  138. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +0 -705
  139. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +0 -23
  140. data/maps/bgnpcgn-fas-Arab-Latn-1956.yaml +0 -96
  141. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +0 -257
  142. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +0 -131
  143. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +0 -42
  144. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +0 -253
  145. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +0 -48
  146. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +0 -48
  147. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +0 -163
  148. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +0 -190
  149. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +0 -223
  150. data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +0 -230
  151. data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +0 -336
  152. data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +0 -639
  153. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +0 -459
  154. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +0 -168
  155. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +0 -318
  156. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +0 -170
  157. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +0 -220
  158. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +0 -240
  159. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +0 -166
  160. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +0 -119
  161. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +0 -127
  162. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +0 -82
  163. data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +0 -7456
  164. data/maps/bis-asm-Beng-Latn-13194-1991.yaml +0 -159
  165. data/maps/bis-ben-Beng-Latn-13194-1991.yaml +0 -156
  166. data/maps/bis-dev-Deva-Latn-13194-1991.yaml +0 -184
  167. data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +0 -181
  168. data/maps/bis-knd-Knda-Latn-13194-1991.yaml +0 -173
  169. data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +0 -176
  170. data/maps/bis-ori-Orya-Latn-13194-1991.yaml +0 -160
  171. data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +0 -175
  172. data/maps/bis-tel-Telu-Latn-13194-1991.yaml +0 -170
  173. data/maps/bis-tml-Taml-Latn-13194-1991.yaml +0 -155
  174. data/maps/by-bel-Cyrl-Latn-1998.yaml +0 -172
  175. data/maps/by-bel-Cyrl-Latn-2007.yaml +0 -115
  176. data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +0 -899
  177. data/maps/din-hin-Deva-Latn-33904-2018.yaml +0 -100
  178. data/maps/din-kat-Geor-Latn-32707-2010.yaml +0 -145
  179. data/maps/din-mar-Deva-Latn-33904-2018.yaml +0 -84
  180. data/maps/din-nep-Deva-Latn-33904-2018.yaml +0 -119
  181. data/maps/din-pli-Deva-Latn-33904-2018.yaml +0 -75
  182. data/maps/din-pra-Deva-Latn-33904-2018.yaml +0 -63
  183. data/maps/din-san-Deva-Latn-33904-2018.yaml +0 -338
  184. data/maps/din-tam-Taml-Latn-33903-2016.yaml +0 -213
  185. data/maps/dos-nep-Deva-Latn-1997.yaml +0 -47
  186. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +0 -684
  187. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +0 -680
  188. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +0 -19
  189. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +0 -31
  190. data/maps/ggg-kat-Geor-Latn-2002.yaml +0 -92
  191. data/maps/gki-bel-Cyrl-Latn-1992.yaml +0 -33
  192. data/maps/gki-bel-Cyrl-Latn-2000.yaml +0 -201
  193. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +0 -190
  194. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +0 -157
  195. data/maps/hk-yue-Hani-Latn-1888.yaml +0 -38497
  196. data/maps/icao-bel-Cyrl-Latn-9303.yaml +0 -136
  197. data/maps/icao-bul-Cyrl-Latn-9303.yaml +0 -118
  198. data/maps/icao-fas-Arab-Latn-9303.yaml +0 -103
  199. data/maps/icao-heb-Hebr-Latn-9303.yaml +0 -151
  200. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +0 -117
  201. data/maps/icao-rus-Cyrl-Latn-9303.yaml +0 -117
  202. data/maps/icao-srp-Cyrl-Latn-9303.yaml +0 -117
  203. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +0 -119
  204. data/maps/iso-ara-Arab-Latn-233-1984.yaml +0 -323
  205. data/maps/iso-asm-Beng-Latn-15919-2001.yaml +0 -75
  206. data/maps/iso-ben-Beng-Latn-15919-2001.yaml +0 -175
  207. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +0 -613
  208. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +0 -44
  209. data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +0 -220
  210. data/maps/iso-hin-Deva-Latn-15919-2001.yaml +0 -87
  211. data/maps/iso-inc-Deva-Latn-15919-2001.yaml +0 -61
  212. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +0 -66
  213. data/maps/iso-kan-Knda-Latn-15919-2001.yaml +0 -220
  214. data/maps/iso-kat-Geor-Latn-9984-1996.yaml +0 -145
  215. data/maps/iso-kor-Hang-Latn-1996-method1.yaml +0 -240
  216. data/maps/iso-kor-Hang-Latn-1996-method2.yaml +0 -226
  217. data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +0 -281
  218. data/maps/iso-mar-Deva-Latn-15919-2001.yaml +0 -75
  219. data/maps/iso-nep-Deva-Latn-15919-2001.yaml +0 -87
  220. data/maps/iso-ori-Orya-Latn-15919-2001.yaml +0 -193
  221. data/maps/iso-pan-Guru-Latn-15919-2001.yaml +0 -222
  222. data/maps/iso-pli-Beng-Latn-15919-2001.yaml +0 -73
  223. data/maps/iso-pli-Deva-Latn-15919-2001.yaml +0 -74
  224. data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +0 -219
  225. data/maps/iso-pli-Thai-Latn-15919-2001.yaml +0 -55
  226. data/maps/iso-pra-Deva-Latn-15919-2001.yaml +0 -59
  227. data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +0 -366
  228. data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +0 -271
  229. data/maps/iso-san-Deva-Latn-15919-2001.yaml +0 -220
  230. data/maps/iso-tam-Taml-Latn-15919-2001.yaml +0 -159
  231. data/maps/iso-tel-Telu-Latn-15919-2001.yaml +0 -220
  232. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +0 -109
  233. data/maps/kp-kor-Hang-Latn-2002.yaml +0 -909
  234. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +0 -44820
  235. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +0 -411
  236. data/maps/mns-mon-Cyrl-Latn-5217-2012.yaml +0 -163
  237. data/maps/mns-mon-Latn-Cyrl-5217-2012.yaml +0 -200
  238. data/maps/moct-kor-Hang-Latn-2000.yaml +0 -807
  239. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +0 -541
  240. data/maps/mvd-bel-Cyrl-Latn-2008.yaml +0 -225
  241. data/maps/mvd-bel-Cyrl-Latn-2010.yaml +0 -63
  242. data/maps/mvd-rus-Cyrl-Latn-2008.yaml +0 -109
  243. data/maps/mvd-rus-Cyrl-Latn-2010.yaml +0 -37
  244. data/maps/odni-ara-Arab-Latn-2015.yaml +0 -425
  245. data/maps/odni-aze-Cyrl-Latn-2015.yaml +0 -144
  246. data/maps/odni-bel-Cyrl-Latn-2015.yaml +0 -148
  247. data/maps/odni-bul-Cyrl-Latn-2015.yaml +0 -96
  248. data/maps/odni-che-Cyrl-Latn-2015.yaml +0 -169
  249. data/maps/odni-fas-Arab-Latn-2015.yaml +0 -406
  250. data/maps/odni-hin-Deva-Latn-2015.yaml +0 -258
  251. data/maps/odni-kat-Geor-Latn-2015.yaml +0 -87
  252. data/maps/odni-kaz-Cyrl-Latn-2015.yaml +0 -148
  253. data/maps/odni-kir-Cyrl-Latn-2015.yaml +0 -136
  254. data/maps/odni-kor-Hang-Latn-2015.yaml +0 -375
  255. data/maps/odni-mkd-Cyrl-Latn-2015.yaml +0 -122
  256. data/maps/odni-per-Arab-Latn-2015.yaml +0 -228
  257. data/maps/odni-rus-Cyrl-Latn-2015.yaml +0 -77
  258. data/maps/odni-srp-Cyrl-Latn-2015.yaml +0 -129
  259. data/maps/odni-tat-Cyrl-Latn-2015.yaml +0 -142
  260. data/maps/odni-tgk-Cyrl-Latn-2015.yaml +0 -148
  261. data/maps/odni-uig-Cyrl-Latn-2015.yaml +0 -138
  262. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +0 -157
  263. data/maps/odni-urd-Arab-Latn-2015.yaml +0 -221
  264. data/maps/odni-uzb-Cyrl-Latn-2015.yaml +0 -166
  265. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +0 -90
  266. data/maps/royin-tha-Thai-Latn-1968.yaml +0 -183
  267. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +0 -180
  268. data/maps/royin-tha-Thai-Latn-1999.yaml +0 -80
  269. data/maps/sac-zho-Hans-Latn-1979.yaml +0 -24763
  270. data/maps/sasm-mon-Mong-Latn-general-1978.yaml +0 -389
  271. data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +0 -354
  272. data/maps/ses-ara-Arab-Latn-1930.yaml +0 -283
  273. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +0 -222
  274. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +0 -197
  275. data/maps/ua-ukr-Cyrl-Latn-2007.yaml +0 -75
  276. data/maps/ua-ukr-Cyrl-Latn-2010.yaml +0 -192
  277. data/maps/un-amh-Ethi-Latn-2016.yaml +0 -602
  278. data/maps/un-ara-Arab-Latn-1971.yaml +0 -139
  279. data/maps/un-ara-Arab-Latn-1972.yaml +0 -159
  280. data/maps/un-ara-Arab-Latn-2017.yaml +0 -420
  281. data/maps/un-bel-Cyrl-Latn-2007.yaml +0 -114
  282. data/maps/un-ben-Beng-Latn-2016.yaml +0 -534
  283. data/maps/un-ell-Grek-Latn-1987-phonetic.yaml +0 -780
  284. data/maps/un-ell-Grek-Latn-1987-tl.yaml +0 -31
  285. data/maps/un-ell-Grek-Latn-1987-ts.yaml +0 -19
  286. data/maps/un-hin-Deva-Latn-2016.yaml +0 -222
  287. data/maps/un-mar-Deva-Latn-2016.yaml +0 -91
  288. data/maps/un-mon-Mong-Latn-general-2013.yaml +0 -264
  289. data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +0 -264
  290. data/maps/un-nep-Deva-Latn-1972.yaml +0 -350
  291. data/maps/un-nep-Deva-Latn-2013.yaml +0 -74
  292. data/maps/un-rus-Cyrl-Latn-1987.yaml +0 -166
  293. data/maps/un-ukr-Cyrl-Latn-1998.yaml +0 -53
  294. data/maps/un-ukr-Cyrl-Latn-2012.yaml +0 -162
  295. data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +0 -221
  296. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +0 -406
  297. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +0 -386
  298. data/maps/var-kor-Hang-Hang-jamo.yaml +0 -11193
  299. data/maps/var-kor-Hang-Latn-mr-1939.yaml +0 -1054
  300. data/maps/var-kor-Kore-Hang-2013.yaml +0 -59754
  301. data/maps/var-kor-Kore-Latn-mr-1939.yaml +0 -36
  302. data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +0 -43
  303. data/maps/var-mon-Mong-Latn-1930.yaml +0 -102
  304. data/maps/var-mon-Mong-Latn-lessing.yaml +0 -272
  305. data/maps/var-mon-Mong-Latn-vpmc.yaml +0 -274
  306. data/maps/var-pra-Deva-Latn-iast-1912.yaml +0 -30
  307. data/maps/var-san-Deva-Latn-iast-1912.yaml +0 -149
  308. data/maps/var-tha-Thai-Thai-phonemic.yaml +0 -59
  309. data/maps/var-tha-Thai-Zsym-ipa.yaml +0 -301
  310. data/maps/var-zho-Hani-Latn-wd-1979.yaml +0 -38912
  311. data/spec/interscript/filenames_spec.rb +0 -384
  312. data/spec/interscript/mapping_spec.rb +0 -42
  313. data/spec/interscript_spec.rb +0 -29
  314. data/spec/spec_helper.rb +0 -3
@@ -1,411 +0,0 @@
1
- ---
2
- authority_id: mext
3
- id: 1954
4
- language: iso-639-2:jpn
5
- source_script: Hrkt
6
- destination_script: Latn
7
- name: 内閣告示第一号 -- ローマ字のつづり方
8
- url: http://www.mext.go.jp/b_menu/hakusho/nc/k19541209001/k19541209001.html
9
- creation_date: 1954
10
- adoption_date: 1954-12-09 # 昭和二十九年十二月九日
11
- description:
12
- jp: |
13
- 国語を書き表わす場合に用いるローマ字のつづり方を次のように定める。
14
-
15
- まえがき
16
- 1 一般に国語を書き表わす場合は、第1表に掲げたつづり方によるものとする。
17
- 2 国際的関係その他従来の慣例をにわかに改めがたい事情にある場合に限り、第2表に掲げたつづり方によつてもさしつかえない。
18
- 3 前二項のいずれの場合においても、おおむねそえがきを適用する。
19
- en: |
20
- The spelling method for Roman characters used when writing the Japanese language is as follows.
21
-
22
- Preface
23
- 1. In general, when the language is written, the spelling shown in Table 1 shall be used.
24
- 2. The spelling methods listed in Table 2 can be used only when there is a situation that is difficult to change due to international relations or other conventional practices.
25
- 3. In either case of the preceding two paragraphs, the supplementary notes shall generally apply.
26
-
27
- notes:
28
- - jp: はねる音「ン」はすべてnと書く。
29
- en: ン / ん is always romanized as n in Kunrei-siki
30
- - jp: はねる音を表わすnと次にくる母音字またはyとを切り離す必要がある場合には、nの次に’を入れる。
31
- en: When it is necessary to separate the n sound from a following vowel or y, an apostrophe is added after the n.
32
- - jp: つまる音は、最初の子音字を重ねて表わす。
33
- en: The clogged sound is represented by overlapping the first consonant characters.
34
- - jp: 長音は母音字の上に^をつけて表わす。なお、大文字の場合は母音字を並べてもよい。
35
- en: Long vowels are expressed in Kunrei-siki by placing a circumflex (^) over a vowel. In the case of capital letters, vowel characters may be arranged.
36
- - jp: 特殊音の書き表わし方は自由とする。
37
- en: The way of writing special sounds is free.
38
- - jp: 文の書きはじめ、および固有名詞は語頭を大文字で書く。なお、固有名詞以外の名詞の語頭を大文字で書いてもよい。
39
- en: Begin writing sentences and proper nouns with capital letters. Note that the beginning of nouns other than proper nouns may be written in capital letters.
40
-
41
-
42
- tests:
43
- - source: かんおう
44
- expected: kan'ô
45
- - source: かのう
46
- expected: kanô
47
- - source: きんゆう
48
- expected: kin'yû
49
- - source: とうきょう
50
- expected: tôkyô
51
- - source: がっこう
52
- expected: gakkô
53
- - source: かごっま
54
- expected: kagomma
55
- - source: ぽっぽっや
56
- expected: poppoyya
57
- - source: てっら
58
- expected: terra
59
- - source: にゃっほー
60
- expected: nyahhô
61
- - source: ゴッホ
62
- expected: gohho
63
-
64
- map:
65
- rules:
66
- - pattern: "([んン])(?=[あいうえおやゆよアイウエオヤユヨ])"
67
- result: "\\1'"
68
-
69
- postrules:
70
- # Handling of っ/ッ
71
- #
72
- # The kana っ/ッ is a geminate marker.
73
- # When followed by a consonant, repeat the first letter of
74
- # the following syllable.
75
- #
76
- # If っ/ッ is not followed by a consonant, then it is usually
77
- # phonetically realised as an abrupt stop or shortening of
78
- # the previous syllable. There is no documented or commonly
79
- # accepted way to transliterate this sound.
80
-
81
- - pattern: "[っッ]([BbCcDdFfGgHhJjKkLlMmNnPpQqRrSsTtVvWwXxYyZz])" # っ or ッ followed by consonant
82
- result: "\\1\\1"
83
- - pattern: "[っッ]" # drop all other っッ.
84
- result: ""
85
-
86
- - pattern: "a[ーa]"
87
- result: "â"
88
- - pattern: "i[ーi]"
89
- result: "î"
90
- - pattern: "u[ーu]"
91
- result: "û"
92
- - pattern: "e[ーe]"
93
- result: "ê"
94
- - pattern: "o[ーo]"
95
- result: "ô"
96
-
97
- characters:
98
- "あ": "a"
99
- "い": "i"
100
- "う": "u"
101
- "え": "e"
102
- "お": "o"
103
-
104
- # Long vowels, note 4
105
- "おう": "ô"
106
-
107
-
108
- "か": "ka"
109
- "き": "ki"
110
- "く": "ku"
111
- "け": "ke"
112
- "こ": "ko"
113
- "きゃ": "kya"
114
- "きゅ": "kyu"
115
- "きょ": "kyo"
116
- "きょう": "kyô"
117
- "こう": "kô"
118
-
119
- "さ": "sa"
120
- "し": "si"
121
- "す": "su"
122
- "せ": "se"
123
- "そ": "so"
124
- "しゃ": "sya"
125
- "しゅ": "syu"
126
- "しょ": "syo"
127
- "しょう": "syô"
128
- "そう": "sô"
129
-
130
- "た": "ta"
131
- "ち": "ti"
132
- "つ": "tu"
133
- "て": "te"
134
- "と": "to"
135
- "ちゃ": "tya"
136
- "ちゅ": "tyu"
137
- "ちょ": "tyo"
138
- "ちょう": "tyô"
139
- "とう": "tô"
140
-
141
- "な": "na"
142
- "に": "ni"
143
- "ぬ": "nu"
144
- "ね": "ne"
145
- "の": "no"
146
- "にゃ": "nya"
147
- "にゅ": "nyu"
148
- "にょ": "nyo"
149
- "にょう": "nyô"
150
- "のう": "nô"
151
-
152
- "は": "ha"
153
- "ひ": "hi"
154
- "ふ": "hu"
155
- "へ": "he"
156
- "ほ": "ho"
157
- "ひゃ": "hya"
158
- "ひゅ": "hyu"
159
- "ひょ": "hyo"
160
- "ひょう": "hyô"
161
- "ほう": "hô"
162
-
163
- "ま": "ma"
164
- "み": "mi"
165
- "む": "mu"
166
- "め": "me"
167
- "も": "mo"
168
- "みゃ": "mya"
169
- "みゅ": "myu"
170
- "みょ": "myo"
171
- "みょう": "myô"
172
- "もう": "mô"
173
-
174
- "や": "ya"
175
- "ゆ": "yu"
176
- "よ": "yo"
177
- "よう": "yô"
178
-
179
- "ら": "ra"
180
- "り": "ri"
181
- "る": "ru"
182
- "れ": "re"
183
- "ろ": "ro"
184
- "りゃ": "rya"
185
- "りゅ": "ryu"
186
- "りょ": "ryo"
187
- "りょう": "ryô"
188
- "ろう": "rô"
189
-
190
- "わ": "wa"
191
- "を": "o"
192
-
193
- "が": "ga"
194
- "ぎ": "gi"
195
- "ぐ": "gu"
196
- "げ": "ge"
197
- "ご": "go"
198
- "ぎゃ": "gya"
199
- "ぎゅ": "gyu"
200
- "ぎょ": "gyo"
201
- "ぎゅう": "gyû"
202
- "ぎょう": "gyô"
203
- "ごう": "gô"
204
-
205
- "ざ": "za"
206
- "じ": "zi"
207
- "ず": "zu"
208
- "ぜ": "ze"
209
- "ぞ": "zo"
210
- "じゃ": "zya"
211
- "じゅ": "zyu"
212
- "じょ": "zyo"
213
- "じょう": "zyô"
214
- "ぞう": "zô"
215
-
216
-
217
- "だ": "da"
218
- "ぢ": "zi"
219
- "づ": "zu"
220
- "で": "de"
221
- "ど": "do"
222
- "ぢゃ": "zya"
223
- "ぢゅ": "zyu"
224
- "ぢょ": "zyo"
225
- "ぢょう": "zyô"
226
- "どう": "dô"
227
-
228
- "ば": "ba"
229
- "び": "bi"
230
- "ぶ": "bu"
231
- "べ": "be"
232
- "ぼ": "bo"
233
- "びゃ": "bya"
234
- "びゅ": "byu"
235
- "びょ": "byo"
236
- "びょう": "byô"
237
- "ぼう": "bô"
238
-
239
- "ぱ": "pa"
240
- "ぴ": "pi"
241
- "ぷ": "pu"
242
- "ぺ": "pe"
243
- "ぽ": "po"
244
- "ぴゃ": "pya"
245
- "ぴゅ": "pyu"
246
- "ぴょ": "pyo"
247
- "ぴょう": "pyô"
248
- "ぽう": "pô"
249
-
250
- "ん": "n" # See notes 1 and 2
251
-
252
-
253
- # Note 3. つまる音は、最初の子音字を重ねて表わす。
254
- # Handled by postrules
255
-
256
- # Katakana
257
-
258
- "ア": "a"
259
- "イ": "i"
260
- "ウ": "u"
261
- "エ": "e"
262
- "オ": "o"
263
-
264
- # Long vowels, note 4
265
- "オウ": "ô"
266
-
267
- "カ": "ka"
268
- "キ": "ki"
269
- "ク": "ku"
270
- "ケ": "ke"
271
- "コ": "ko"
272
- "キャ": "kya"
273
- "キュ": "kyu"
274
- "キョ": "kyo"
275
- "キョウ": "kyô"
276
- "コウ": "kô"
277
-
278
- "サ": "sa"
279
- "シ": "si"
280
- "ス": "su"
281
- "セ": "se"
282
- "ソ": "so"
283
- "シャ": "sya"
284
- "シュ": "syu"
285
- "ショ": "syo"
286
- "ショウ": "syô"
287
- "ソウ": "sô"
288
-
289
- "タ": "ta"
290
- "チ": "ti"
291
- "ツ": "tu"
292
- "テ": "te"
293
- "ト": "to"
294
- "チャ": "tya"
295
- "チュ": "tyu"
296
- "チョ": "tyo"
297
- "チョウ": "tyô"
298
- "トウ": "tô"
299
-
300
- "ナ": "na"
301
- "ニ": "ni"
302
- "ヌ": "nu"
303
- "ネ": "ne"
304
- "ノ": "no"
305
- "ニャ": "nya"
306
- "ニュ": "nyu"
307
- "ニョ": "nyo"
308
- "ニョウ": "nyô"
309
- "ノウ": "nô"
310
-
311
- "ハ": "ha"
312
- "ヒ": "hi"
313
- "フ": "hu"
314
- "ヘ": "he"
315
- "ホ": "ho"
316
- "ヒャ": "hya"
317
- "ヒュ": "hyu"
318
- "ヒョ": "hyo"
319
- "ヒョウ": "hyô"
320
- "ホウ": "hô"
321
-
322
- "マ": "ma"
323
- "ミ": "mi"
324
- "ム": "mu"
325
- "メ": "me"
326
- "モ": "mo"
327
- "ミャ": "mya"
328
- "ミュ": "myu"
329
- "ミョ": "myo"
330
- "ミョウ": "myô"
331
- "モウ": "mô"
332
-
333
- "ヤ": "ya"
334
- "ユ": "yu"
335
- "ヨ": "yo"
336
- "ヨウ": "yô"
337
-
338
- "ラ": "ra"
339
- "リ": "ri"
340
- "ル": "ru"
341
- "レ": "re"
342
- "ロ": "ro"
343
- "リャ": "rya"
344
- "リュ": "ryu"
345
- "リョ": "ryo"
346
- "リョウ": "ryô"
347
- "ロウ": "rô"
348
-
349
- "ワ": "wa"
350
- "ヲ": "o"
351
-
352
- "ガ": "ga"
353
- "ギ": "gi"
354
- "グ": "gu"
355
- "ゲ": "ge"
356
- "ゴ": "go"
357
- "ギャ": "gya"
358
- "ギュ": "gyu"
359
- "ギョ": "gyo"
360
- "ギョウ": "gyô"
361
- "ゴウ": "gô"
362
-
363
- "ザ": "za"
364
- "ジ": "zi"
365
- "ズ": "zu"
366
- "ゼ": "ze"
367
- "ゾ": "zo"
368
- "ジャ": "zya"
369
- "ジュ": "zyu"
370
- "ジョ": "zyo"
371
- "ジョウ": "zyô"
372
- "ゾウ": "zô"
373
-
374
- "ダ": "da"
375
- "ヂ": "zi"
376
- "ヅ": "zu"
377
- "デ": "de"
378
- "ド": "do"
379
- "ヂャ": "zya"
380
- "ヂュ": "zyu"
381
- "ヂョ": "zyo"
382
- "ヂョウ": "zyô"
383
- "ドウ": "dô"
384
-
385
- "バ": "ba"
386
- "ビ": "bi"
387
- "ブ": "bu"
388
- "ベ": "be"
389
- "ボ": "bo"
390
- "ビャ": "bya"
391
- "ビュ": "byu"
392
- "ビョ": "byo"
393
- "ビョウ": "byô"
394
- "ボウ": "bô"
395
-
396
- "パ": "pa"
397
- "ピ": "pi"
398
- "プ": "pu"
399
- "ペ": "pe"
400
- "ポ": "po"
401
- "ピャ": "pya"
402
- "ピュ": "pyu"
403
- "ピョ": "pyo"
404
- "ピョウ": "pyô"
405
- "ポウ": "pô"
406
-
407
- "ン": "n" # See note 1
408
-
409
-
410
- # Note 3. つまる音は、最初の子音字を重ねて表わす。
411
- # Handled by postrules
@@ -1,163 +0,0 @@
1
- ---
2
- authority_id: mns
3
- id: 2012
4
- language: iso-639-2:mon
5
- source_script: Cyrl
6
- destination_script: Latn
7
- name: Transliteration of Mongolian Cyrillic characters into Latin
8
- url: http://estandard.gov.mn/standard/reader/4635
9
- creation_date:
10
- confirmation_date: 2012-02
11
- description: |
12
- The standard MNS 5217:2012 is a standard of the Mongolian Agency for Standardization and Metrology
13
- for transliteration of Cyrillic Mongolian into the Latin alphabet. It repeats and supplements the previous
14
- standard dating from 2003 (MNS 5217:2003).
15
-
16
- This standard differs from the ISO 9 system for Cyrillic adopted by Russia, Armenia, Azerbaijan,
17
- Belarus, Kazakhstan, Kyrgyzstan, Uzbekistan, Tajikistan and Turkmenistan.
18
-
19
- tests:
20
- - source: Аварга, халбага, аав
21
- expected: Avarga, khalbaga, aav
22
- - source: Бага, самбар
23
- expected: Baga, sambar
24
- - source: Аварга, вагон, сав
25
- expected: Avarga, vagon, sav
26
- - source: Газар, гэрээ, хэрэг
27
- expected: Gazar, geree, khereg
28
- - source: Дадлага, ахмад
29
- expected: Dadlaga, akhmad
30
- - source: Еэвэн, ерөөл
31
- expected: Yeeven, yerööl
32
- - source: Ёроол, оёдол
33
- expected: Yorool, oyodol
34
- - source: Жуулчин, ажил, Жон
35
- expected: Juulchin, ajil, Jon
36
- - source: Зам, азарга, бааз
37
- expected: Zam, azarga, baaz
38
- - source: Кино, километр, академи
39
- expected: Kino, kilomyetr, akadyemi # Kino, kilometr, akademi - Provided sample is wrong
40
- - source: Ишиг, бичиг, хань
41
- expected: Ishig, bichig, khani
42
- - source: Ийм, ээжийн
43
- expected: Iim, eejiin
44
- - source: Лам, алаг, мал
45
- expected: Lam, alag, mal
46
- - source: Мал, хамар, нам
47
- expected: Mal, khamar, nam
48
- - source: Нар, хана, үнэн
49
- expected: Nar, khana, ünen
50
- - source: Орон, боловсрол, тооно
51
- expected: Oron, bolovsrol, toono
52
- - source: Өдөр, өнөөдөр, өөрөөсөө
53
- expected: Ödör, önöödör, ööröösöö
54
- - source: Пуужин, апарат
55
- expected: Puujin, aparat
56
- - source: Рашаан, радио, сар
57
- expected: Rashaan, radio, sar
58
- - source: Сар, асар, эцэс
59
- expected: Sar, asar, etses
60
- - source: Тамга, татлага
61
- expected: Tamga, tatlaga
62
- - source: Уран, нуруу
63
- expected: Uran, nuruu
64
- - source: Үнэн, түргэн, тэргүүн
65
- expected: Ünen, türgen, tergüün
66
- - source: Фото, фонд
67
- expected: Foto, fond
68
- - source: Хавар, нөхөр, эх
69
- expected: Khavar, nökhör, ekh
70
- - source: Цацаг, цэцэг
71
- expected: Tsatsag, tsetseg
72
- - source: Чимэг, чадал, ач
73
- expected: Chimeg, chadal, ach
74
- - source: Шашин, ааш
75
- expected: Shashin, aash
76
- - source: Щедрин, щорс
77
- expected: Shyedrin, shors # Shedrin, Shors - Provided sample is wrong
78
- - source: Оръё, суръя, гаръя
79
- expected: Oriyo, suriya, gariya
80
- - source: Хааны, ахын
81
- expected: Khaany, akhyn
82
- - source: Харь, барь
83
- expected: Khari, bari
84
- - source: Эзэн, энэ, эмээл
85
- expected: Ezen, ene, emeel
86
- - source: Юм, юүдэн
87
- expected: Yum, yuüden
88
- - source: Ямар, ядуу, ая
89
- expected: Yamar, yaduu, aya
90
-
91
- map:
92
-
93
- characters:
94
- "А": "A" # \u0410
95
- "Б": "B" # \u0411
96
- "В": "V" # \u0412
97
- "Г": "G" # \u0413
98
- "Д": "D" # \u0414
99
- "Е": "Ye" # \u0415
100
- "Ё": "Yo" # \u0401
101
- "Ж": "J" # \u0416
102
- "З": "Z" # \u0417
103
- "И": "I" # \u0418
104
- "Й": "I" # \u0419
105
- "К": "K" # \u041a
106
- "Л": "L" # \u041b
107
- "М": "M" # \u041c
108
- "Н": "N" # \u041d
109
- "О": "O" # \u041e
110
- "Ө": "Ö" # \u04e8
111
- "П": "P" # \u041f
112
- "Р": "R" # \u0420
113
- "С": "S" # \u0421
114
- "Т": "T" # \u0422
115
- "У": "U" # \u0423
116
- "Ү": "Ü" # \u04ae
117
- "Ф": "F" # \u0424
118
- "Х": "Kh" # \u0425
119
- "Ц": "Ts" # \u0426
120
- "Ч": "Ch" # \u0427
121
- "Ш": "Sh" # \u0428
122
- "Щ": "Sh" # \u0429
123
- "Ъ": "I" # \u042a
124
- "Ы": "Y" # \u042b
125
- "Ь": "I" # \u042c
126
- "Э": "E" # \u042d
127
- "Ю": "Yu" # \u042e
128
- "Я": "Ya" # \u042f
129
- "а": "a" # \u0430
130
- "б": "b" # \u0431
131
- "в": "v" # \u0432
132
- "г": "g" # \u0433
133
- "д": "d" # \u0434
134
- "е": "ye" # \u0435
135
- "ё": "yo" # \u0451
136
- "ж": "j" # \u0436
137
- "з": "z" # \u0437
138
- "и": "i" # \u0438
139
- "й": "i" # \u0439
140
- "к": "k" # \u043a
141
- "л": "l" # \u043b
142
- "м": "m" # \u043c
143
- "н": "n" # \u043d
144
- "о": "o" # \u043e
145
- "ө": "ö" # \u04e9
146
- "п": "p" # \u043f
147
- "р": "r" # \u0440
148
- "с": "s" # \u0441
149
- "т": "t" # \u0442
150
- "у": "u" # \u0443
151
- "ү": "ü" # \u04af
152
- "ф": "f" # \u0444
153
- "х": "kh" # \u0445
154
- "ц": "ts" # \u0446
155
- "ч": "ch" # \u0447
156
- "ш": "sh" # \u0448
157
- "щ": "sh" # \u0449
158
- "ъ": "i" # \u044a
159
- "ы": "y" # \u044b
160
- "ь": "i" # \u044c
161
- "э": "e" # \u044d
162
- "ю": "yu" # \u044e
163
- "я": "ya" # \u044f