interscript 0.1.7 → 2.1.0b1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (314) hide show
  1. checksums.yaml +4 -4
  2. data/.gitignore +11 -0
  3. data/.rspec +3 -0
  4. data/Gemfile +29 -0
  5. data/LICENSE.adoc +31 -0
  6. data/README.md +3 -0
  7. data/Rakefile +116 -0
  8. data/bin/console +14 -0
  9. data/bin/interscript +5 -0
  10. data/bin/maps_analyze_staging +168 -0
  11. data/bin/maps_debug_compilers +58 -0
  12. data/bin/maps_debug_ordering +88 -0
  13. data/bin/maps_debug_ruby_compile +24 -0
  14. data/bin/maps_debug_step_by_step +44 -0
  15. data/bin/maps_optimize_order +112 -0
  16. data/bin/maps_v1_analyze_regexps +45 -0
  17. data/bin/maps_v1_to_v2 +426 -0
  18. data/bin/setup +8 -0
  19. data/exe/interscript +6 -0
  20. data/interscript.gemspec +31 -0
  21. data/lib/interscript.rb +83 -133
  22. data/lib/interscript/command.rb +5 -5
  23. data/lib/interscript/compiler.rb +22 -0
  24. data/lib/interscript/compiler/javascript.rb +292 -0
  25. data/lib/interscript/compiler/ruby.rb +262 -0
  26. data/lib/interscript/dsl.rb +68 -0
  27. data/lib/interscript/dsl/aliases.rb +23 -0
  28. data/lib/interscript/dsl/document.rb +46 -0
  29. data/lib/interscript/dsl/group.rb +45 -0
  30. data/lib/interscript/dsl/group/parallel.rb +6 -0
  31. data/lib/interscript/dsl/items.rb +89 -0
  32. data/lib/interscript/dsl/metadata.rb +68 -0
  33. data/lib/interscript/dsl/stage.rb +6 -0
  34. data/lib/interscript/dsl/symbol_mm.rb +11 -0
  35. data/lib/interscript/dsl/tests.rb +12 -0
  36. data/lib/interscript/interpreter.rb +251 -0
  37. data/lib/interscript/node.rb +25 -0
  38. data/lib/interscript/node/alias_def.rb +15 -0
  39. data/lib/interscript/node/dependency.rb +13 -0
  40. data/lib/interscript/node/document.rb +45 -0
  41. data/lib/interscript/node/group.rb +34 -0
  42. data/lib/interscript/node/group/parallel.rb +9 -0
  43. data/lib/interscript/node/group/sequential.rb +2 -0
  44. data/lib/interscript/node/item.rb +52 -0
  45. data/lib/interscript/node/item/alias.rb +42 -0
  46. data/lib/interscript/node/item/any.rb +76 -0
  47. data/lib/interscript/node/item/capture.rb +50 -0
  48. data/lib/interscript/node/item/group.rb +51 -0
  49. data/lib/interscript/node/item/repeat.rb +40 -0
  50. data/lib/interscript/node/item/stage.rb +23 -0
  51. data/lib/interscript/node/item/string.rb +51 -0
  52. data/lib/interscript/node/metadata.rb +18 -0
  53. data/lib/interscript/node/rule.rb +6 -0
  54. data/lib/interscript/node/rule/funcall.rb +18 -0
  55. data/lib/interscript/node/rule/run.rb +15 -0
  56. data/lib/interscript/node/rule/sub.rb +68 -0
  57. data/lib/interscript/node/stage.rb +19 -0
  58. data/lib/interscript/node/tests.rb +15 -0
  59. data/lib/interscript/stdlib.rb +211 -0
  60. data/lib/interscript/utils/regexp_converter.rb +283 -0
  61. data/lib/interscript/version.rb +1 -1
  62. data/lib/interscript/visualize.rb +61 -0
  63. data/lib/interscript/visualize/group.html.erb +59 -0
  64. data/lib/interscript/visualize/json.rb +57 -0
  65. data/lib/interscript/visualize/map.html.erb +46 -0
  66. data/lib/interscript/visualize/nodes.rb +89 -0
  67. data/requirements.txt +1 -0
  68. metadata +78 -416
  69. data/README.adoc +0 -298
  70. data/lib/g2pwrapper.py +0 -34
  71. data/lib/interscript/fs.rb +0 -69
  72. data/lib/interscript/mapping.rb +0 -142
  73. data/lib/interscript/opal.rb +0 -57
  74. data/lib/interscript/opal/entrypoint.rb +0 -12
  75. data/lib/interscript/opal/map_translate.rb +0 -7
  76. data/lib/interscript/opal/maps.js.erb +0 -10
  77. data/lib/model-7 +0 -0
  78. data/lib/tha-pt-b-7 +0 -0
  79. data/maps/acadsin-zho-Hani-Latn-2002.yaml +0 -38916
  80. data/maps/alalc-amh-Ethi-Latn-1997.yaml +0 -513
  81. data/maps/alalc-amh-Ethi-Latn-2011.yaml +0 -138
  82. data/maps/alalc-ara-Arab-Latn-1997.yaml +0 -1287
  83. data/maps/alalc-asm-Deva-Latn-1997.yaml +0 -165
  84. data/maps/alalc-asm-Deva-Latn-2012.yaml +0 -40
  85. data/maps/alalc-aze-Cyrl-Latn-1997.yaml +0 -145
  86. data/maps/alalc-bel-Cyrl-Latn-1997.yaml +0 -129
  87. data/maps/alalc-ben-Beng-Latn-2017.yaml +0 -130
  88. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +0 -98
  89. data/maps/alalc-ell-Grek-Latn-1997.yaml +0 -628
  90. data/maps/alalc-ell-Grek-Latn-2010.yaml +0 -626
  91. data/maps/alalc-guj-Gujr-Latn-1997.yaml +0 -266
  92. data/maps/alalc-guj-Gujr-Latn-2011.yaml +0 -64
  93. data/maps/alalc-hin-Deva-Latn-1997.yaml +0 -211
  94. data/maps/alalc-hin-Deva-Latn-2011.yaml +0 -47
  95. data/maps/alalc-kat-Geok-Latn-1997.yaml +0 -111
  96. data/maps/alalc-kat-Geor-Latn-1997.yaml +0 -150
  97. data/maps/alalc-kor-Hang-Latn-1997.yaml +0 -98
  98. data/maps/alalc-mal-Mlym-Latn-1997.yaml +0 -303
  99. data/maps/alalc-mal-Mlym-Latn-2012.yaml +0 -73
  100. data/maps/alalc-mar-Deva-Latn-1997.yaml +0 -189
  101. data/maps/alalc-mar-Deva-Latn-2011.yaml +0 -45
  102. data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +0 -114
  103. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +0 -103
  104. data/maps/alalc-mon-Cyrl-Latn-1997.yaml +0 -220
  105. data/maps/alalc-pan-Guru-Latn-1997.yaml +0 -256
  106. data/maps/alalc-pan-Guru-Latn-2011.yaml +0 -78
  107. data/maps/alalc-per-Arab-Latn-1997.yaml +0 -375
  108. data/maps/alalc-pli-Deva-Latn-2012.yaml +0 -144
  109. data/maps/alalc-pra-Deva-Latn-2012.yaml +0 -47
  110. data/maps/alalc-rus-Cyrl-Latn-1997.yaml +0 -225
  111. data/maps/alalc-rus-Cyrl-Latn-2012.yaml +0 -162
  112. data/maps/alalc-san-Deva-Latn-2012.yaml +0 -172
  113. data/maps/alalc-sin-Sinh-Latn-1997.yaml +0 -292
  114. data/maps/alalc-sin-Sinh-Latn-2011.yaml +0 -71
  115. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +0 -118
  116. data/maps/alalc-srp-Cyrl-Latn-2013.yaml +0 -135
  117. data/maps/alalc-tam-Taml-Latn-1997.yaml +0 -62
  118. data/maps/alalc-tam-Taml-Latn-2011.yaml +0 -58
  119. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +0 -145
  120. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +0 -16
  121. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +0 -283
  122. data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +0 -174
  123. data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +0 -169
  124. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +0 -292
  125. data/maps/bgn-kor-Hang-Latn-1943.yaml +0 -35
  126. data/maps/bgn-kor-Kore-Latn-1943.yaml +0 -31
  127. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +0 -208
  128. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +0 -208
  129. data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +0 -532
  130. data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +0 -596
  131. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +0 -108
  132. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +0 -104
  133. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +0 -188
  134. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +0 -289
  135. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +0 -119
  136. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +0 -42
  137. data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +0 -184
  138. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +0 -705
  139. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +0 -23
  140. data/maps/bgnpcgn-fas-Arab-Latn-1956.yaml +0 -96
  141. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +0 -257
  142. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +0 -131
  143. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +0 -42
  144. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +0 -253
  145. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +0 -48
  146. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +0 -48
  147. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +0 -163
  148. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +0 -190
  149. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +0 -223
  150. data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +0 -230
  151. data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +0 -336
  152. data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +0 -639
  153. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +0 -459
  154. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +0 -168
  155. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +0 -318
  156. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +0 -170
  157. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +0 -220
  158. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +0 -240
  159. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +0 -166
  160. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +0 -119
  161. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +0 -127
  162. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +0 -82
  163. data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +0 -7456
  164. data/maps/bis-asm-Beng-Latn-13194-1991.yaml +0 -159
  165. data/maps/bis-ben-Beng-Latn-13194-1991.yaml +0 -156
  166. data/maps/bis-dev-Deva-Latn-13194-1991.yaml +0 -184
  167. data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +0 -181
  168. data/maps/bis-knd-Knda-Latn-13194-1991.yaml +0 -173
  169. data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +0 -176
  170. data/maps/bis-ori-Orya-Latn-13194-1991.yaml +0 -160
  171. data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +0 -175
  172. data/maps/bis-tel-Telu-Latn-13194-1991.yaml +0 -170
  173. data/maps/bis-tml-Taml-Latn-13194-1991.yaml +0 -155
  174. data/maps/by-bel-Cyrl-Latn-1998.yaml +0 -172
  175. data/maps/by-bel-Cyrl-Latn-2007.yaml +0 -115
  176. data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +0 -899
  177. data/maps/din-hin-Deva-Latn-33904-2018.yaml +0 -100
  178. data/maps/din-kat-Geor-Latn-32707-2010.yaml +0 -145
  179. data/maps/din-mar-Deva-Latn-33904-2018.yaml +0 -84
  180. data/maps/din-nep-Deva-Latn-33904-2018.yaml +0 -119
  181. data/maps/din-pli-Deva-Latn-33904-2018.yaml +0 -75
  182. data/maps/din-pra-Deva-Latn-33904-2018.yaml +0 -63
  183. data/maps/din-san-Deva-Latn-33904-2018.yaml +0 -338
  184. data/maps/din-tam-Taml-Latn-33903-2016.yaml +0 -213
  185. data/maps/dos-nep-Deva-Latn-1997.yaml +0 -47
  186. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +0 -684
  187. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +0 -680
  188. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +0 -19
  189. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +0 -31
  190. data/maps/ggg-kat-Geor-Latn-2002.yaml +0 -92
  191. data/maps/gki-bel-Cyrl-Latn-1992.yaml +0 -33
  192. data/maps/gki-bel-Cyrl-Latn-2000.yaml +0 -201
  193. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +0 -190
  194. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +0 -157
  195. data/maps/hk-yue-Hani-Latn-1888.yaml +0 -38497
  196. data/maps/icao-bel-Cyrl-Latn-9303.yaml +0 -136
  197. data/maps/icao-bul-Cyrl-Latn-9303.yaml +0 -118
  198. data/maps/icao-fas-Arab-Latn-9303.yaml +0 -103
  199. data/maps/icao-heb-Hebr-Latn-9303.yaml +0 -151
  200. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +0 -117
  201. data/maps/icao-rus-Cyrl-Latn-9303.yaml +0 -117
  202. data/maps/icao-srp-Cyrl-Latn-9303.yaml +0 -117
  203. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +0 -119
  204. data/maps/iso-ara-Arab-Latn-233-1984.yaml +0 -323
  205. data/maps/iso-asm-Beng-Latn-15919-2001.yaml +0 -75
  206. data/maps/iso-ben-Beng-Latn-15919-2001.yaml +0 -175
  207. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +0 -613
  208. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +0 -44
  209. data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +0 -220
  210. data/maps/iso-hin-Deva-Latn-15919-2001.yaml +0 -87
  211. data/maps/iso-inc-Deva-Latn-15919-2001.yaml +0 -61
  212. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +0 -66
  213. data/maps/iso-kan-Knda-Latn-15919-2001.yaml +0 -220
  214. data/maps/iso-kat-Geor-Latn-9984-1996.yaml +0 -145
  215. data/maps/iso-kor-Hang-Latn-1996-method1.yaml +0 -240
  216. data/maps/iso-kor-Hang-Latn-1996-method2.yaml +0 -226
  217. data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +0 -281
  218. data/maps/iso-mar-Deva-Latn-15919-2001.yaml +0 -75
  219. data/maps/iso-nep-Deva-Latn-15919-2001.yaml +0 -87
  220. data/maps/iso-ori-Orya-Latn-15919-2001.yaml +0 -193
  221. data/maps/iso-pan-Guru-Latn-15919-2001.yaml +0 -222
  222. data/maps/iso-pli-Beng-Latn-15919-2001.yaml +0 -73
  223. data/maps/iso-pli-Deva-Latn-15919-2001.yaml +0 -74
  224. data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +0 -219
  225. data/maps/iso-pli-Thai-Latn-15919-2001.yaml +0 -55
  226. data/maps/iso-pra-Deva-Latn-15919-2001.yaml +0 -59
  227. data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +0 -366
  228. data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +0 -271
  229. data/maps/iso-san-Deva-Latn-15919-2001.yaml +0 -220
  230. data/maps/iso-tam-Taml-Latn-15919-2001.yaml +0 -159
  231. data/maps/iso-tel-Telu-Latn-15919-2001.yaml +0 -220
  232. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +0 -109
  233. data/maps/kp-kor-Hang-Latn-2002.yaml +0 -909
  234. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +0 -44820
  235. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +0 -411
  236. data/maps/mns-mon-Cyrl-Latn-5217-2012.yaml +0 -163
  237. data/maps/mns-mon-Latn-Cyrl-5217-2012.yaml +0 -200
  238. data/maps/moct-kor-Hang-Latn-2000.yaml +0 -807
  239. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +0 -541
  240. data/maps/mvd-bel-Cyrl-Latn-2008.yaml +0 -225
  241. data/maps/mvd-bel-Cyrl-Latn-2010.yaml +0 -63
  242. data/maps/mvd-rus-Cyrl-Latn-2008.yaml +0 -109
  243. data/maps/mvd-rus-Cyrl-Latn-2010.yaml +0 -37
  244. data/maps/odni-ara-Arab-Latn-2015.yaml +0 -425
  245. data/maps/odni-aze-Cyrl-Latn-2015.yaml +0 -144
  246. data/maps/odni-bel-Cyrl-Latn-2015.yaml +0 -148
  247. data/maps/odni-bul-Cyrl-Latn-2015.yaml +0 -96
  248. data/maps/odni-che-Cyrl-Latn-2015.yaml +0 -169
  249. data/maps/odni-fas-Arab-Latn-2015.yaml +0 -406
  250. data/maps/odni-hin-Deva-Latn-2015.yaml +0 -258
  251. data/maps/odni-kat-Geor-Latn-2015.yaml +0 -87
  252. data/maps/odni-kaz-Cyrl-Latn-2015.yaml +0 -148
  253. data/maps/odni-kir-Cyrl-Latn-2015.yaml +0 -136
  254. data/maps/odni-kor-Hang-Latn-2015.yaml +0 -375
  255. data/maps/odni-mkd-Cyrl-Latn-2015.yaml +0 -122
  256. data/maps/odni-per-Arab-Latn-2015.yaml +0 -228
  257. data/maps/odni-rus-Cyrl-Latn-2015.yaml +0 -77
  258. data/maps/odni-srp-Cyrl-Latn-2015.yaml +0 -129
  259. data/maps/odni-tat-Cyrl-Latn-2015.yaml +0 -142
  260. data/maps/odni-tgk-Cyrl-Latn-2015.yaml +0 -148
  261. data/maps/odni-uig-Cyrl-Latn-2015.yaml +0 -138
  262. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +0 -157
  263. data/maps/odni-urd-Arab-Latn-2015.yaml +0 -221
  264. data/maps/odni-uzb-Cyrl-Latn-2015.yaml +0 -166
  265. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +0 -90
  266. data/maps/royin-tha-Thai-Latn-1968.yaml +0 -183
  267. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +0 -180
  268. data/maps/royin-tha-Thai-Latn-1999.yaml +0 -80
  269. data/maps/sac-zho-Hans-Latn-1979.yaml +0 -24763
  270. data/maps/sasm-mon-Mong-Latn-general-1978.yaml +0 -389
  271. data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +0 -354
  272. data/maps/ses-ara-Arab-Latn-1930.yaml +0 -283
  273. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +0 -222
  274. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +0 -197
  275. data/maps/ua-ukr-Cyrl-Latn-2007.yaml +0 -75
  276. data/maps/ua-ukr-Cyrl-Latn-2010.yaml +0 -192
  277. data/maps/un-amh-Ethi-Latn-2016.yaml +0 -602
  278. data/maps/un-ara-Arab-Latn-1971.yaml +0 -139
  279. data/maps/un-ara-Arab-Latn-1972.yaml +0 -159
  280. data/maps/un-ara-Arab-Latn-2017.yaml +0 -420
  281. data/maps/un-bel-Cyrl-Latn-2007.yaml +0 -114
  282. data/maps/un-ben-Beng-Latn-2016.yaml +0 -534
  283. data/maps/un-ell-Grek-Latn-1987-phonetic.yaml +0 -780
  284. data/maps/un-ell-Grek-Latn-1987-tl.yaml +0 -31
  285. data/maps/un-ell-Grek-Latn-1987-ts.yaml +0 -19
  286. data/maps/un-hin-Deva-Latn-2016.yaml +0 -222
  287. data/maps/un-mar-Deva-Latn-2016.yaml +0 -91
  288. data/maps/un-mon-Mong-Latn-general-2013.yaml +0 -264
  289. data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +0 -264
  290. data/maps/un-nep-Deva-Latn-1972.yaml +0 -350
  291. data/maps/un-nep-Deva-Latn-2013.yaml +0 -74
  292. data/maps/un-rus-Cyrl-Latn-1987.yaml +0 -166
  293. data/maps/un-ukr-Cyrl-Latn-1998.yaml +0 -53
  294. data/maps/un-ukr-Cyrl-Latn-2012.yaml +0 -162
  295. data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +0 -221
  296. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +0 -406
  297. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +0 -386
  298. data/maps/var-kor-Hang-Hang-jamo.yaml +0 -11193
  299. data/maps/var-kor-Hang-Latn-mr-1939.yaml +0 -1054
  300. data/maps/var-kor-Kore-Hang-2013.yaml +0 -59754
  301. data/maps/var-kor-Kore-Latn-mr-1939.yaml +0 -36
  302. data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +0 -43
  303. data/maps/var-mon-Mong-Latn-1930.yaml +0 -102
  304. data/maps/var-mon-Mong-Latn-lessing.yaml +0 -272
  305. data/maps/var-mon-Mong-Latn-vpmc.yaml +0 -274
  306. data/maps/var-pra-Deva-Latn-iast-1912.yaml +0 -30
  307. data/maps/var-san-Deva-Latn-iast-1912.yaml +0 -149
  308. data/maps/var-tha-Thai-Thai-phonemic.yaml +0 -59
  309. data/maps/var-tha-Thai-Zsym-ipa.yaml +0 -301
  310. data/maps/var-zho-Hani-Latn-wd-1979.yaml +0 -38912
  311. data/spec/interscript/filenames_spec.rb +0 -384
  312. data/spec/interscript/mapping_spec.rb +0 -42
  313. data/spec/interscript_spec.rb +0 -29
  314. data/spec/spec_helper.rb +0 -3
@@ -1,144 +0,0 @@
1
- ---
2
- authority_id: alalc
3
- id: 2012
4
- language: iso-639-2:pli
5
- source_script: Deva
6
- destination_script: Latn
7
- name: Pali Romanization, 2012
8
- url: https://www.loc.gov/catdir/cpso/romanization/pali.pdf
9
- creation_date: 2012
10
- description: |
11
- ALA-LC Romanization table for Pali
12
-
13
- notes:
14
-
15
- - Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
16
- vowels following a consonant can be found in grammars; no distinction between the two is
17
- made in transliteration.
18
-
19
- - |
20
- The vowel a is implicit after all consonants and consonant clusters and is supplied in
21
- transliteration, with the following exceptions:
22
-
23
- a) when another vowel is indicated by its appropriate sign; and
24
- b) when the absence of any vowel is indicated by the subscript sign ( ् ) called halanta or
25
- virāma.
26
-
27
- - |
28
- Exception: Niggahīta combinations representing nasals are romanized by ṅ
29
- before gutturals, ñ before palatals, ṇ before cerebrals, n before dentals, and m before
30
- labials.
31
-
32
- tests:
33
- - source: "तेन खो पन समयेन वेसालिया अविदूरे कलन्दगामो नाम अत्थि"
34
- expected: "taena khao pana samayaena vaesaālaiyaā avaidaūrae kalanadagaāmao naāma atathai"
35
- - source: "तत्थ सुदिन्‍नो नाम कलन्दपुत्तो सेट्ठिपुत्तो होति"
36
- expected: "tatatha saudainanao naāma kalanadapautatao saeṭaṭhaipautatao haotai"
37
- - source: "अथ खो सुदिन्‍नो कलन्दपुत्तो सम्बहुलेहि"
38
- expected: "atha khao saudainanao kalanadapautatao samabahaulaehai"
39
- - source: "तथा चतुर्भिः पुरुषः परीक्ष्यते त्यागेन शीलेन गुणेन कर्मणा"
40
- expected: "tathaā cataurabhaiḥ paurauṣaḥ paraīkaṣayatae tayaāgaena śaīlaena gauṇaena karamaṇaā"
41
- - source: "अथ खो सुदिन्‍नो कलन्दपुत्तो अचिरवुट्ठिताय परिसाय येन भगवा तेनुपसङ्कमि; उपसङ्कमित्वा भगवन्तं अभिवादेत्वा एकमन्तं निसीदि"
42
- expected: "atha khao saudainanao kalanadapautatao acairavauṭaṭhaitaāya paraisaāya yaena bhagavaā taenaupasaṅakamai; upasaṅakamaitavaā bhagavanataṃ abhaivaādaetavaā ekamanataṃ naisaīdai"
43
- - source: "अथ खो सुदिन्‍नस्स कलन्दपुत्तस्स मातापितरो सुदिन्‍नं कलन्दपुत्तं एतदवोचुं"
44
- expected: "atha khao saudainanasasa kalanadapautatasasa maātaāpaitarao saudainanaṃ kalanadapautataṃ etadavaocauṃ"
45
- - source: "त्वं खोसि, तात सुदिन्‍न, अम्हाकं एकपुत्तको पियो मनापो सुखेधितो सुखपरिहतो"
46
- expected: "tavaṃ khaosai, taāta saudainana, amahaākaṃ ekapautatakao paiyao manaāpao saukhaedhaitao saukhaparaihatao"
47
- - source: "न त्वं, तात सुदिन्‍न, किञ्‍चि दुक्खस्स जानासि"
48
- expected: "na tavaṃ, taāta saudainana, kaiñacai daukakhasasa jaānaāsai"
49
- - source: "अनुञ्‍ञातोम्हि किर मातापितूहि अगारस्मा अनगारियं पब्बज्‍जाया’’ति, हट्ठो उदग्गो पाणिना गत्तानि परिपुञ्छन्तो वुट्ठासि"
50
- expected: "anauñañaātaomahai kaira maātaāpaitaūhai agaārasamaā anagaāraiyaṃ pababajajaāyaā’’tai, haṭaṭhao udagagao paāṇainaā gatataānai paraipauñachanatao vauṭaṭhaāsai"
51
-
52
- map:
53
-
54
- rules:
55
- # note[3]
56
- - pattern: \u0902(?=[कखगघङ])
57
- result: ṅ
58
- - pattern: \u0902(?=[चछजझञ])
59
- result: ñ
60
- - pattern: \u0902(?=[टठडढण])
61
- result: ṇ
62
- - pattern: \u0902(?=[तथदधन])
63
- result: n
64
-
65
- characters:
66
-
67
- # I. Vowels and Diphthongs (see Note 1)
68
-
69
- 'अ': 'a'
70
- 'आ': 'ā'
71
- 'इ': 'i'
72
- 'ई': 'ī'
73
- 'उ': 'u'
74
- 'ऊ': 'ū'
75
- 'ए': 'e'
76
- 'ओ': 'o'
77
-
78
- # II. Consonants (see Note 2)
79
- # Gutturals
80
- 'क': 'ka'
81
- 'ख': 'kha'
82
- 'ग': 'ga'
83
- 'घ': 'gha'
84
- 'ङ': 'ṅa'
85
-
86
- # Palatals
87
- 'च': 'ca'
88
- 'छ': 'cha'
89
- 'ज': 'ja'
90
- 'झ': 'jha'
91
- 'ञ': 'ña'
92
-
93
- # Cerebrals
94
- 'ट': 'ṭa'
95
- 'ठ': 'ṭha'
96
- 'ड': 'ḍa'
97
- 'ढ': 'ḍha'
98
- 'ण': 'ṇa'
99
-
100
- # Dentals
101
- 'त': 'ta'
102
- 'थ': 'tha'
103
- 'द': 'da'
104
- 'ध': 'dha'
105
- 'न': 'na'
106
-
107
- # Labials
108
- 'प': 'pa'
109
- 'फ': 'pha'
110
- 'ब': 'ba'
111
- 'भ': 'bha'
112
- 'म': 'ma'
113
-
114
- # Semivowels
115
- 'य': 'ya'
116
- 'र': 'ra'
117
- 'ल': 'la'
118
- 'ळ': 'ḻa'
119
- 'व': 'va'
120
-
121
- # Sibilants
122
- 'श': 'śa'
123
- 'ष': 'ṣa'
124
- 'स': 'sa'
125
-
126
- # Aspirate
127
- 'ह': 'ha'
128
-
129
- # Visagga
130
- 'ः': 'ḥ'
131
-
132
- # Niggahīta/Anusvāra
133
- 'ं': 'ṃ'
134
-
135
- # Medials # Needed for connecting consonants
136
- 'ा': "ā"
137
- 'ि': "i"
138
- 'ी': "ī"
139
- 'ु': "u"
140
- 'ू': "ū"
141
- 'े': "e"
142
- 'ो': "o"
143
- '्': ""
144
- '‍': ''# Used for joining
@@ -1,47 +0,0 @@
1
- ---
2
- authority_id: alalc
3
- id: 2012
4
- language: iso-639-2:pra
5
- source_script: Deva
6
- destination_script: Latn
7
- name: Prakrit Romanization, 2012
8
- url: https://www.loc.gov/catdir/cpso/romanization/sanskrit.pdf
9
- creation_date: 2012
10
- description: |
11
- ALA-LC Romanization table for Prakrit
12
-
13
- notes:
14
-
15
- - Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
16
- vowels following a consonant can be found in grammars; no distinction between the two is
17
- made in transliteration.
18
-
19
- - |
20
- The vowel a is implicit after all consonants and consonant clusters and is supplied in
21
- transliteration, with the following exceptions:
22
-
23
- a) when another vowel is indicated by its appropriate sign; and
24
- b) when the absence of any vowel is indicated by the subscript sign ( ् ) called halanta or
25
- virāma.
26
-
27
- - |
28
- Exception: Anusvāra is transliterated by:
29
-
30
- a) ṅ before gutturals,
31
- b) ñ before palatals,
32
- c) ṇ before cerebrals,
33
- d) n before dentals, and
34
- e) m before labials.
35
- In other circumstances it is transliterated by a tilde (~) over the vowel.
36
-
37
- - When doubled, avagraha is transliterated by two apostrophes ( ’’ ).
38
-
39
- tests:
40
- - source: "सृष्टिस्थितिविनाशानां शक्तिभूते सनातनि"
41
- expected: "saṛṣaṭaisathaitaivainaāśaānaāṃ śakataibhaūtae sanaātanai"
42
- - source: "गुणाश्रये गुणमये नारायणि नमोऽस्तु ते"
43
- expected: "gauṇaāśarayae gauṇamayae naāraāyaṇai namao’satau tae"
44
-
45
- map:
46
-
47
- inherit: "alalc-san-Deva-Latn-2012"
@@ -1,225 +0,0 @@
1
- ---
2
- authority_id: alalc
3
- id: 1997
4
- language: iso-639-2:rus
5
- source_script: Cyrl
6
- destination_script: Latn
7
- name: ALA-LC Romanization System 1997
8
- alias:
9
- ogc11122:
10
- code: rus_Cyrl2Latn_ALA_1997
11
- description: Russian ALA-Library of Congress 1997 System
12
- url: https://en.wikipedia.org/wiki/ALA-LC_romanization_for_Russian
13
- creation_date: 1997
14
- description: |
15
- The ALA-LC Romanization tables for Slavic alphabets are a set of standards for romanization of texts
16
- in various writing systems used in North American libraries and publications.
17
- This version was published by the American Library Association and the Library of Congress in 1997.
18
- This map covers the ALA-LC method of transliteration of Russian-language text from Cyrillic script to Latin script.
19
-
20
- The formal, unambiguous version of the system requires some diacritics and two-letter tie characters which are often omitted in practice.
21
-
22
- notes:
23
- - Pre-1918 letters skipped
24
- - Pre-18th century letters skipped
25
-
26
- tests:
27
- - source: Азов
28
- expected: Azov
29
- - source: Тамбов
30
- expected: Tambov
31
- - source: Барнаул
32
- expected: Barnaul
33
- - source: Кубань
34
- expected: Kubanʹ
35
- - source: Владимир
36
- expected: Vladimir
37
- - source: Ульяновск
38
- expected: Ulʹi͡anovsk
39
- - source: Грозный
40
- expected: Groznyǐ
41
- - source: Волгодонск
42
- expected: Volgodonsk
43
- - source: Дзержинский
44
- expected: Dzerzhinskiǐ
45
- - source: Нелидово
46
- expected: Nelidovo
47
- - source: Елизово
48
- expected: Elizovo
49
- - source: Чебоксары
50
- expected: Cheboksary
51
- - source: Ёлкин
52
- expected: Ëlkin
53
- - source: Озёрный
54
- expected: Ozërnyǐ
55
- - source: Жуков
56
- expected: Zhukov
57
- - source: Лужники
58
- expected: Luzhniki
59
- - source: Звенигород
60
- expected: Zvenigorod
61
- - source: Вязьма
62
- expected: Vi͡azʹma
63
- - source: Иркутск
64
- expected: Irkutsk
65
- - source: Апатиты
66
- expected: Apatity
67
- - source: Йошкар-Ола
68
- expected: Ǐoshkar-Ola
69
- - source: Бийск
70
- expected: Biǐsk
71
- - source: Киров
72
- expected: Kirov
73
- - source: Енисейск
74
- expected: Eniseǐsk
75
- - source: Ломоносов
76
- expected: Lomonosov
77
- - source: Нелидово
78
- expected: Nelidovo
79
- - source: Менделеев
80
- expected: Mendeleev
81
- - source: Каменка
82
- expected: Kamenka
83
- - source: Новосибирск
84
- expected: Novosibirsk
85
- - source: Кандалакша
86
- expected: Kandalaksha
87
- - source: Омск
88
- expected: Omsk
89
- - source: Красноярск
90
- expected: Krasnoi͡arsk
91
- - source: Петрозаводск
92
- expected: Petrozavodsk
93
- - source: Серпухов
94
- expected: Serpukhov
95
- - source: Ростов
96
- expected: Rostov
97
- - source: Северобайкальск
98
- expected: Severobaǐkalʹsk
99
- - source: Сковородино
100
- expected: Skovorodino
101
- - source: Чайковский
102
- expected: Chaǐkovskiǐ
103
- - source: Тамбов
104
- expected: Tambov
105
- - source: Мытищи
106
- expected: Mytishchi
107
- - source: Углич
108
- expected: Uglich
109
- - source: Дудинка
110
- expected: Dudinka
111
- - source: Фурманов
112
- expected: Furmanov
113
- - source: Уфа
114
- expected: Ufa
115
- - source: Хабаровск
116
- expected: Khabarovsk
117
- - source: Прохладный
118
- expected: Prokhladnyǐ
119
- - source: Цимлянск
120
- expected: T͡Simli͡ansk
121
- - source: Ельцин
122
- expected: Elʹt͡sin
123
- - source: Чебоксары
124
- expected: Cheboksary
125
- - source: Печора
126
- expected: Pechora
127
- - source: Шахтёрск
128
- expected: Shakhtërsk
129
- - source: Мышкин
130
- expected: Myshkin
131
- - source: Щёлково
132
- expected: Shchëlkovo
133
- - source: Ртищево
134
- expected: Rtishchevo
135
- - source: Подъездной
136
- expected: Podʺezdnoǐ
137
- - source: Ыттык-Кёль
138
- expected: Yttyk-Këlʹ
139
- - source: Тында
140
- expected: Tynda
141
- - source: Тюмень
142
- expected: Ti͡umenʹ
143
- - source: Электрогорск
144
- expected: Ėlektrogorsk
145
- - source: Радиоэлектроника
146
- expected: Radioėlektronika
147
- - source: Юбилейный
148
- expected: I͡Ubileǐnyǐ
149
- - source: Ключевская
150
- expected: Kli͡uchevskai͡a
151
- - source: Якутск
152
- expected: I͡Akutsk
153
- - source: Брянск
154
- expected: Bri͡ansk
155
-
156
- map:
157
- characters:
158
- "\u0027": "" # '
159
- "\u0410": "A" # А
160
- "\u0411": "B" # Б
161
- "\u0412": "V" # В
162
- "\u0413": "G" # Г
163
- "\u0414": "D" # Д
164
- "\u0415": "E" # Е
165
- "\u0401": "Ë" # Ё
166
- "\u0416": "Zh" # Ж
167
- "\u0417": "Z" # З
168
- "\u0418": "I" # И
169
- "\u0419": "\u01CF" # Й
170
- "\u041A": "K" # К
171
- "\u041B": "L" # Л
172
- "\u041C": "M" # М
173
- "\u041D": "N" # Н
174
- "\u041E": "O" # О
175
- "\u041F": "P" # П
176
- "\u0420": "R" # Р
177
- "\u0421": "S" # С
178
- "\u0422": "T" # Т
179
- "\u0423": "U" # У
180
- "\u0424": "F" # Ф
181
- "\u0425": "Kh" # Х
182
- "\u0426": "T\u0361S" # Ц
183
- "\u0427": "Ch" # Ч
184
- "\u0428": "Sh" # Ш
185
- "\u0429": "Shch" # Щ
186
- "\u042A": "ʺ" # Ъ
187
- "\u042B": "Y" # Ы
188
- "\u042C": "ʹ" # Ь
189
- "\u042D": "E\u0307" # Э
190
- "\u042E": "I\u0361U" # Ю
191
- "\u042F": "I\u0361A" # Я
192
-
193
- "\u0430": "a" # а
194
- "\u0431": "b" # б
195
- "\u0432": "v" # в
196
- "\u0433": "g" # г
197
- "\u0434": "d" # д
198
- "\u0435": "e" # e
199
- "\u0451": "ë" # ё
200
- "\u0436": "zh" # ж
201
- "\u0437": "z" # з
202
- "\u0438": "i" # и
203
- "\u0439": "\u01d0" # й
204
- "\u043A": "k" # к
205
- "\u043B": "l" # л
206
- "\u043C": "m" # м
207
- "\u043D": "n" # н
208
- "\u043E": "o" # о
209
- "\u043F": "p" # п
210
- "\u0440": "r" # р
211
- "\u0441": "s" # с
212
- "\u0442": "t" # т
213
- "\u0443": "u" # у
214
- "\u0444": "f" # ф
215
- "\u0445": "kh" # х
216
- "\u0446": "t\u0361s" # ц
217
- "\u0447": "ch" # ч
218
- "\u0448": "sh" # ш
219
- "\u0449": "shch" # щ
220
- "\u044A": "ʺ" # ъ
221
- "\u044B": "y" # ы
222
- "\u044C": "ʹ" # ь
223
- "\u044D": "e\u0307" # э
224
- "\u044E": "i\u0361u" # ю
225
- "\u044F": "i\u0361a" # я
@@ -1,162 +0,0 @@
1
- ---
2
- authority_id: alalc
3
- id: 2012
4
- language: iso-639-2:rus
5
- source_script: Cyrl
6
- destination_script: Latn
7
- name: ALA-LC Romanization System 2012
8
- url: https://www.loc.gov/catdir/cpso/romanization/russian.pdf
9
- creation_date: 2012
10
- description: |
11
- The ALA-LC Romanization tables for Slavic alphabets are a set of standards for romanization of texts
12
- in various writing systems used in North American libraries and publications.
13
- The latest version was published by the American Library Association and the Library of Congress in 2012.
14
-
15
- notes:
16
- - The letters І, Ѣ, Ѳ and Ѵ were eliminated in the orthographic reform of 1918. For other obsolete letters appearing in Russian texts, consult the Church Slavic table.
17
-
18
- tests:
19
- - source: Азов
20
- expected: Azov
21
- - source: Тамбов
22
- expected: Tambov
23
- - source: Барнаул
24
- expected: Barnaul
25
- - source: Кубань
26
- expected: Kubanʹ
27
- - source: Владимир
28
- expected: Vladimir
29
- - source: Ульяновск
30
- expected: Ulʹi͡anovsk
31
- - source: Грозный
32
- expected: Groznyǐ
33
- - source: Волгодонск
34
- expected: Volgodonsk
35
- - source: Дзержинский
36
- expected: Dzerzhinskiǐ
37
- - source: Нелидово
38
- expected: Nelidovo
39
- - source: Елизово
40
- expected: Elizovo
41
- - source: Чебоксары
42
- expected: Cheboksary
43
- - source: Ёлкин
44
- expected: Ëlkin
45
- - source: Озёрный
46
- expected: Ozërnyǐ
47
- - source: Жуков
48
- expected: Zhukov
49
- - source: Лужники
50
- expected: Luzhniki
51
- - source: Звенигород
52
- expected: Zvenigorod
53
- - source: Вязьма
54
- expected: Vi͡azʹma
55
- - source: Иркутск
56
- expected: Irkutsk
57
- - source: Апатиты
58
- expected: Apatity
59
- - source: Йошкар-Ола
60
- expected: Ǐoshkar-Ola
61
- - source: Бийск
62
- expected: Biǐsk
63
- - source: Киров
64
- expected: Kirov
65
- - source: Енисейск
66
- expected: Eniseǐsk
67
- - source: Ломоносов
68
- expected: Lomonosov
69
- - source: Нелидово
70
- expected: Nelidovo
71
- - source: Менделеев
72
- expected: Mendeleev
73
- - source: Каменка
74
- expected: Kamenka
75
- - source: Новосибирск
76
- expected: Novosibirsk
77
- - source: Кандалакша
78
- expected: Kandalaksha
79
- - source: Омск
80
- expected: Omsk
81
- - source: Красноярск
82
- expected: Krasnoi͡arsk
83
- - source: Петрозаводск
84
- expected: Petrozavodsk
85
- - source: Серпухов
86
- expected: Serpukhov
87
- - source: Ростов
88
- expected: Rostov
89
- - source: Северобайкальск
90
- expected: Severobaǐkalʹsk
91
- - source: Сковородино
92
- expected: Skovorodino
93
- - source: Чайковский
94
- expected: Chaǐkovskiǐ
95
- - source: Тамбов
96
- expected: Tambov
97
- - source: Мытищи
98
- expected: Mytishchi
99
- - source: Углич
100
- expected: Uglich
101
- - source: Дудинка
102
- expected: Dudinka
103
- - source: Фурманов
104
- expected: Furmanov
105
- - source: Уфа
106
- expected: Ufa
107
- - source: Хабаровск
108
- expected: Khabarovsk
109
- - source: Прохладный
110
- expected: Prokhladnyǐ
111
- - source: Цимлянск
112
- expected: T͡Simli͡ansk
113
- - source: Ельцин
114
- expected: Elʹt͡sin
115
- - source: Чебоксары
116
- expected: Cheboksary
117
- - source: Печора
118
- expected: Pechora
119
- - source: Шахтёрск
120
- expected: Shakhtërsk
121
- - source: Мышкин
122
- expected: Myshkin
123
- - source: Щёлково
124
- expected: Shchëlkovo
125
- - source: Ртищево
126
- expected: Rtishchevo
127
- - source: Подъездной
128
- expected: Podʺezdnoǐ
129
- - source: Ыттык-Кёль
130
- expected: Yttyk-Këlʹ
131
- - source: Тында
132
- expected: Tynda
133
- - source: Тюмень
134
- expected: Ti͡umenʹ
135
- - source: Электрогорск
136
- expected: Ėlektrogorsk
137
- - source: Радиоэлектроника
138
- expected: Radioėlektronika
139
- - source: Юбилейный
140
- expected: I͡Ubileǐnyǐ
141
- - source: Ключевская
142
- expected: Kli͡uchevskai͡a
143
- - source: Якутск
144
- expected: I͡Akutsk
145
- - source: Брянск
146
- expected: Bri͡ansk
147
-
148
- map:
149
- inherit: alalc-rus-Cyrl-Latn-1997
150
-
151
- characters:
152
- '\u0406': "\u012A"
153
- '\u0456': "\u012B"
154
-
155
- '\u0462': "I\u0361E" # Ѣ
156
- '\u0463': "i\u0361e" # ѣ
157
-
158
- '\u0472': "F\u0307" # Ѳ
159
- '\u0473': "f\u0307" # ѳ
160
-
161
- '\u0474': "Y\u0307" # Ѵ
162
- '\u0475': "y\u0307" # ѵ