interscript 0.1.7 → 2.1.0b1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (314)
  1. checksums.yaml +4 -4
  2. data/.gitignore +11 -0
  3. data/.rspec +3 -0
  4. data/Gemfile +29 -0
  5. data/LICENSE.adoc +31 -0
  6. data/README.md +3 -0
  7. data/Rakefile +116 -0
  8. data/bin/console +14 -0
  9. data/bin/interscript +5 -0
  10. data/bin/maps_analyze_staging +168 -0
  11. data/bin/maps_debug_compilers +58 -0
  12. data/bin/maps_debug_ordering +88 -0
  13. data/bin/maps_debug_ruby_compile +24 -0
  14. data/bin/maps_debug_step_by_step +44 -0
  15. data/bin/maps_optimize_order +112 -0
  16. data/bin/maps_v1_analyze_regexps +45 -0
  17. data/bin/maps_v1_to_v2 +426 -0
  18. data/bin/setup +8 -0
  19. data/exe/interscript +6 -0
  20. data/interscript.gemspec +31 -0
  21. data/lib/interscript.rb +83 -133
  22. data/lib/interscript/command.rb +5 -5
  23. data/lib/interscript/compiler.rb +22 -0
  24. data/lib/interscript/compiler/javascript.rb +292 -0
  25. data/lib/interscript/compiler/ruby.rb +262 -0
  26. data/lib/interscript/dsl.rb +68 -0
  27. data/lib/interscript/dsl/aliases.rb +23 -0
  28. data/lib/interscript/dsl/document.rb +46 -0
  29. data/lib/interscript/dsl/group.rb +45 -0
  30. data/lib/interscript/dsl/group/parallel.rb +6 -0
  31. data/lib/interscript/dsl/items.rb +89 -0
  32. data/lib/interscript/dsl/metadata.rb +68 -0
  33. data/lib/interscript/dsl/stage.rb +6 -0
  34. data/lib/interscript/dsl/symbol_mm.rb +11 -0
  35. data/lib/interscript/dsl/tests.rb +12 -0
  36. data/lib/interscript/interpreter.rb +251 -0
  37. data/lib/interscript/node.rb +25 -0
  38. data/lib/interscript/node/alias_def.rb +15 -0
  39. data/lib/interscript/node/dependency.rb +13 -0
  40. data/lib/interscript/node/document.rb +45 -0
  41. data/lib/interscript/node/group.rb +34 -0
  42. data/lib/interscript/node/group/parallel.rb +9 -0
  43. data/lib/interscript/node/group/sequential.rb +2 -0
  44. data/lib/interscript/node/item.rb +52 -0
  45. data/lib/interscript/node/item/alias.rb +42 -0
  46. data/lib/interscript/node/item/any.rb +76 -0
  47. data/lib/interscript/node/item/capture.rb +50 -0
  48. data/lib/interscript/node/item/group.rb +51 -0
  49. data/lib/interscript/node/item/repeat.rb +40 -0
  50. data/lib/interscript/node/item/stage.rb +23 -0
  51. data/lib/interscript/node/item/string.rb +51 -0
  52. data/lib/interscript/node/metadata.rb +18 -0
  53. data/lib/interscript/node/rule.rb +6 -0
  54. data/lib/interscript/node/rule/funcall.rb +18 -0
  55. data/lib/interscript/node/rule/run.rb +15 -0
  56. data/lib/interscript/node/rule/sub.rb +68 -0
  57. data/lib/interscript/node/stage.rb +19 -0
  58. data/lib/interscript/node/tests.rb +15 -0
  59. data/lib/interscript/stdlib.rb +211 -0
  60. data/lib/interscript/utils/regexp_converter.rb +283 -0
  61. data/lib/interscript/version.rb +1 -1
  62. data/lib/interscript/visualize.rb +61 -0
  63. data/lib/interscript/visualize/group.html.erb +59 -0
  64. data/lib/interscript/visualize/json.rb +57 -0
  65. data/lib/interscript/visualize/map.html.erb +46 -0
  66. data/lib/interscript/visualize/nodes.rb +89 -0
  67. data/requirements.txt +1 -0
  68. metadata +78 -416
  69. data/README.adoc +0 -298
  70. data/lib/g2pwrapper.py +0 -34
  71. data/lib/interscript/fs.rb +0 -69
  72. data/lib/interscript/mapping.rb +0 -142
  73. data/lib/interscript/opal.rb +0 -57
  74. data/lib/interscript/opal/entrypoint.rb +0 -12
  75. data/lib/interscript/opal/map_translate.rb +0 -7
  76. data/lib/interscript/opal/maps.js.erb +0 -10
  77. data/lib/model-7 +0 -0
  78. data/lib/tha-pt-b-7 +0 -0
  79. data/maps/acadsin-zho-Hani-Latn-2002.yaml +0 -38916
  80. data/maps/alalc-amh-Ethi-Latn-1997.yaml +0 -513
  81. data/maps/alalc-amh-Ethi-Latn-2011.yaml +0 -138
  82. data/maps/alalc-ara-Arab-Latn-1997.yaml +0 -1287
  83. data/maps/alalc-asm-Deva-Latn-1997.yaml +0 -165
  84. data/maps/alalc-asm-Deva-Latn-2012.yaml +0 -40
  85. data/maps/alalc-aze-Cyrl-Latn-1997.yaml +0 -145
  86. data/maps/alalc-bel-Cyrl-Latn-1997.yaml +0 -129
  87. data/maps/alalc-ben-Beng-Latn-2017.yaml +0 -130
  88. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +0 -98
  89. data/maps/alalc-ell-Grek-Latn-1997.yaml +0 -628
  90. data/maps/alalc-ell-Grek-Latn-2010.yaml +0 -626
  91. data/maps/alalc-guj-Gujr-Latn-1997.yaml +0 -266
  92. data/maps/alalc-guj-Gujr-Latn-2011.yaml +0 -64
  93. data/maps/alalc-hin-Deva-Latn-1997.yaml +0 -211
  94. data/maps/alalc-hin-Deva-Latn-2011.yaml +0 -47
  95. data/maps/alalc-kat-Geok-Latn-1997.yaml +0 -111
  96. data/maps/alalc-kat-Geor-Latn-1997.yaml +0 -150
  97. data/maps/alalc-kor-Hang-Latn-1997.yaml +0 -98
  98. data/maps/alalc-mal-Mlym-Latn-1997.yaml +0 -303
  99. data/maps/alalc-mal-Mlym-Latn-2012.yaml +0 -73
  100. data/maps/alalc-mar-Deva-Latn-1997.yaml +0 -189
  101. data/maps/alalc-mar-Deva-Latn-2011.yaml +0 -45
  102. data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +0 -114
  103. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +0 -103
  104. data/maps/alalc-mon-Cyrl-Latn-1997.yaml +0 -220
  105. data/maps/alalc-pan-Guru-Latn-1997.yaml +0 -256
  106. data/maps/alalc-pan-Guru-Latn-2011.yaml +0 -78
  107. data/maps/alalc-per-Arab-Latn-1997.yaml +0 -375
  108. data/maps/alalc-pli-Deva-Latn-2012.yaml +0 -144
  109. data/maps/alalc-pra-Deva-Latn-2012.yaml +0 -47
  110. data/maps/alalc-rus-Cyrl-Latn-1997.yaml +0 -225
  111. data/maps/alalc-rus-Cyrl-Latn-2012.yaml +0 -162
  112. data/maps/alalc-san-Deva-Latn-2012.yaml +0 -172
  113. data/maps/alalc-sin-Sinh-Latn-1997.yaml +0 -292
  114. data/maps/alalc-sin-Sinh-Latn-2011.yaml +0 -71
  115. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +0 -118
  116. data/maps/alalc-srp-Cyrl-Latn-2013.yaml +0 -135
  117. data/maps/alalc-tam-Taml-Latn-1997.yaml +0 -62
  118. data/maps/alalc-tam-Taml-Latn-2011.yaml +0 -58
  119. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +0 -145
  120. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +0 -16
  121. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +0 -283
  122. data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +0 -174
  123. data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +0 -169
  124. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +0 -292
  125. data/maps/bgn-kor-Hang-Latn-1943.yaml +0 -35
  126. data/maps/bgn-kor-Kore-Latn-1943.yaml +0 -31
  127. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +0 -208
  128. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +0 -208
  129. data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +0 -532
  130. data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +0 -596
  131. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +0 -108
  132. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +0 -104
  133. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +0 -188
  134. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +0 -289
  135. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +0 -119
  136. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +0 -42
  137. data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +0 -184
  138. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +0 -705
  139. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +0 -23
  140. data/maps/bgnpcgn-fas-Arab-Latn-1956.yaml +0 -96
  141. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +0 -257
  142. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +0 -131
  143. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +0 -42
  144. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +0 -253
  145. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +0 -48
  146. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +0 -48
  147. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +0 -163
  148. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +0 -190
  149. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +0 -223
  150. data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +0 -230
  151. data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +0 -336
  152. data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +0 -639
  153. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +0 -459
  154. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +0 -168
  155. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +0 -318
  156. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +0 -170
  157. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +0 -220
  158. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +0 -240
  159. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +0 -166
  160. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +0 -119
  161. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +0 -127
  162. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +0 -82
  163. data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +0 -7456
  164. data/maps/bis-asm-Beng-Latn-13194-1991.yaml +0 -159
  165. data/maps/bis-ben-Beng-Latn-13194-1991.yaml +0 -156
  166. data/maps/bis-dev-Deva-Latn-13194-1991.yaml +0 -184
  167. data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +0 -181
  168. data/maps/bis-knd-Knda-Latn-13194-1991.yaml +0 -173
  169. data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +0 -176
  170. data/maps/bis-ori-Orya-Latn-13194-1991.yaml +0 -160
  171. data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +0 -175
  172. data/maps/bis-tel-Telu-Latn-13194-1991.yaml +0 -170
  173. data/maps/bis-tml-Taml-Latn-13194-1991.yaml +0 -155
  174. data/maps/by-bel-Cyrl-Latn-1998.yaml +0 -172
  175. data/maps/by-bel-Cyrl-Latn-2007.yaml +0 -115
  176. data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +0 -899
  177. data/maps/din-hin-Deva-Latn-33904-2018.yaml +0 -100
  178. data/maps/din-kat-Geor-Latn-32707-2010.yaml +0 -145
  179. data/maps/din-mar-Deva-Latn-33904-2018.yaml +0 -84
  180. data/maps/din-nep-Deva-Latn-33904-2018.yaml +0 -119
  181. data/maps/din-pli-Deva-Latn-33904-2018.yaml +0 -75
  182. data/maps/din-pra-Deva-Latn-33904-2018.yaml +0 -63
  183. data/maps/din-san-Deva-Latn-33904-2018.yaml +0 -338
  184. data/maps/din-tam-Taml-Latn-33903-2016.yaml +0 -213
  185. data/maps/dos-nep-Deva-Latn-1997.yaml +0 -47
  186. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +0 -684
  187. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +0 -680
  188. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +0 -19
  189. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +0 -31
  190. data/maps/ggg-kat-Geor-Latn-2002.yaml +0 -92
  191. data/maps/gki-bel-Cyrl-Latn-1992.yaml +0 -33
  192. data/maps/gki-bel-Cyrl-Latn-2000.yaml +0 -201
  193. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +0 -190
  194. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +0 -157
  195. data/maps/hk-yue-Hani-Latn-1888.yaml +0 -38497
  196. data/maps/icao-bel-Cyrl-Latn-9303.yaml +0 -136
  197. data/maps/icao-bul-Cyrl-Latn-9303.yaml +0 -118
  198. data/maps/icao-fas-Arab-Latn-9303.yaml +0 -103
  199. data/maps/icao-heb-Hebr-Latn-9303.yaml +0 -151
  200. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +0 -117
  201. data/maps/icao-rus-Cyrl-Latn-9303.yaml +0 -117
  202. data/maps/icao-srp-Cyrl-Latn-9303.yaml +0 -117
  203. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +0 -119
  204. data/maps/iso-ara-Arab-Latn-233-1984.yaml +0 -323
  205. data/maps/iso-asm-Beng-Latn-15919-2001.yaml +0 -75
  206. data/maps/iso-ben-Beng-Latn-15919-2001.yaml +0 -175
  207. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +0 -613
  208. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +0 -44
  209. data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +0 -220
  210. data/maps/iso-hin-Deva-Latn-15919-2001.yaml +0 -87
  211. data/maps/iso-inc-Deva-Latn-15919-2001.yaml +0 -61
  212. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +0 -66
  213. data/maps/iso-kan-Knda-Latn-15919-2001.yaml +0 -220
  214. data/maps/iso-kat-Geor-Latn-9984-1996.yaml +0 -145
  215. data/maps/iso-kor-Hang-Latn-1996-method1.yaml +0 -240
  216. data/maps/iso-kor-Hang-Latn-1996-method2.yaml +0 -226
  217. data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +0 -281
  218. data/maps/iso-mar-Deva-Latn-15919-2001.yaml +0 -75
  219. data/maps/iso-nep-Deva-Latn-15919-2001.yaml +0 -87
  220. data/maps/iso-ori-Orya-Latn-15919-2001.yaml +0 -193
  221. data/maps/iso-pan-Guru-Latn-15919-2001.yaml +0 -222
  222. data/maps/iso-pli-Beng-Latn-15919-2001.yaml +0 -73
  223. data/maps/iso-pli-Deva-Latn-15919-2001.yaml +0 -74
  224. data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +0 -219
  225. data/maps/iso-pli-Thai-Latn-15919-2001.yaml +0 -55
  226. data/maps/iso-pra-Deva-Latn-15919-2001.yaml +0 -59
  227. data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +0 -366
  228. data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +0 -271
  229. data/maps/iso-san-Deva-Latn-15919-2001.yaml +0 -220
  230. data/maps/iso-tam-Taml-Latn-15919-2001.yaml +0 -159
  231. data/maps/iso-tel-Telu-Latn-15919-2001.yaml +0 -220
  232. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +0 -109
  233. data/maps/kp-kor-Hang-Latn-2002.yaml +0 -909
  234. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +0 -44820
  235. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +0 -411
  236. data/maps/mns-mon-Cyrl-Latn-5217-2012.yaml +0 -163
  237. data/maps/mns-mon-Latn-Cyrl-5217-2012.yaml +0 -200
  238. data/maps/moct-kor-Hang-Latn-2000.yaml +0 -807
  239. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +0 -541
  240. data/maps/mvd-bel-Cyrl-Latn-2008.yaml +0 -225
  241. data/maps/mvd-bel-Cyrl-Latn-2010.yaml +0 -63
  242. data/maps/mvd-rus-Cyrl-Latn-2008.yaml +0 -109
  243. data/maps/mvd-rus-Cyrl-Latn-2010.yaml +0 -37
  244. data/maps/odni-ara-Arab-Latn-2015.yaml +0 -425
  245. data/maps/odni-aze-Cyrl-Latn-2015.yaml +0 -144
  246. data/maps/odni-bel-Cyrl-Latn-2015.yaml +0 -148
  247. data/maps/odni-bul-Cyrl-Latn-2015.yaml +0 -96
  248. data/maps/odni-che-Cyrl-Latn-2015.yaml +0 -169
  249. data/maps/odni-fas-Arab-Latn-2015.yaml +0 -406
  250. data/maps/odni-hin-Deva-Latn-2015.yaml +0 -258
  251. data/maps/odni-kat-Geor-Latn-2015.yaml +0 -87
  252. data/maps/odni-kaz-Cyrl-Latn-2015.yaml +0 -148
  253. data/maps/odni-kir-Cyrl-Latn-2015.yaml +0 -136
  254. data/maps/odni-kor-Hang-Latn-2015.yaml +0 -375
  255. data/maps/odni-mkd-Cyrl-Latn-2015.yaml +0 -122
  256. data/maps/odni-per-Arab-Latn-2015.yaml +0 -228
  257. data/maps/odni-rus-Cyrl-Latn-2015.yaml +0 -77
  258. data/maps/odni-srp-Cyrl-Latn-2015.yaml +0 -129
  259. data/maps/odni-tat-Cyrl-Latn-2015.yaml +0 -142
  260. data/maps/odni-tgk-Cyrl-Latn-2015.yaml +0 -148
  261. data/maps/odni-uig-Cyrl-Latn-2015.yaml +0 -138
  262. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +0 -157
  263. data/maps/odni-urd-Arab-Latn-2015.yaml +0 -221
  264. data/maps/odni-uzb-Cyrl-Latn-2015.yaml +0 -166
  265. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +0 -90
  266. data/maps/royin-tha-Thai-Latn-1968.yaml +0 -183
  267. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +0 -180
  268. data/maps/royin-tha-Thai-Latn-1999.yaml +0 -80
  269. data/maps/sac-zho-Hans-Latn-1979.yaml +0 -24763
  270. data/maps/sasm-mon-Mong-Latn-general-1978.yaml +0 -389
  271. data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +0 -354
  272. data/maps/ses-ara-Arab-Latn-1930.yaml +0 -283
  273. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +0 -222
  274. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +0 -197
  275. data/maps/ua-ukr-Cyrl-Latn-2007.yaml +0 -75
  276. data/maps/ua-ukr-Cyrl-Latn-2010.yaml +0 -192
  277. data/maps/un-amh-Ethi-Latn-2016.yaml +0 -602
  278. data/maps/un-ara-Arab-Latn-1971.yaml +0 -139
  279. data/maps/un-ara-Arab-Latn-1972.yaml +0 -159
  280. data/maps/un-ara-Arab-Latn-2017.yaml +0 -420
  281. data/maps/un-bel-Cyrl-Latn-2007.yaml +0 -114
  282. data/maps/un-ben-Beng-Latn-2016.yaml +0 -534
  283. data/maps/un-ell-Grek-Latn-1987-phonetic.yaml +0 -780
  284. data/maps/un-ell-Grek-Latn-1987-tl.yaml +0 -31
  285. data/maps/un-ell-Grek-Latn-1987-ts.yaml +0 -19
  286. data/maps/un-hin-Deva-Latn-2016.yaml +0 -222
  287. data/maps/un-mar-Deva-Latn-2016.yaml +0 -91
  288. data/maps/un-mon-Mong-Latn-general-2013.yaml +0 -264
  289. data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +0 -264
  290. data/maps/un-nep-Deva-Latn-1972.yaml +0 -350
  291. data/maps/un-nep-Deva-Latn-2013.yaml +0 -74
  292. data/maps/un-rus-Cyrl-Latn-1987.yaml +0 -166
  293. data/maps/un-ukr-Cyrl-Latn-1998.yaml +0 -53
  294. data/maps/un-ukr-Cyrl-Latn-2012.yaml +0 -162
  295. data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +0 -221
  296. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +0 -406
  297. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +0 -386
  298. data/maps/var-kor-Hang-Hang-jamo.yaml +0 -11193
  299. data/maps/var-kor-Hang-Latn-mr-1939.yaml +0 -1054
  300. data/maps/var-kor-Kore-Hang-2013.yaml +0 -59754
  301. data/maps/var-kor-Kore-Latn-mr-1939.yaml +0 -36
  302. data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +0 -43
  303. data/maps/var-mon-Mong-Latn-1930.yaml +0 -102
  304. data/maps/var-mon-Mong-Latn-lessing.yaml +0 -272
  305. data/maps/var-mon-Mong-Latn-vpmc.yaml +0 -274
  306. data/maps/var-pra-Deva-Latn-iast-1912.yaml +0 -30
  307. data/maps/var-san-Deva-Latn-iast-1912.yaml +0 -149
  308. data/maps/var-tha-Thai-Thai-phonemic.yaml +0 -59
  309. data/maps/var-tha-Thai-Zsym-ipa.yaml +0 -301
  310. data/maps/var-zho-Hani-Latn-wd-1979.yaml +0 -38912
  311. data/spec/interscript/filenames_spec.rb +0 -384
  312. data/spec/interscript/mapping_spec.rb +0 -42
  313. data/spec/interscript_spec.rb +0 -29
  314. data/spec/spec_helper.rb +0 -3
@@ -1,100 +0,0 @@
1
- ---
2
- authority_id: din
3
- id: 33904-2018
4
- language: iso-639-2:hin
5
- source_script: Deva
6
- destination_script: Latn
7
- name: "DIN 33904:2018-10 Information and documentation - Romanization Devanagari, Hindi"
8
- url: https://www.beuth.de/en/standard/din-33904/293049024
9
- creation_date: 2018
10
- description: |
11
- Hindi system.
12
-
13
- This standard specifies the transliteration of all languages of the Devanāgarī characters into Latin letters firmly.
14
- It is suitable for any application.
15
-
16
- notes:
17
- - |
18
- Vowels:
19
- The Ardhacandra ॅ is often used to denote English vowels:
20
- EXAMPLE
21
- बॅट bêṭa (bat)
22
- डॉक्टर ḍôkṭara (doctor)
23
- - |
24
- Consonants:
25
-
26
- Since the Devanāgarī script is a syllabic script, it becomes -a inherent in the consonant.
27
- Always written during transliteration, also in the final part
28
- EXAMPLE 1
29
- पुस्तक pustaka
30
-
31
- A line under the consonant, the so-called Virāma, means in the Devanāgarī script that that inherent -a not applicable.
32
- EXAMPLE 2
33
- वाक् vāk
34
-
35
- The anusvāra is always represented with -ṃ-.
36
- EXAMPLE 3
37
- संसकरण saṃskaraṇa
38
-
39
- Before k, kh, g, gh, c, ch, j, jh, ṭ, ṭh, ḍ, ḍh, t, th, d, dh, p, ph, b, bh, the anusvāra becomes the class nasal transformed.
40
- EXAMPLE 4
41
- तंघी kaṃghī becomes kaṅghī
42
- पंजाबी paṃjābī becomes pañjābī
43
- पंडित paṃḍita becomes paṇḍita
44
- संधी saṃdhī becomes sandhī
45
- दिसंबर disaṃbara becomes disambara
46
-
47
- Anunāsika or Candrabindu signals the nasalization of vowels
48
-
49
- EXAMPLE 5
50
- माँ māṁ
51
-
52
- tests:
53
- - source: "गंभीर मरीजों के मामले में भारत दूसरे नंबर पर"
54
- expected: "gambhīra marījoṃ ke māmale meṃ bhārata dūsare nambara para"
55
- - source: "कोरोना अपडेट्स"
56
- expected: "koronā apaḍeṭsa"
57
- - source: "सीडीसी चीफ का बयान अहम"
58
- expected: "sīḍīsī cīpha kā bayāna ahama"
59
- - source: "गूगल प्ले स्टोर पर पेटीएम की वापसी"
60
- expected: "gūgala ple sṭora para peṭīema kī vāpasī"
61
- - source: "भारत में गैंबलिंग की इजाजत नहीं"
62
- expected: "bhārata meṃ gaimbaliṅga kī ijājata nahīṃ"
63
- - source: "कोरोना वैक्सीन मुद्दे पर घिरे राष्ट्रपति; जो बाइडेन बोले- मुझे और देश को वैज्ञानिकों पर भरोसा है, डोनाल्ड ट्रम्प पर नहीं"
64
- expected: "koronā vaiksīna mudde para ghire rāṣṭrapati; jo bāiḍena bole- mujhe aura deśa ko vaijñānikoṃ para bharosā hai, ḍonālḍa ṭrampa para nahīṃ"
65
- - source: "गूगल की कार्रवाई पर पेटीएम ने कहा था कि ऐप को अस्थायी तौर पर प्ले-स्टोर से हटाया गया है, आपके पैसे सुरक्षित हैं"
66
- expected: "gūgala kī kārravāī para peṭīema ne kahā thā ki aipa ko asthāyī taura para ple-sṭora se haṭāyā gayā hai, āpake paise surakṣita haiṃ"
67
- - source: "०१९८"
68
- expected: "0198"
69
-
70
-
71
- map:
72
-
73
- inherit: din-san-Deva-Latn-33904-2018
74
-
75
- characters:
76
-
77
- 'ॲ': 'ê'
78
- 'ऑ': 'ô'
79
-
80
- # Dotted variants
81
- 'क़': 'ḵa'
82
- 'ख़': 'ḵha'
83
- 'ग़': 'g̲a' # \u0067 + \u0332
84
- 'ज़': 'j̲a' # \u006a + \u0332
85
- 'ड़': 'ṙa'
86
- 'ढ़': 'ṙha'
87
- 'फ़': 'p̲ha' # \u0070 + \u0332
88
- 'स़': 's̲a' # \u0073 + \u0332
89
- 'ह़': 'h̲a' # \u0068 + \u0332
90
-
91
- # Dotted variants Virāma
92
- 'क़्': 'ḵ'
93
- 'ख़्': 'ḵh'
94
- 'ग़्': 'g̲' # \u0067 + \u0332
95
- 'ज़्': 'j̲' # \u006a + \u0332
96
- 'ड़्': 'ṙ'
97
- 'ढ़्': 'ṙh'
98
- 'फ़्': 'p̲h' # \u0070 + \u0332
99
- 'स़्': 's̲' # \u0073 + \u0332
100
- 'ह़्': 'h̲' # \u0068 + \u0332
@@ -1,145 +0,0 @@
1
- ---
2
- authority_id: din
3
- id: 32707-2010
4
- language: iso-639-2:kat
5
- source_script: Geor
6
- destination_script: Latn
7
- name: "DIN 32707:2010-01 Information und Dokumentation - Umschrift des georgischen Alphabets"
8
- url: https://www.beuth.de/de/norm/din-32707/122821999
9
- creation_date: 2010
10
- confirmation_date: 2010
11
- description: |
12
- Information and documentation - Romanization of the Georgian alphabet.
13
-
14
- notes:
15
-
16
- tests:
17
-
18
- - source: ხაოფსე
19
- expected: xaop̕se
20
-
21
- - source: ჭლოუ
22
- expected: člou
23
-
24
- - source: ჩოხულდი
25
- expected: č̕oxuldi
26
-
27
- - source: ქვემო ლინდა
28
- expected: k̕vemo linda
29
-
30
- - source: ტამკვაჩ იგვავერა
31
- expected: tamkvač̕ igvavera
32
-
33
- - source: სვანეთი
34
- expected: svanet̕i
35
-
36
- - source: საცხვარისი
37
- expected: sac̕xvarisi
38
-
39
- - source: მუხრან-თელეთი
40
- expected: muxran-t̕elet̕i
41
-
42
- - source: მუცდი
43
- expected: muc̕di
44
-
45
- - source: ლეჩხუმი
46
- expected: leč̕xumi
47
-
48
- - source: ვერხნაია მწარა
49
- expected: verxnaia mcara
50
-
51
- - source: ეგრისის ქედი
52
- expected: egrisis k̕edi
53
-
54
- - source: დოჩარიფშა
55
- expected: doč̕arip̕ša
56
-
57
- - source: ბოლოკო
58
- expected: boloko
59
-
60
- - source: აჭანდარა
61
- expected: ačandara
62
-
63
- - source: აუალიცა
64
- expected: aualic̕a
65
-
66
- - source: აკალამრა
67
- expected: akalamra
68
-
69
- - source: ლასილი
70
- expected: lasili
71
-
72
- - source: გუბაზეული
73
- expected: gubazeuli
74
-
75
- - source: ბაყაყი
76
- expected: baqaqi
77
-
78
- - source: ძროხა
79
- expected: jroxa
80
-
81
- - source: ჰაერი
82
- expected: haeri
83
-
84
- - source: ჟოლო
85
- expected: žolo
86
-
87
- - source: ჯართი
88
- expected: ǰart̕i
89
-
90
- - source: ღრმაღელე
91
- expected: ġrmaġele
92
-
93
- map:
94
- characters:
95
- '\u10d0' : 'a' # ა
96
- '\u10d1' : 'b' # ბ
97
- '\u10d2' : 'g' # გ
98
- '\u10d3' : 'd' # დ
99
- '\u10d4' : 'e' # ე
100
- '\u10d5' : 'v' # ვ
101
- '\u10d6' : 'z' # ზ
102
-
103
- '\u10f1' : 'ê' # ჱ
104
-
105
- '\u10d7' : 't̕' # თ
106
- '\u10d8' : 'i' # ი
107
- '\u10d9' : 'k' # კ
108
- '\u10da' : 'l' # ლ
109
- '\u10db' : 'm' # მ
110
- '\u10dc' : 'n' # ნ
111
-
112
- '\u10f2' : 'y' # ჲ
113
-
114
- '\u10dd' : 'o' # ო
115
- '\u10de' : 'p' # პ
116
- '\u10df' : 'ž' # ჟ
117
- '\u10e0' : 'r' # რ
118
- '\u10e1' : 's' # ს
119
- '\u10e2' : 't' # ტ
120
-
121
- '\u10f3' : 'w' # ჳ
122
-
123
- '\u10e3' : 'u' # უ
124
- '\u10e4' : 'p̕' # ფ
125
- '\u10e5' : 'k̕' # ქ
126
- '\u10e6' : 'ġ' # ღ
127
- '\u10e7' : 'q' # ყ
128
- '\u10e8' : 'š' # შ
129
- '\u10e9' : 'č̕' # ჩ
130
- '\u10ea' : 'c̕' # ც
131
- '\u10eb' : 'j' # ძ
132
- '\u10ec' : 'c' # წ
133
- '\u10ed' : 'č' # ჭ
134
- '\u10ee' : 'x' # ხ
135
-
136
- '\u10f4' : 'q̕' # ჴ
137
-
138
- '\u10ef' : 'ǰ' # ჯ
139
- '\u10f0' : 'h' # ჰ
140
-
141
- '\u10f5' : 'ô' # ჵ
142
-
143
- '\u10f6' : 'f' # ჶ
144
- '\u10f7' : 'ẹ' # ჷ
145
- '\u10f8' : 'ʼ' # ჸ
@@ -1,84 +0,0 @@
1
- ---
2
- authority_id: din
3
- id: 33904-2018
4
- language: iso-639-2:mar
5
- source_script: Deva
6
- destination_script: Latn
7
- name: "DIN 33904:2018-10 Information and documentation - Romanization Devanagari, Marathi"
8
- url: https://www.beuth.de/en/standard/din-33904/293049024
9
- creation_date: 2018
10
- description: |
11
- Marathi system.
12
-
13
- Information und Dokumentation - Transliteration Devanagari
14
-
15
- This standard specifies the transliteration of all languages of the Devanāgarī characters into Latin letters firmly.
16
- It is suitable for any application.
17
-
18
- notes:
19
- - |
20
- Vowels:
21
- The Ardhacandra ॅ is often used to denote English vowels:
22
- EXAMPLE
23
- बॅट bêṭa (bat)
24
- डॉक्टर ḍôkṭara (doctor)
25
- - |
26
- Consonants:
27
-
28
- Since the Devanāgarī script is a syllabic script, it becomes -a inherent in the consonant.
29
- Always written during transliteration, also in the final part
30
- EXAMPLE 1
31
- पुस्तक pustaka
32
-
33
- A line under the consonant, the so-called Virāma, means in the Devanāgarī script that that inherent -a not applicable.
34
- EXAMPLE 2
35
- वाक् vāk
36
-
37
- The anusvāra is always represented with -ṃ-.
38
- EXAMPLE 3
39
- संसकरण saṃskaraṇa
40
-
41
- Before k, kh, g, gh, c, ch, j, jh, ṭ, ṭh, ḍ, ḍh, t, th, d, dh, p, ph, b, bh, the anusvāra becomes the class nasal transformed.
42
- EXAMPLE 4
43
- तंघी kaṃghī becomes kaṅghī
44
- पंजाबी paṃjābī becomes pañjābī
45
- पंडित paṃḍita becomes paṇḍita
46
- संधी saṃdhī becomes sandhī
47
- दिसंबर disaṃbara becomes disambara
48
-
49
- Anunāsika or Candrabindu signals the nasalization of vowels
50
-
51
- EXAMPLE 5
52
- माँ māṁ
53
-
54
- tests:
55
- - source: "ठाणे - जिल्ह्यात बुधवारी एक हजार रुग्णांची वाढ, तर जणांच्या मृत्यूची नोंद"
56
- expected: "ṭhāṇe - jilhyāta budhavārī eka hajāra rugṇāñcī vāḍha, tara jaṇāñcyā mṛtyūcī nonda"
57
- - source: "एकता कपूर पुन्हा अडकली वादात, वेबसीरिजमधल्या 'त्या' सीनमुळे जमावाची घरावर दगडफेक"
58
- expected: "ekatā kapūra punhā aḍakalī vādāta, vebasīrijamadhalyā 'tyā' sīnamuḷe jamāvācī gharāvara dagaḍapheka"
59
- - source: "जाणून घ्या, बीएमसीच्या अधिकाऱ्यांनी कंगना राणौतच्या ऑफिसमधले नक्की काय- काय तोडलं"
60
- expected: "jāṇūna ghyā, bīemasīcyā adhikāऱ्yānnī kaṅganā rāṇautacyā ôphisamadhale nakkī kāya- kāya toḍalaṃ"
61
- - source: "कंगना मुंबईत दाखल होण्यापूर्वी 'मातोश्री'वरून फर्मान सुटले; प्रवक्त्यांना सक्त आदेश"
62
- expected: "kaṅganā mumbaīta dākhala hoṇyāpūrvī 'mātośrī'varūna pharmāna suṭale; pravaktyānnā sakta ādeśa"
63
- - source: "मराठा आरक्षणास तात्पुरती स्थगिती; सर्वोच्च न्यायालयाचा निर्णय"
64
- expected: "marāṭhā ārakṣaṇāsa tātpuratī sthagitī; sarvocca nyāyālayācā nirṇaya"
65
- - source: "भारताच्या तिन्ही लशींचा पहिला टप्पा यशस्वी, वाचा कधी येणार बाजारात"
66
- expected: "bhāratācyā tinhī laśīñcā pahilā ṭappā yaśasvī, vācā kadhī yeṇāra bājārāta"
67
- - source: "रुग्णवाढीमुळे खाटांची चणचण"
68
- expected: "rugṇavāḍhīmuḷe khāṭāñcī caṇacaṇa"
69
- - source: "पीएम स्वनिधी कर्ज योजनेला मुंबईतून अल्प प्रतिसाद"
70
- expected: "pīema svanidhī karja yojanelā mumbaītūna alpa pratisāda"
71
- - source: "सांताक्रूझ-चेंबूर लिंक रोडवरील उन्नत मार्गाला स्थगिती"
72
- expected: "sāntākrūjha-cembūra liṅka roḍavarīla unnata mārgālā sthagitī"
73
- - source: "संपादक अर्णब गोस्वामी यांच्याविरूद्ध खडक पोलिस ठाण्यात तक्रार"
74
- expected: "sampādaka arṇaba gosvāmī yāñcyāvirūddha khaḍaka polisa ṭhāṇyāta takrāra"
75
-
76
-
77
- map:
78
-
79
- inherit: 'din-san-Deva-Latn-33904-2018'
80
-
81
- characters:
82
-
83
- 'ॲ': 'ê'
84
- 'ऑ': 'ô'
@@ -1,119 +0,0 @@
1
- ---
2
- authority_id: din
3
- id: 33904-2018
4
- language: iso-639-2:nep
5
- source_script: Deva
6
- destination_script: Latn
7
- name: "DIN 33904:2018-10 Information and documentation - Romanization Devanagari, Nepali"
8
- url: https://www.beuth.de/en/standard/din-33904/293049024
9
- creation_date: 2018
10
- description: |
11
- Nepali system.
12
-
13
- This standard specifies the transliteration of all languages of the Devanāgarī characters into Latin letters firmly.
14
- It is suitable for any application.
15
-
16
- notes:
17
- - |
18
- Vowels:
19
- The Ardhacandra ॅ is often used to denote English vowels:
20
- EXAMPLE
21
- बॅट bêṭa (bat)
22
- डॉक्टर ḍôkṭara (doctor)
23
- - |
24
- Consonants:
25
-
26
- Since the Devanāgarī script is a syllabic script, it becomes -a inherent in the consonant.
27
- Always written during transliteration, also in the final part
28
- EXAMPLE 1
29
- पुस्तक pustaka
30
-
31
- A line under the consonant, the so-called Virāma, means in the Devanāgarī script that that inherent -a not applicable.
32
- EXAMPLE 2
33
- वाक् vāk
34
-
35
- The anusvāra is always represented with -ṃ-.
36
- EXAMPLE 3
37
- संसकरण saṃskaraṇa
38
-
39
- Before k, kh, g, gh, c, ch, j, jh, ṭ, ṭh, ḍ, ḍh, t, th, d, dh, p, ph, b, bh, the anusvāra becomes the class nasal transformed.
40
- EXAMPLE 4
41
- तंघी kaṃghī becomes kaṅghī
42
- पंजाबी paṃjābī becomes pañjābī
43
- पंडित paṃḍita becomes paṇḍita
44
- संधी saṃdhī becomes sandhī
45
- दिसंबर disaṃbara becomes disambara
46
-
47
- Anunāsika or Candrabindu signals the nasalization of vowels
48
-
49
- EXAMPLE 5
50
- माँ māṁ
51
-
52
- tests:
53
- - source: "लेखन"
54
- expected: "lekhana"
55
- - source: "मुद्रा"
56
- expected: "mudrā"
57
- - source: "प्रशंसा"
58
- expected: "praśaṃsā"
59
- - source: "अंक"
60
- expected: "aṅka"
61
- - source: "नेकपाले स्थगित स्थायी कमिटीको बैठक भदौ गते बोलाउने भएको"
62
- expected: "nekapāle sthagita sthāyī kamiṭīko baiṭhaka bhadau gate bolāune bhaeko"
63
- - source: "न घर रह्यो, न परिवार"
64
- expected: "na ghara rahyo, na parivāra"
65
- - source: "ढोरपाटनमा भुजीखोला बाढीपहिरोले अभिभावक गुमाएका बालबालिकाको बिचल्ली"
66
- expected: "ḍhorapāṭanamā bhujīkholā bāḍhīpahirole abhibhāvaka gumāekā bālabālikāko bicallī"
67
- - source: "सुस्मिताका काका हेमबहादुर र काकीलाई पनि पहिरोले बगायो"
68
- expected: "susmitākā kākā hemabahādura ra kākīlāī pani pahirole bagāyo"
69
- - source: "संविधान जारी भएसँगै सार्वजनिक प्रशासनमा नयाँ उत्साह आउने अपेक्षा थियो"
70
- expected: "saṃvidhāna jārī bhaesaṁgai sārvajanika praśāsanamā nayāṁ utsāha āune apekṣā thiyo"
71
- - source: "देशमा कोरोना संक्रमित र मृतकको संख्या हरेक दिन बढ्दो छ"
72
- expected: "deśamā koronā saṅkramita ra mṛtakako saṅkhyā hareka dina baḍhdo cha"
73
- - source: "गाउँपालिकाका अध्यक्ष टिका गुरुङका अनुसार विष्णुदासलाई राजुले सुत्नका लागि बेलुका साथी लगेका थिए"
74
- expected: "gāuṁpālikākā adhyakṣa ṭikā guruṅakā anusāra viṣṇudāsalāī rājule sutnakā lāgi belukā sāthī lagekā thie"
75
- - source: "यो आयोजना गाउँपालिकाको केन्द्र तेल्लोकमा पर्छ"
76
- expected: "yo āyojanā gāuṁpālikāko kendra tellokamā parcha"
77
- - source: "सुस्मिताका काका हेमबहादुर र काकीलाई पनि पहिरोले बगायो"
78
- expected: "susmitākā kākā hemabahādura ra kākīlāī pani pahirole bagāyo"
79
- - source: "चैत पहिलो साता घर आएका उनी लकडाउन भएपछि यतै रोकिए"
80
- expected: "caita pahilo sātā ghara āekā unī lakaḍāuna bhaepachi yatai rokie"
81
- - source: "काम गर्न जानेको हकमा रोजगारदाता कम्पनीको पत्रसँगै वडा र जिल्ला प्रशासनको सिफारिस अनिवार्य गरिएको छ"
82
- expected: "kāma garna jāneko hakamā rojagāradātā kampanīko patrasaṁgai vaḍā ra jillā praśāsanako siphārisa anivārya garieko cha"
83
- - source: "दुःख"
84
- expected: "duḥkha"
85
-
86
-
87
- map:
88
-
89
- inherit: 'din-san-Deva-Latn-33904-2018'
90
-
91
- characters:
92
-
93
- 'ॲ': 'ê'
94
- 'ऑ': 'ô'
95
-
96
- # Dotted variants
97
- 'क़': 'ḵa'
98
- 'ख़': 'ḵha'
99
- 'ग़': 'g̲a' # \u0067 + \u0332
100
- 'ज़': 'j̲a' # \u006a + \u0332
101
- 'ड़': 'ṙa'
102
- 'ढ़': 'ṙha'
103
- 'फ़': 'p̲ha' # \u0070 + \u0332
104
- 'स़': 's̲a' # \u0073 + \u0332
105
- 'ह़': 'h̲a' # \u0068 + \u0332
106
- 'व़': 'v̲a' # \u0076 + \u0332
107
-
108
- # Dotted variants Virāma
109
- 'क़्': 'ḵ'
110
- 'ख़्': 'ḵh'
111
- 'ग़्': 'g̲' # \u0067 + \u0332
112
- 'ज़्': 'j̲' # \u006a + \u0332
113
- 'ड़्': 'ṙ'
114
- 'ढ़्': 'ṙh'
115
- 'फ़्': 'p̲h' # \u0070 + \u0332
116
- 'स़्': 's̲' # \u0073 + \u0332
117
- 'ह़्': 'h̲' # \u0068 + \u0332
118
-
119
-