interscript 0.1.9 → 2.0.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (352) hide show
  1. checksums.yaml +4 -4
  2. data/.gitignore +11 -0
  3. data/.rspec +3 -0
  4. data/Gemfile +29 -0
  5. data/LICENSE.adoc +31 -0
  6. data/README.md +3 -0
  7. data/Rakefile +53 -0
  8. data/bin/console +14 -0
  9. data/bin/interscript +5 -0
  10. data/bin/maps_analyze_staging +168 -0
  11. data/bin/maps_debug_compilers +58 -0
  12. data/bin/maps_debug_ordering +88 -0
  13. data/bin/maps_debug_ruby_compile +24 -0
  14. data/bin/maps_debug_step_by_step +44 -0
  15. data/bin/maps_optimize_order +112 -0
  16. data/bin/maps_v1_analyze_regexps +45 -0
  17. data/bin/maps_v1_to_v2 +426 -0
  18. data/bin/setup +8 -0
  19. data/exe/interscript +6 -0
  20. data/interscript.gemspec +31 -0
  21. data/lib/interscript.rb +80 -135
  22. data/lib/interscript/command.rb +5 -5
  23. data/lib/interscript/compiler.rb +22 -0
  24. data/lib/interscript/compiler/javascript.rb +292 -0
  25. data/lib/interscript/compiler/ruby.rb +262 -0
  26. data/lib/interscript/dsl.rb +67 -0
  27. data/lib/interscript/dsl/aliases.rb +23 -0
  28. data/lib/interscript/dsl/document.rb +46 -0
  29. data/lib/interscript/dsl/group.rb +45 -0
  30. data/lib/interscript/dsl/group/parallel.rb +6 -0
  31. data/lib/interscript/dsl/items.rb +89 -0
  32. data/lib/interscript/dsl/metadata.rb +26 -0
  33. data/lib/interscript/dsl/stage.rb +6 -0
  34. data/lib/interscript/dsl/symbol_mm.rb +11 -0
  35. data/lib/interscript/dsl/tests.rb +12 -0
  36. data/lib/interscript/interpreter.rb +251 -0
  37. data/lib/interscript/node.rb +25 -0
  38. data/lib/interscript/node/alias_def.rb +15 -0
  39. data/lib/interscript/node/dependency.rb +13 -0
  40. data/lib/interscript/node/document.rb +45 -0
  41. data/lib/interscript/node/group.rb +34 -0
  42. data/lib/interscript/node/group/parallel.rb +9 -0
  43. data/lib/interscript/node/group/sequential.rb +2 -0
  44. data/lib/interscript/node/item.rb +52 -0
  45. data/lib/interscript/node/item/alias.rb +42 -0
  46. data/lib/interscript/node/item/any.rb +61 -0
  47. data/lib/interscript/node/item/capture.rb +50 -0
  48. data/lib/interscript/node/item/group.rb +51 -0
  49. data/lib/interscript/node/item/repeat.rb +40 -0
  50. data/lib/interscript/node/item/stage.rb +23 -0
  51. data/lib/interscript/node/item/string.rb +51 -0
  52. data/lib/interscript/node/metadata.rb +18 -0
  53. data/lib/interscript/node/rule.rb +6 -0
  54. data/lib/interscript/node/rule/funcall.rb +18 -0
  55. data/lib/interscript/node/rule/run.rb +15 -0
  56. data/lib/interscript/node/rule/sub.rb +65 -0
  57. data/lib/interscript/node/stage.rb +19 -0
  58. data/lib/interscript/node/tests.rb +15 -0
  59. data/lib/interscript/stdlib.rb +211 -0
  60. data/lib/interscript/utils/regexp_converter.rb +283 -0
  61. data/lib/interscript/version.rb +1 -1
  62. data/requirements.txt +1 -0
  63. metadata +73 -458
  64. data/README.adoc +0 -296
  65. data/aliases.json +0 -1
  66. data/lib/g2pwrapper.py +0 -34
  67. data/lib/interscript/fs.rb +0 -96
  68. data/lib/interscript/mapping.rb +0 -144
  69. data/lib/interscript/opal.rb +0 -196
  70. data/lib/interscript/opal/entrypoint.rb +0 -20
  71. data/lib/interscript/opal/exports.rb +0 -11
  72. data/lib/interscript/opal/maps.js.erb +0 -8
  73. data/lib/model-7 +0 -0
  74. data/lib/tha-pt-b-7 +0 -0
  75. data/maps/acadsin-zho-Hani-Latn-2002.yaml +0 -38916
  76. data/maps/alalc-amh-Ethi-Latn-1997.yaml +0 -513
  77. data/maps/alalc-amh-Ethi-Latn-2011.yaml +0 -138
  78. data/maps/alalc-ara-Arab-Latn-1997.yaml +0 -1287
  79. data/maps/alalc-asm-Deva-Latn-1997.yaml +0 -259
  80. data/maps/alalc-asm-Deva-Latn-2012.yaml +0 -55
  81. data/maps/alalc-aze-Arab-Latn-1997.yaml +0 -376
  82. data/maps/alalc-aze-Cyrl-Latn-1997.yaml +0 -145
  83. data/maps/alalc-bel-Cyrl-Latn-1997.yaml +0 -129
  84. data/maps/alalc-ben-Beng-Latn-1997.yaml +0 -291
  85. data/maps/alalc-ben-Beng-Latn-2017.yaml +0 -130
  86. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +0 -98
  87. data/maps/alalc-div-Thaa-Latn-1997.yaml +0 -211
  88. data/maps/alalc-ell-Grek-Latn-1997.yaml +0 -628
  89. data/maps/alalc-ell-Grek-Latn-2010.yaml +0 -626
  90. data/maps/alalc-guj-Gujr-Latn-1997.yaml +0 -266
  91. data/maps/alalc-guj-Gujr-Latn-2011.yaml +0 -64
  92. data/maps/alalc-hin-Deva-Latn-1997.yaml +0 -303
  93. data/maps/alalc-hin-Deva-Latn-2011.yaml +0 -65
  94. data/maps/alalc-kan-Kana-Latn-1997.yaml +0 -274
  95. data/maps/alalc-kan-Kana-Latn-2011.yaml +0 -63
  96. data/maps/alalc-kat-Geok-Latn-1997.yaml +0 -111
  97. data/maps/alalc-kat-Geor-Latn-1997.yaml +0 -150
  98. data/maps/alalc-kor-Hang-Latn-1997.yaml +0 -98
  99. data/maps/alalc-mal-Mlym-Latn-1997.yaml +0 -303
  100. data/maps/alalc-mal-Mlym-Latn-2012.yaml +0 -73
  101. data/maps/alalc-mar-Deva-Latn-1997.yaml +0 -189
  102. data/maps/alalc-mar-Deva-Latn-2011.yaml +0 -45
  103. data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +0 -114
  104. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +0 -103
  105. data/maps/alalc-mon-Cyrl-Latn-1997.yaml +0 -220
  106. data/maps/alalc-ori-Orya-Latn-1997.yaml +0 -284
  107. data/maps/alalc-ori-Orya-Latn-2011.yaml +0 -67
  108. data/maps/alalc-pan-Guru-Latn-1997.yaml +0 -256
  109. data/maps/alalc-pan-Guru-Latn-2011.yaml +0 -78
  110. data/maps/alalc-per-Arab-Latn-1997.yaml +0 -375
  111. data/maps/alalc-pli-Deva-Latn-2012.yaml +0 -144
  112. data/maps/alalc-pra-Deva-Latn-2012.yaml +0 -47
  113. data/maps/alalc-rus-Cyrl-Latn-1997.yaml +0 -225
  114. data/maps/alalc-rus-Cyrl-Latn-2012.yaml +0 -162
  115. data/maps/alalc-san-Deva-Latn-2012.yaml +0 -241
  116. data/maps/alalc-sin-Sinh-Latn-1997.yaml +0 -292
  117. data/maps/alalc-sin-Sinh-Latn-2011.yaml +0 -71
  118. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +0 -118
  119. data/maps/alalc-srp-Cyrl-Latn-2013.yaml +0 -135
  120. data/maps/alalc-tam-Taml-Latn-1997.yaml +0 -62
  121. data/maps/alalc-tam-Taml-Latn-2011.yaml +0 -58
  122. data/maps/alalc-tel-Telu-Latn-1997.yaml +0 -284
  123. data/maps/alalc-tel-Telu-Latn-2011.yaml +0 -64
  124. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +0 -145
  125. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +0 -16
  126. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +0 -283
  127. data/maps/az-aze-Cyrl-Latn-1939.yaml +0 -105
  128. data/maps/az-aze-Cyrl-Latn-1958.yaml +0 -45
  129. data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +0 -174
  130. data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +0 -169
  131. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +0 -292
  132. data/maps/bgn-kor-Hang-Latn-1943.yaml +0 -35
  133. data/maps/bgn-kor-Kore-Latn-1943.yaml +0 -31
  134. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +0 -208
  135. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +0 -208
  136. data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +0 -532
  137. data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +0 -598
  138. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +0 -108
  139. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +0 -111
  140. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +0 -188
  141. data/maps/bgnpcgn-bal-Arab-Latn-2008.yaml +0 -329
  142. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +0 -289
  143. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +0 -119
  144. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +0 -42
  145. data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +0 -184
  146. data/maps/bgnpcgn-div-Thaa-Latn-1988.yaml +0 -75
  147. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +0 -705
  148. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +0 -23
  149. data/maps/bgnpcgn-far-Latn-Latn-1964.yaml +0 -28
  150. data/maps/bgnpcgn-fas-Arab-Latn-1956.yaml +0 -96
  151. data/maps/bgnpcgn-isl-Latn-Latn-1964.yaml +0 -37
  152. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +0 -257
  153. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +0 -131
  154. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +0 -42
  155. data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.yaml +0 -247
  156. data/maps/bgnpcgn-kir-Cyrl-Latn-1979.yaml +0 -218
  157. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +0 -253
  158. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +0 -48
  159. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +0 -48
  160. data/maps/bgnpcgn-kur-Arab-Latn-2007.yaml +0 -249
  161. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +0 -163
  162. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +0 -190
  163. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +0 -223
  164. data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +0 -230
  165. data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +0 -338
  166. data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +0 -673
  167. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +0 -459
  168. data/maps/bgnpcgn-pus-Arab-Latn-1968.yaml +0 -377
  169. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +0 -168
  170. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +0 -318
  171. data/maps/bgnpcgn-srp-Cyrl-Latn-1962.yaml +0 -73
  172. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +0 -170
  173. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +0 -220
  174. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +0 -240
  175. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +0 -166
  176. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +0 -119
  177. data/maps/bgnpcgn-urd-Arab-Latn-2007.yaml +0 -459
  178. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +0 -127
  179. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +0 -82
  180. data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +0 -7456
  181. data/maps/bis-asm-Beng-Latn-13194-1991.yaml +0 -159
  182. data/maps/bis-ben-Beng-Latn-13194-1991.yaml +0 -156
  183. data/maps/bis-dev-Deva-Latn-13194-1991.yaml +0 -184
  184. data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +0 -181
  185. data/maps/bis-kan-Kana-Latn-13194-1991.yaml +0 -173
  186. data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +0 -176
  187. data/maps/bis-ori-Orya-Latn-13194-1991.yaml +0 -175
  188. data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +0 -175
  189. data/maps/bis-tel-Telu-Latn-13194-1991.yaml +0 -170
  190. data/maps/bis-tml-Taml-Latn-13194-1991.yaml +0 -155
  191. data/maps/by-bel-Cyrl-Latn-1998.yaml +0 -172
  192. data/maps/by-bel-Cyrl-Latn-2007.yaml +0 -115
  193. data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +0 -899
  194. data/maps/din-hin-Deva-Latn-33904-2018.yaml +0 -100
  195. data/maps/din-kat-Geor-Latn-32707-2010.yaml +0 -145
  196. data/maps/din-mar-Deva-Latn-33904-2018.yaml +0 -84
  197. data/maps/din-nep-Deva-Latn-33904-2018.yaml +0 -119
  198. data/maps/din-pli-Deva-Latn-33904-2018.yaml +0 -75
  199. data/maps/din-pra-Deva-Latn-33904-2018.yaml +0 -63
  200. data/maps/din-san-Deva-Latn-33904-2018.yaml +0 -338
  201. data/maps/din-tam-Taml-Latn-33903-2016.yaml +0 -213
  202. data/maps/dos-nep-Deva-Latn-1997.yaml +0 -47
  203. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +0 -684
  204. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +0 -680
  205. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +0 -19
  206. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +0 -31
  207. data/maps/ggg-kat-Geor-Latn-2002.yaml +0 -92
  208. data/maps/gki-bel-Cyrl-Latn-1992.yaml +0 -33
  209. data/maps/gki-bel-Cyrl-Latn-2000.yaml +0 -201
  210. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +0 -190
  211. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +0 -157
  212. data/maps/hk-yue-Hani-Latn-1888.yaml +0 -38497
  213. data/maps/icao-bel-Cyrl-Latn-9303.yaml +0 -136
  214. data/maps/icao-bul-Cyrl-Latn-9303.yaml +0 -118
  215. data/maps/icao-fas-Arab-Latn-9303.yaml +0 -103
  216. data/maps/icao-heb-Hebr-Latn-9303.yaml +0 -151
  217. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +0 -117
  218. data/maps/icao-rus-Cyrl-Latn-9303.yaml +0 -117
  219. data/maps/icao-srp-Cyrl-Latn-9303.yaml +0 -117
  220. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +0 -119
  221. data/maps/iso-ara-Arab-Latn-233-1984.yaml +0 -323
  222. data/maps/iso-asm-Beng-Latn-15919-2001.yaml +0 -75
  223. data/maps/iso-ben-Beng-Latn-15919-2001.yaml +0 -175
  224. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +0 -613
  225. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +0 -44
  226. data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +0 -220
  227. data/maps/iso-hin-Deva-Latn-15919-2001.yaml +0 -87
  228. data/maps/iso-inc-Deva-Latn-15919-2001.yaml +0 -61
  229. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +0 -66
  230. data/maps/iso-kan-Kana-Latn-15919-2001.yaml +0 -220
  231. data/maps/iso-kat-Geor-Latn-9984-1996.yaml +0 -145
  232. data/maps/iso-kor-Hang-Latn-1996-method1.yaml +0 -240
  233. data/maps/iso-kor-Hang-Latn-1996-method2.yaml +0 -226
  234. data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +0 -281
  235. data/maps/iso-mar-Deva-Latn-15919-2001.yaml +0 -75
  236. data/maps/iso-nep-Deva-Latn-15919-2001.yaml +0 -87
  237. data/maps/iso-ori-Orya-Latn-15919-2001.yaml +0 -193
  238. data/maps/iso-pan-Guru-Latn-15919-2001.yaml +0 -222
  239. data/maps/iso-pli-Beng-Latn-15919-2001.yaml +0 -73
  240. data/maps/iso-pli-Deva-Latn-15919-2001.yaml +0 -74
  241. data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +0 -219
  242. data/maps/iso-pli-Thai-Latn-15919-2001.yaml +0 -55
  243. data/maps/iso-pra-Deva-Latn-15919-2001.yaml +0 -59
  244. data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +0 -366
  245. data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +0 -271
  246. data/maps/iso-san-Deva-Latn-15919-2001.yaml +0 -220
  247. data/maps/iso-tam-Taml-Latn-15919-2001.yaml +0 -159
  248. data/maps/iso-tel-Telu-Latn-15919-2001.yaml +0 -220
  249. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +0 -109
  250. data/maps/kp-kor-Hang-Latn-2002.yaml +0 -909
  251. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +0 -44820
  252. data/maps/masm-mon-Cyrl-Latn-5217-2012.yaml +0 -163
  253. data/maps/masm-mon-Latn-Cyrl-5217-2012.yaml +0 -200
  254. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +0 -411
  255. data/maps/moct-kor-Hang-Latn-2000.yaml +0 -807
  256. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +0 -541
  257. data/maps/mv-div-Thaa-Latn-1987.yaml +0 -200
  258. data/maps/mvd-bel-Cyrl-Latn-2008.yaml +0 -225
  259. data/maps/mvd-bel-Cyrl-Latn-2010.yaml +0 -63
  260. data/maps/mvd-rus-Cyrl-Latn-2008.yaml +0 -109
  261. data/maps/mvd-rus-Cyrl-Latn-2010.yaml +0 -37
  262. data/maps/odni-ara-Arab-Latn-2004.yaml +0 -137
  263. data/maps/odni-ara-Arab-Latn-2015.yaml +0 -315
  264. data/maps/odni-aze-Cyrl-Latn-2015.yaml +0 -144
  265. data/maps/odni-bel-Cyrl-Latn-2015.yaml +0 -148
  266. data/maps/odni-bul-Cyrl-Latn-2005.yaml +0 -90
  267. data/maps/odni-bul-Cyrl-Latn-2015.yaml +0 -96
  268. data/maps/odni-che-Cyrl-Latn-2015.yaml +0 -169
  269. data/maps/odni-fas-Arab-Latn-2004.yaml +0 -276
  270. data/maps/odni-fas-Arab-Latn-2015.yaml +0 -406
  271. data/maps/odni-hin-Deva-Latn-2004.yaml +0 -182
  272. data/maps/odni-hin-Deva-Latn-2015.yaml +0 -258
  273. data/maps/odni-kat-Geor-Latn-2015.yaml +0 -87
  274. data/maps/odni-kaz-Cyrl-Latn-2015.yaml +0 -148
  275. data/maps/odni-kir-Cyrl-Latn-2015.yaml +0 -136
  276. data/maps/odni-kor-Hang-Latn-2015.yaml +0 -375
  277. data/maps/odni-mkd-Cyrl-Latn-2005.yaml +0 -21
  278. data/maps/odni-mkd-Cyrl-Latn-2015.yaml +0 -122
  279. data/maps/odni-prs-Arab-Latn-2004.yaml +0 -123
  280. data/maps/odni-prs-Arab-Latn-2015.yaml +0 -228
  281. data/maps/odni-rus-Cyrl-Latn-2015.yaml +0 -77
  282. data/maps/odni-srp-Cyrl-Latn-2005.yaml +0 -36
  283. data/maps/odni-srp-Cyrl-Latn-2015.yaml +0 -129
  284. data/maps/odni-tat-Cyrl-Latn-2015.yaml +0 -142
  285. data/maps/odni-tgk-Cyrl-Latn-2015.yaml +0 -148
  286. data/maps/odni-tuk-Cyrl-Latn-2015.yaml +0 -170
  287. data/maps/odni-uig-Cyrl-Latn-2015.yaml +0 -138
  288. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +0 -161
  289. data/maps/odni-urd-Arab-Latn-2015.yaml +0 -221
  290. data/maps/odni-uzb-Cyrl-Latn-2015.yaml +0 -166
  291. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +0 -90
  292. data/maps/royin-tha-Thai-Latn-1968.yaml +0 -183
  293. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +0 -180
  294. data/maps/royin-tha-Thai-Latn-1999.yaml +0 -80
  295. data/maps/sac-zho-Hans-Latn-1979.yaml +0 -24763
  296. data/maps/sasm-mon-Mong-Latn-general-1978.yaml +0 -389
  297. data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +0 -354
  298. data/maps/ses-ara-Arab-Latn-1930.yaml +0 -283
  299. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +0 -222
  300. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +0 -197
  301. data/maps/ua-ukr-Cyrl-Latn-2007.yaml +0 -75
  302. data/maps/ua-ukr-Cyrl-Latn-2010.yaml +0 -192
  303. data/maps/un-amh-Ethi-Latn-2016.yaml +0 -602
  304. data/maps/un-ara-Arab-Latn-1971.yaml +0 -139
  305. data/maps/un-ara-Arab-Latn-1972.yaml +0 -159
  306. data/maps/un-ara-Arab-Latn-2017.yaml +0 -420
  307. data/maps/un-asm-Beng-Latn-1972.yaml +0 -223
  308. data/maps/un-bel-Cyrl-Latn-2007.yaml +0 -114
  309. data/maps/un-ben-Beng-Latn-2016.yaml +0 -534
  310. data/maps/un-ell-Grek-Latn-1987-phonetic.yaml +0 -780
  311. data/maps/un-ell-Grek-Latn-1987-tl.yaml +0 -31
  312. data/maps/un-ell-Grek-Latn-1987-ts.yaml +0 -19
  313. data/maps/un-guj-Gujr-Latn-1972.yaml +0 -229
  314. data/maps/un-hin-Deva-Latn-2016.yaml +0 -316
  315. data/maps/un-kan-Kana-Latn-2016.yaml +0 -254
  316. data/maps/un-mal-Mlym-Latn-1972.yaml +0 -251
  317. data/maps/un-mar-Deva-Latn-2016.yaml +0 -102
  318. data/maps/un-mon-Mong-Latn-general-2013.yaml +0 -264
  319. data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +0 -264
  320. data/maps/un-nep-Deva-Latn-1972.yaml +0 -269
  321. data/maps/un-nep-Deva-Latn-2013.yaml +0 -74
  322. data/maps/un-ori-Orya-Latn-1972.yaml +0 -247
  323. data/maps/un-pan-Guru-Latn-1972.yaml +0 -402
  324. data/maps/un-prs-Arab-Latn-1967.yaml +0 -236
  325. data/maps/un-rus-Cyrl-Latn-1987.yaml +0 -166
  326. data/maps/un-tam-Taml-Latn-1972.yaml +0 -194
  327. data/maps/un-tel-Telu-Latn-1972.yaml +0 -270
  328. data/maps/un-ukr-Cyrl-Latn-1998.yaml +0 -53
  329. data/maps/un-ukr-Cyrl-Latn-2012.yaml +0 -162
  330. data/maps/un-urd-Arab-Latn-1972.yaml +0 -405
  331. data/maps/var-amh-Ethi-Latn-eae-2003.yaml +0 -466
  332. data/maps/var-gez-Ethi-Latn-eae-2003.yaml +0 -76
  333. data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +0 -221
  334. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +0 -406
  335. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +0 -386
  336. data/maps/var-kor-Hang-Hang-jamo.yaml +0 -11193
  337. data/maps/var-kor-Hang-Latn-mr-1939.yaml +0 -1054
  338. data/maps/var-kor-Kore-Hang-2013.yaml +0 -59754
  339. data/maps/var-kor-Kore-Latn-mr-1939.yaml +0 -36
  340. data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +0 -43
  341. data/maps/var-mon-Mong-Latn-1930.yaml +0 -102
  342. data/maps/var-mon-Mong-Latn-lessing.yaml +0 -272
  343. data/maps/var-mon-Mong-Latn-vpmc.yaml +0 -274
  344. data/maps/var-pra-Deva-Latn-iast-1912.yaml +0 -30
  345. data/maps/var-san-Deva-Latn-iast-1912.yaml +0 -149
  346. data/maps/var-tha-Thai-Thai-phonemic.yaml +0 -59
  347. data/maps/var-tha-Thai-Zsym-ipa.yaml +0 -301
  348. data/maps/var-zho-Hani-Latn-wd-1979.yaml +0 -38912
  349. data/spec/interscript/filenames_spec.rb +0 -21
  350. data/spec/interscript/mapping_spec.rb +0 -42
  351. data/spec/interscript_spec.rb +0 -37
  352. data/spec/spec_helper.rb +0 -3
@@ -1,71 +0,0 @@
1
- ---
2
- authority_id: alalc
3
- id: 2011
4
- language: iso-639-2:sin
5
- source_script: Sinh
6
- destination_script: Latn
7
- name: Sinhalese Romanization, 2011
8
- alias:
9
- ogc11122:
10
- code: sin_Sinh2Latn_ALA_2011
11
- description: Sinhalese ALA-Library of Congress 2011 System
12
- url: https://www.loc.gov/catdir/cpso/romanization/sinhales.pdf
13
- creation_date: 2011
14
- description: |
15
- ALA-LC Romanization table for Sinhalese
16
-
17
-
18
- notes:
19
-
20
- - Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
21
- vowels following a consonant can be found in grammars; no distinction between the two is
22
- made in transliteration.
23
-
24
- - |
25
- The vowel a is implicit after all consonants and consonant clusters and is supplied in
26
- transliteration, with the following exceptions:
27
-
28
- a) when another vowel is indicated by its appropriate sign; and
29
- b) when the absence of any vowel is indicated by the sign ් called virāma.
30
-
31
- - |
32
- Exceptions: Anusvāra is transliterated by:
33
-
34
- a) ṅ before gutturals,
35
- b) ñ before palatals,
36
- c) ṇ before cerebrals,
37
- d) n before dentals, and
38
- e) m before labials.
39
-
40
- - |
41
- Exceptions:
42
- a) when saññaka represents a nasal, it is romanized according to the rule for anusvāra.
43
- b) when saññaka is combined with an aspirated consonant, the combination is romanized as a non-aspirated, followed by an aspirated consonant.
44
-
45
-
46
- tests:
47
- - source: "හිටපු අග්‍රාමාත්‍ය රනිල් වික්‍රමසිංහ අප්‍රේල් 21 ප්‍රහාරය සම්බන්ධයෙන් විමර්ශනය කරන ජනාධිපති පරීක්ෂණ කොමිසම හමුවේ දෙවෙනි දිනටත් සාක්ෂි ලබාදීමට පැමිණෙයි"
48
- expected: "hiṭapu agrāmātya ranil vikramasiṃha aprēl 21 prahāraya sambanandhayen vimarśanaya karana janādhipati parīkṣaṇa komisama hamuvē deveni dinaṭat sākṣi labādīmaṭa pămiṇeyi"
49
- - source: "පෑලියගොඩ මත්ස්‍ය තොග වෙළෙදපොළට පිවිසෙන පිවිසුම් මාර්ගය පුළුල් කර සංවර්ධනයට පියවර - මහාමාර්ග අමාත්‍ය ජොන්ස්ටන් ප්‍රනාන්දු"
50
- expected: "pâliyagoḍa matsya toga veḷedapoḷaṭa pivisena pivisum māraṅgaya puḷul kara saṃvarandhanayaṭa piyavara - mahāmāraṅga amātya jonsaṇṭan pranānandu"
51
- - source: "මව්බිමටත් රට වැසියන්ටත් ආශිර්වාද කරමින් වි⁣ශේෂ ආගමික වැඩසටහන් මාලාවක්"
52
- expected: "mavbimaṭat raṭa văsiyanaṇṭat āśirvāda karamin vi⁣śēṣa āgamika văḍasaṭahan mālāvak"
53
- - source: "මිනුවන්ගොඩ කොරෝනා පොකුරින් තවත් ආසාදිතයින් 49 දෙනකු හඳුනා ගෙන"
54
- expected: "minuvanaṅgoḍa korōnā pokurin tavat āsāditayin 49 denaku handunā gena"
55
- - source: "ඉරණවිල වෙරළේ නාඳුනන ධීවර යාත‍්‍රා දෙකක්"
56
- expected: "iraṇavila veraḷē nāndunana dhīvara yātarā dekak"
57
- - source: "මඩකලපුව මංගලාරාමේ හාමුදුරුවන්ට මරණ තර්ජන - ආරක්ෂාවත් අඩුකරලා"
58
- expected: "maḍakalapuva maṃgalārāmē hāmuduruvanaṇṭa maraṇa tarañjana - ārakṣāvat aḍukaralā"
59
- - source: "හොරට කහ කුඩු හැදූ දෙදෙනෙක් බඩුත් එක්ක දැලේ"
60
- expected: "horaṭa kaha kuḍu hădū dedenek baḍut ekaṅka dălē"
61
- - source: "ඉංගිරියේ ජලභීතිකාව වැළඳුනු නරියෙකු තෙදිනක මෙහෙයුමකින් අල්ලා ගනී"
62
- expected: "iṃgiriyē jalabhītikāva văḷandunu nariyeku tedinaka meheyumakin allā ganī"
63
- - source: "බෞද්ධ දර්ශනයට අනුව අපි උපයන ධනය බුද්ධිමත් ලෙස විසර්ජනය කරන්නේ කෙසේ ද?"
64
- expected: "baudandha darśanayaṭa anuva api upayana dhanaya budandhimat lesa visarañjanaya karanannē kesē da?"
65
- - source: "ඉන්දීය ජාතිකයන් සමග එක්වන මන්නාරමේ ධීවරයන්ට අනතුරු අගවයි"
66
- expected: "inandīya jātikayan samaga ekvana manannāramē dhīvarayanaṇṭa anaturu agavayi"
67
- - source: "තේ නැවත වගාවට පෙර පස පුනරුත්ථාපනයට කෙටි මග"
68
- expected: "tē năvata vagāvaṭa pera pasa punarutanthāpanayaṭa keṭi maga"
69
-
70
- map:
71
- inherit: 'alalc-sin-Sinh-Latn-1997'
@@ -1,118 +0,0 @@
1
- ---
2
- authority_id: alalc
3
- id: 1997
4
- language: iso-639-2:srp
5
- source_script: Cyrl
6
- destination_script: Latn
7
- name: Serbian and Macedonian Romanization, ALA-LC 1997 System
8
- alias:
9
- ogc11122:
10
- code: srp_Cyrl2Latn_ALA_1997
11
- description: Serbian and Macedonian ALA-Library of Congress 1997 System
12
- url: http://catdir.loc.gov/catdir/cpso/romanization/serbian.pdf
13
- creation_date: 1997
14
- description: ALA-LC Romanization table for Serbian and Macedonian.
15
-
16
- notes:
17
- - Special characters in romanization
18
- Đ - D with crossbar (upper case). USMARC hexadecimal code A3.
19
- đ - d with crossbar (lower case). USMARC hexadecimal code B3.
20
-
21
- - Character modifiers in romanization
22
- ´ - acute. USMARC hexadecimal code E2.
23
- ˇ - hachek. USMARC hexadecimal code E9.
24
-
25
- tests:
26
- - source: Општина Ердут
27
- expected: Opština Erdut
28
- - source: Општина Двор
29
- expected: Opština Dvor
30
- - source: ЛУЃЕ луѓе
31
- expected: LUǴE luǵe
32
- - source: ЅВЕЗДА ѕвезда Ѕвезда
33
- expected: DZVEZDA dzvezda Dzvezda
34
- - source: ЌАРУВАЊЕ ќарување
35
- expected: ḰARUVANJE ḱaruvanje
36
-
37
- map:
38
- postrules:
39
- # DZ
40
- - pattern: "((?<=[[:upper:]])Dz(?=[[:upper:]])?|(?<=[[:upper:]])?Dz(?=[[:upper:]]))"
41
- result: "DZ"
42
- #LJ
43
- - pattern: "((?<=[[:upper:]])Lj(?=[[:upper:]])?|(?<=[[:upper:]])?Lj(?=[[:upper:]]))"
44
- result: "LJ"
45
- #NJ
46
- - pattern: "((?<=[[:upper:]])Nj(?=[[:upper:]])?|(?<=[[:upper:]])?Nj(?=[[:upper:]]))"
47
- result: "NJ"
48
- #DŽ
49
- - pattern: "((?<=[[:upper:]])Dž(?=[[:upper:]])?|(?<=[[:upper:]])?Dž(?=[[:upper:]]))"
50
- result: "DŽ"
51
-
52
- characters:
53
- "\u0410": "A"
54
- "\u0411": "B"
55
- "\u0412": "V"
56
- "\u0413": "G"
57
- "\u0403": "\u01F4" # Ǵ
58
- "\u0414": "D"
59
- "\u0402": "\u0110" # Đ
60
- "\u0415": "E"
61
- "\u0416": "\u005a\u030c" # Ž
62
- "\u0417": "Z"
63
- "\u0405": "Dz"
64
- "\u0418": "I"
65
- "\u0408": "J"
66
- "\u041A": "K"
67
- "\u040C": "\u1E30" # Ḱ
68
- "\u041B": "L"
69
- "\u0409": "Lj"
70
- "\u041C": "M"
71
- "\u041D": "N"
72
- "\u040A": "Nj"
73
- "\u041E": "O"
74
- "\u041F": "P"
75
- "\u0420": "R"
76
- "\u0421": "S"
77
- "\u0422": "T"
78
- "\u040B": "\u0043\u0301" # Ć
79
- "\u0423": "U"
80
- "\u0424": "F"
81
- "\u0425": "H"
82
- "\u0426": "C"
83
- "\u0427": "\u0043\u030c" # Č
84
- "\u040F": "D\u007a\u030c" # Dž
85
- "\u0428": "\u0053\u030c" # Š
86
- "\u0430": "a"
87
- "\u0431": "b"
88
- "\u0432": "v"
89
- "\u0433": "g"
90
- "\u0453": "\u01F5" # ǵ
91
- "\u0434": "d"
92
- "\u0452": "\u0111" # đ
93
- "\u0435": "e"
94
- "\u0436": "\u007a\u030c" # ž
95
- "\u0437": "z"
96
- "\u0455": "dz"
97
- "\u0438": "i"
98
- "\u0458": "j"
99
- "\u043A": "k"
100
- "\u045C": "\u1E31" # ḱ
101
- "\u043B": "l"
102
- "\u0459": "lj"
103
- "\u043C": "m"
104
- "\u043D": "n"
105
- "\u045A": "nj"
106
- "\u043E": "o"
107
- "\u043F": "p"
108
- "\u0440": "r"
109
- "\u0441": "s"
110
- "\u0442": "t"
111
- "\u045B": "\u0063\u0301" # ć
112
- "\u0443": "u"
113
- "\u0444": "f"
114
- "\u0445": "h"
115
- "\u0446": "c"
116
- "\u0447": "\u0063\u030c" # č
117
- "\u045F": "d\u007a\u030c" # dž
118
- "\u0448": "\u0073\u030c" # š
@@ -1,135 +0,0 @@
1
- ---
2
- authority_id: alalc
3
- id: 2013
4
- language: iso-639-2:srp
5
- source_script: Cyrl
6
- destination_script: Latn
7
- name: ROMANIZATION OF SERBIAN, ALA-LC 2013 System
8
- url: https://www.loc.gov/catdir/cpso/romanization/serbian.pdf
9
- creation_date: 2013
10
- description: |
11
- Serbian uses the Cyrillic and Roman alphabets. When the Roman alphabet is used it is the same as Croatian.
12
-
13
- tests:
14
- - source: Шупља Стена
15
- expected: Šuplja Stena
16
- - source: Чукарица
17
- expected: Čukarica
18
- - source: Црна Трава
19
- expected: Crna Trava
20
- - source: Херцег Нови
21
- expected: Herceg Novi
22
- - source: Улцињ
23
- expected: Ulcinj
24
- - source: Ужице
25
- expected: Užice
26
- - source: Тресаначка Река
27
- expected: Tresanačka Reka
28
- - source: Сјеница
29
- expected: Sjenica
30
- - source: Рожаје
31
- expected: Rožaje
32
- - source: Пљевља
33
- expected: Pljevlja
34
- - source: Оџаци
35
- expected: Odžaci
36
- - source: Никшић
37
- expected: Nikšić
38
- - source: Медвеђа
39
- expected: Medveđa
40
- - source: Лозница
41
- expected: Loznica
42
- - source: Књажевац
43
- expected: Knjaževac
44
- - source: Зрењанин
45
- expected: Zrenjanin
46
- - source: Житорађа
47
- expected: Žitorađa
48
- - source: Ервеник
49
- expected: Ervenik
50
- - source: Доње Љупче
51
- expected: Donje Ljupče
52
- - source: Гусиње
53
- expected: Gusinje
54
- - source: ГУСИЊЕ
55
- expected: GUSINJE
56
- - source: Врњачка Бања
57
- expected: Vrnjačka Banja
58
- - source: Бијело Поље
59
- expected: Bijelo Polje
60
- - source: Алибунар
61
- expected: Alibunar
62
-
63
- map:
64
- postrules:
65
- #LJ
66
- - pattern: "((?<=[[:upper:]])Lj(?=[[:upper:]])?|(?<=[[:upper:]])?Lj(?=[[:upper:]]))"
67
- result: "LJ"
68
- #NJ
69
- - pattern: "((?<=[[:upper:]])Nj(?=[[:upper:]])?|(?<=[[:upper:]])?Nj(?=[[:upper:]]))"
70
- result: "NJ"
71
- #DŽ
72
- - pattern: "((?<=[[:upper:]])Dž(?=[[:upper:]])?|(?<=[[:upper:]])?Dž(?=[[:upper:]]))"
73
- result: "DŽ"
74
-
75
- characters:
76
- "\u0410": "A"
77
- "\u0411": "B"
78
- "\u0412": "V"
79
- "\u0413": "G"
80
- "\u0414": "D"
81
- "\u0402": "\u0110" # Đ
82
- "\u0415": "E"
83
- "\u0416": "\u005a\u030c" # Ž
84
- "\u0417": "Z"
85
- "\u0418": "I"
86
- "\u0408": "J"
87
- "\u041A": "K"
88
- "\u041B": "L"
89
- "\u0409": "Lj"
90
- "\u041C": "M"
91
- "\u041D": "N"
92
- "\u040A": "Nj"
93
- "\u041E": "O"
94
- "\u041F": "P"
95
- "\u0420": "R"
96
- "\u0421": "S"
97
- "\u0422": "T"
98
- "\u040B": "\u0043\u0301" # Ć
99
- "\u0423": "U"
100
- "\u0424": "F"
101
- "\u0425": "H"
102
- "\u0426": "C"
103
- "\u0427": "\u0043\u030c" # Č
104
- "\u040F": "D\u007a\u030c" # Dž
105
- "\u0428": "\u0053\u030c" # Š
106
- "\u0430": "a"
107
- "\u0431": "b"
108
- "\u0432": "v"
109
- "\u0433": "g"
110
- "\u0434": "d"
111
- "\u0452": "\u0111" # đ
112
- "\u0435": "e"
113
- "\u0436": "\u007a\u030c" # ž
114
- "\u0437": "z"
115
- "\u0438": "i"
116
- "\u0458": "j"
117
- "\u043A": "k"
118
- "\u043B": "l"
119
- "\u0459": "lj"
120
- "\u043C": "m"
121
- "\u043D": "n"
122
- "\u045A": "nj"
123
- "\u043E": "o"
124
- "\u043F": "p"
125
- "\u0440": "r"
126
- "\u0441": "s"
127
- "\u0442": "t"
128
- "\u045B": "\u0063\u0301" # ć
129
- "\u0443": "u"
130
- "\u0444": "f"
131
- "\u0445": "h"
132
- "\u0446": "c"
133
- "\u0447": "\u0063\u030c" # č
134
- "\u045F": "d\u007a\u030c" # dž
135
- "\u0448": "\u0073\u030c" # š
@@ -1,62 +0,0 @@
1
- ---
2
- authority_id: alalc
3
- id: 1997
4
- language: iso-639-2:tam
5
- source_script: Taml
6
- destination_script: Latn
7
- name: Tamil Romanization, 1997
8
- alias:
9
- ogc11122:
10
- code: tam_Taml2Latn_ALA_1997
11
- description: Tamil ALA-Library of Congress 1997 System
12
- url: http://catdir.loc.gov/catdir/cpso/romanization/tamil.pdf
13
- creation_date: 1997
14
- description: |
15
- ALA-LC Romanization table for Tamil
16
-
17
- notes:
18
-
19
- - Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
20
- vowels following a consonant can be found in grammars; no distinction between the two is
21
- made in transliteration.
22
-
23
- - |
24
- The vowel a is implicit after all consonants and consonant clusters and is supplied in
25
- transliteration, with the following exceptions:
26
-
27
- a) when another vowel is indicated by its appropriate sign; and
28
- b) when the absence of any vowel is indicated by the superscript dot ( ் ) called puḷḷi.
29
-
30
- - This letter has the same form as the vowel sign for ā appearing after a consonant. Where ambiguity arises, it is written.
31
-
32
- tests:
33
- - source: "அழிந்து போன நகரத்தில் , தொலைந்து போன நான்"
34
- expected: "aḻintu pōṉa nakarattil , tolaintu pōṉa nāṉ"
35
- - source: "முதன் முதலாக - மை ஃபர்ஸ்ட் சோலோ ட்ராவல்"
36
- expected: "mutaṉ mutalāka - mai ḵaparsṭ cōlō ṭrāval"
37
- - source: "வாழ்க்கையில் அவன் போன முதல் சோலோ டிரிப் அது தான்."
38
- expected: "vāḻkkaiyil avaṉ pōṉa mutal cōlō ṭirip atu tāṉ."
39
- - source: "ஸ்கூல் ப்ரெண்ட் கார்த்திக் வீட்டுக்கு போய்ட்டு"
40
- expected: "skūl preṇṭ kārttik vīṭṭukku pōyṭṭu"
41
- - source: "நாசா வெளியிட்ட வெடிக்கும் நட்சத்திரத்தின் வீடியோ"
42
- expected: "nācā veḷiyiṭṭa veṭikkum naṭcattirattiṉ vīṭiyō"
43
- - source: "நாசா வெளியிட்ட வெடிக்கும் நட்சத்திரத்தின் வீடியோ"
44
- expected: "nācā veḷiyiṭṭa veṭikkum naṭcattirattiṉ vīṭiyō"
45
- - source: "டார்பிடோவை ஏவ உதவும் சூப்பர்சானிக் ஏவுகணையான ஸ்மார்ட் சோதனை வெற்றி"
46
- expected: "ṭārpiṭōvai ēva utavum cūpparcāṉik ēvukaṇaiyāṉa smārṭ cōtaṉai veṟṟi"
47
- - source: "இந்த ஆண்டு மருத்துவத்துக்கான நோபல் பரிசு பெறுபவர்களின் பெயர்கள் அறிவிப்பு"
48
- expected: "inta āṇṭu maruttuvattukkāṉa nōpal paricu peṟupavarkaḷiṉ peyarkaḷ aṟivippu"
49
- - source: "மல்லையா விவகாரம்: பிரிட்டன் அரசின் நடவடிக்கைகள் தங்களுக்கு தெரியவில்லை - மத்திய அரசு தகவல்"
50
- expected: "mallaiyā vivakāram: piriṭṭaṉ araciṉ naṭavaṭikkaikaḷ taṅkaḷukku teriyavillai - mattiya aracu takaval"
51
- - source: "ஆலோசனைக்குப் பிறகு தேனியில் இருந்து சென்னை புறப்பட்டார் துணை முதலமைச்சர் பன்னீர்செல்வம்"
52
- expected: "ālōcaṉaikkup piṟaku tēṉiyil iruntu ceṉṉai puṟappaṭṭār tuṇai mutalamaiccar paṉṉīrcelvam"
53
- - source: "இன்று தான் பேரன் பிறந்தநாள் முடிந்து ஃப்ரீ ஆகி இருக்கிறேன்"
54
- expected: "iṉṟu tāṉ pēraṉ piṟantanāḷ muṭintu ḵaprī āki irukkiṟēṉ"
55
-
56
- map:
57
-
58
- inherit: 'din-tam-Taml-Latn-33903-2016'
59
-
60
- characters:
61
-
62
- 'ஃ': 'ḵa'
@@ -1,58 +0,0 @@
1
- ---
2
- authority_id: alalc
3
- id: 2011
4
- language: iso-639-2:tam
5
- source_script: Taml
6
- destination_script: Latn
7
- name: Tamil Romanization, 2011
8
- alias:
9
- ogc11122:
10
- code: tam_Taml2Latn_ALA_2011
11
- description: Tamil ALA-Library of Congress 2011 System
12
- url: https://www.loc.gov/catdir/cpso/romanization/tamil.pdf
13
- creation_date: 2011
14
- description: |
15
- ALA-LC Romanization table for Tamil
16
-
17
- notes:
18
-
19
- - Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
20
- vowels following a consonant can be found in grammars; no distinction between the two is
21
- made in transliteration.
22
-
23
- - |
24
- The vowel a is implicit after all consonants and consonant clusters and is supplied in
25
- transliteration, with the following exceptions:
26
-
27
- a) when another vowel is indicated by its appropriate sign; and
28
- b) when the absence of any vowel is indicated by the superscript dot ( ் ) called puḷḷi.
29
-
30
- - This letter has the same form as the vowel sign for ā appearing after a consonant. Where ambiguity arises, it is written.
31
-
32
- tests:
33
- - source: "மலையாள நடிகர் சங்கத்திலிருந்து நடிகை பார்வதி திடீர் விலகல்."
34
- expected: "malaiyāḷa naṭikar caṅkattiliruntu naṭikai pārvati tiṭīr vilakal."
35
- - source: "சச்சின் டெண்டுல்கரை அலுவலக உதவியாளராக நியமிப்பீர்களா?"
36
- expected: "cacciṉ ṭeṇṭulkarai aluvalaka utaviyāḷarāka niyamippīrkaḷā?"
37
- - source: "அமீரகத்தில் தொலைநோக்கி இல்லாமல் நாளை பார்க்கலாம்"
38
- expected: "amīrakattil tolainōkki illāmal nāḷai pārkkalām"
39
- - source: "லடாக் யூனியன் பிரதேசம் இந்தியா சட்டவிரோதமாக நிறுவிய ஒரு பகுதி- சீனா மீண்டும் பிடிவாதம்"
40
- expected: "laṭāk yūṉiyaṉ piratēcam intiyā caṭṭavirōtamāka niṟuviya oru pakuti- cīṉā mīṇṭum piṭivātam"
41
- - source: "பாலியல் குற்றங்களில் ஈடுபடுவோருக்கு மரண தண்டனை புதிய சட்டம்"
42
- expected: "pāliyal kuṟṟaṅkaḷil īṭupaṭuvōrukku maraṇa taṇṭaṉai putiya caṭṭam"
43
- - source: "புதுடெல்லி"
44
- expected: "putuṭelli"
45
- - source: "அப்படி விளம்பரத்தில என்ன இருக்கு...?"
46
- expected: "appaṭi viḷamparattila eṉṉa irukku...?"
47
- - source: "பூமிக்கும், செவ்வாய் கிரகத்துக்கும் இடையிலான அதிகபட்ச தூரம் ௪௦ கோடியே ௧௩ லட்சம் கி.மீ தொலைவு ஆகும்."
48
- expected: "pūmikkum, cevvāy kirakattukkum iṭaiyilāṉa atikapaṭca tūram 40 kōṭiyē 13 laṭcam ki.mī tolaivu ākum."
49
- - source: "அமீரகத்தில் செவ்வாய் கிரகம் குறித்த ஆய்வில் ஈடுபடுவோர் மற்றும் வானியல் நிபுணர்களுக்கு இது ஒரு நல்ல வாய்ப்பாக அமையும்."
50
- expected: "amīrakattil cevvāy kirakam kuṟitta āyvil īṭupaṭuvōr maṟṟum vāṉiyal nipuṇarkaḷukku itu oru nalla vāyppāka amaiyum."
51
- - source: "நள்ளிரவு நேரமாக இருந்தால் நமது தலைக்கு மேலே காணலாம். காலை நேரத்தில் மேற்கு மற்றும் தென்மேற்கு திசையில் செவ்வாய் கிரகத்தை பார்க்கலாம்."
52
- expected: "naḷḷiravu nēramāka iruntāl namatu talaikku mēlē kāṇalām. kālai nērattil mēṟku maṟṟum teṉmēṟku ticaiyil cevvāy kirakattai pārkkalām."
53
- - source: "வெறும் கண்ணால் பார்க்கும்போது புள்ளியாக ஆரஞ்சு நிறத்தில் பிரகாசமாக தெரியும்."
54
- expected: "veṟum kaṇṇāl pārkkumpōtu puḷḷiyāka ārañcu niṟattil pirakācamāka teriyum."
55
-
56
- map:
57
-
58
- inherit: 'alalc-tam-Taml-Latn-1997'