interscript 0.1.9 → 2.0.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (352) hide show
  1. checksums.yaml +4 -4
  2. data/.gitignore +11 -0
  3. data/.rspec +3 -0
  4. data/Gemfile +29 -0
  5. data/LICENSE.adoc +31 -0
  6. data/README.md +3 -0
  7. data/Rakefile +53 -0
  8. data/bin/console +14 -0
  9. data/bin/interscript +5 -0
  10. data/bin/maps_analyze_staging +168 -0
  11. data/bin/maps_debug_compilers +58 -0
  12. data/bin/maps_debug_ordering +88 -0
  13. data/bin/maps_debug_ruby_compile +24 -0
  14. data/bin/maps_debug_step_by_step +44 -0
  15. data/bin/maps_optimize_order +112 -0
  16. data/bin/maps_v1_analyze_regexps +45 -0
  17. data/bin/maps_v1_to_v2 +426 -0
  18. data/bin/setup +8 -0
  19. data/exe/interscript +6 -0
  20. data/interscript.gemspec +31 -0
  21. data/lib/interscript.rb +80 -135
  22. data/lib/interscript/command.rb +5 -5
  23. data/lib/interscript/compiler.rb +22 -0
  24. data/lib/interscript/compiler/javascript.rb +292 -0
  25. data/lib/interscript/compiler/ruby.rb +262 -0
  26. data/lib/interscript/dsl.rb +67 -0
  27. data/lib/interscript/dsl/aliases.rb +23 -0
  28. data/lib/interscript/dsl/document.rb +46 -0
  29. data/lib/interscript/dsl/group.rb +45 -0
  30. data/lib/interscript/dsl/group/parallel.rb +6 -0
  31. data/lib/interscript/dsl/items.rb +89 -0
  32. data/lib/interscript/dsl/metadata.rb +26 -0
  33. data/lib/interscript/dsl/stage.rb +6 -0
  34. data/lib/interscript/dsl/symbol_mm.rb +11 -0
  35. data/lib/interscript/dsl/tests.rb +12 -0
  36. data/lib/interscript/interpreter.rb +251 -0
  37. data/lib/interscript/node.rb +25 -0
  38. data/lib/interscript/node/alias_def.rb +15 -0
  39. data/lib/interscript/node/dependency.rb +13 -0
  40. data/lib/interscript/node/document.rb +45 -0
  41. data/lib/interscript/node/group.rb +34 -0
  42. data/lib/interscript/node/group/parallel.rb +9 -0
  43. data/lib/interscript/node/group/sequential.rb +2 -0
  44. data/lib/interscript/node/item.rb +52 -0
  45. data/lib/interscript/node/item/alias.rb +42 -0
  46. data/lib/interscript/node/item/any.rb +61 -0
  47. data/lib/interscript/node/item/capture.rb +50 -0
  48. data/lib/interscript/node/item/group.rb +51 -0
  49. data/lib/interscript/node/item/repeat.rb +40 -0
  50. data/lib/interscript/node/item/stage.rb +23 -0
  51. data/lib/interscript/node/item/string.rb +51 -0
  52. data/lib/interscript/node/metadata.rb +18 -0
  53. data/lib/interscript/node/rule.rb +6 -0
  54. data/lib/interscript/node/rule/funcall.rb +18 -0
  55. data/lib/interscript/node/rule/run.rb +15 -0
  56. data/lib/interscript/node/rule/sub.rb +65 -0
  57. data/lib/interscript/node/stage.rb +19 -0
  58. data/lib/interscript/node/tests.rb +15 -0
  59. data/lib/interscript/stdlib.rb +211 -0
  60. data/lib/interscript/utils/regexp_converter.rb +283 -0
  61. data/lib/interscript/version.rb +1 -1
  62. data/requirements.txt +1 -0
  63. metadata +73 -458
  64. data/README.adoc +0 -296
  65. data/aliases.json +0 -1
  66. data/lib/g2pwrapper.py +0 -34
  67. data/lib/interscript/fs.rb +0 -96
  68. data/lib/interscript/mapping.rb +0 -144
  69. data/lib/interscript/opal.rb +0 -196
  70. data/lib/interscript/opal/entrypoint.rb +0 -20
  71. data/lib/interscript/opal/exports.rb +0 -11
  72. data/lib/interscript/opal/maps.js.erb +0 -8
  73. data/lib/model-7 +0 -0
  74. data/lib/tha-pt-b-7 +0 -0
  75. data/maps/acadsin-zho-Hani-Latn-2002.yaml +0 -38916
  76. data/maps/alalc-amh-Ethi-Latn-1997.yaml +0 -513
  77. data/maps/alalc-amh-Ethi-Latn-2011.yaml +0 -138
  78. data/maps/alalc-ara-Arab-Latn-1997.yaml +0 -1287
  79. data/maps/alalc-asm-Deva-Latn-1997.yaml +0 -259
  80. data/maps/alalc-asm-Deva-Latn-2012.yaml +0 -55
  81. data/maps/alalc-aze-Arab-Latn-1997.yaml +0 -376
  82. data/maps/alalc-aze-Cyrl-Latn-1997.yaml +0 -145
  83. data/maps/alalc-bel-Cyrl-Latn-1997.yaml +0 -129
  84. data/maps/alalc-ben-Beng-Latn-1997.yaml +0 -291
  85. data/maps/alalc-ben-Beng-Latn-2017.yaml +0 -130
  86. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +0 -98
  87. data/maps/alalc-div-Thaa-Latn-1997.yaml +0 -211
  88. data/maps/alalc-ell-Grek-Latn-1997.yaml +0 -628
  89. data/maps/alalc-ell-Grek-Latn-2010.yaml +0 -626
  90. data/maps/alalc-guj-Gujr-Latn-1997.yaml +0 -266
  91. data/maps/alalc-guj-Gujr-Latn-2011.yaml +0 -64
  92. data/maps/alalc-hin-Deva-Latn-1997.yaml +0 -303
  93. data/maps/alalc-hin-Deva-Latn-2011.yaml +0 -65
  94. data/maps/alalc-kan-Kana-Latn-1997.yaml +0 -274
  95. data/maps/alalc-kan-Kana-Latn-2011.yaml +0 -63
  96. data/maps/alalc-kat-Geok-Latn-1997.yaml +0 -111
  97. data/maps/alalc-kat-Geor-Latn-1997.yaml +0 -150
  98. data/maps/alalc-kor-Hang-Latn-1997.yaml +0 -98
  99. data/maps/alalc-mal-Mlym-Latn-1997.yaml +0 -303
  100. data/maps/alalc-mal-Mlym-Latn-2012.yaml +0 -73
  101. data/maps/alalc-mar-Deva-Latn-1997.yaml +0 -189
  102. data/maps/alalc-mar-Deva-Latn-2011.yaml +0 -45
  103. data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +0 -114
  104. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +0 -103
  105. data/maps/alalc-mon-Cyrl-Latn-1997.yaml +0 -220
  106. data/maps/alalc-ori-Orya-Latn-1997.yaml +0 -284
  107. data/maps/alalc-ori-Orya-Latn-2011.yaml +0 -67
  108. data/maps/alalc-pan-Guru-Latn-1997.yaml +0 -256
  109. data/maps/alalc-pan-Guru-Latn-2011.yaml +0 -78
  110. data/maps/alalc-per-Arab-Latn-1997.yaml +0 -375
  111. data/maps/alalc-pli-Deva-Latn-2012.yaml +0 -144
  112. data/maps/alalc-pra-Deva-Latn-2012.yaml +0 -47
  113. data/maps/alalc-rus-Cyrl-Latn-1997.yaml +0 -225
  114. data/maps/alalc-rus-Cyrl-Latn-2012.yaml +0 -162
  115. data/maps/alalc-san-Deva-Latn-2012.yaml +0 -241
  116. data/maps/alalc-sin-Sinh-Latn-1997.yaml +0 -292
  117. data/maps/alalc-sin-Sinh-Latn-2011.yaml +0 -71
  118. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +0 -118
  119. data/maps/alalc-srp-Cyrl-Latn-2013.yaml +0 -135
  120. data/maps/alalc-tam-Taml-Latn-1997.yaml +0 -62
  121. data/maps/alalc-tam-Taml-Latn-2011.yaml +0 -58
  122. data/maps/alalc-tel-Telu-Latn-1997.yaml +0 -284
  123. data/maps/alalc-tel-Telu-Latn-2011.yaml +0 -64
  124. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +0 -145
  125. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +0 -16
  126. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +0 -283
  127. data/maps/az-aze-Cyrl-Latn-1939.yaml +0 -105
  128. data/maps/az-aze-Cyrl-Latn-1958.yaml +0 -45
  129. data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +0 -174
  130. data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +0 -169
  131. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +0 -292
  132. data/maps/bgn-kor-Hang-Latn-1943.yaml +0 -35
  133. data/maps/bgn-kor-Kore-Latn-1943.yaml +0 -31
  134. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +0 -208
  135. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +0 -208
  136. data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +0 -532
  137. data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +0 -598
  138. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +0 -108
  139. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +0 -111
  140. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +0 -188
  141. data/maps/bgnpcgn-bal-Arab-Latn-2008.yaml +0 -329
  142. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +0 -289
  143. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +0 -119
  144. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +0 -42
  145. data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +0 -184
  146. data/maps/bgnpcgn-div-Thaa-Latn-1988.yaml +0 -75
  147. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +0 -705
  148. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +0 -23
  149. data/maps/bgnpcgn-far-Latn-Latn-1964.yaml +0 -28
  150. data/maps/bgnpcgn-fas-Arab-Latn-1956.yaml +0 -96
  151. data/maps/bgnpcgn-isl-Latn-Latn-1964.yaml +0 -37
  152. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +0 -257
  153. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +0 -131
  154. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +0 -42
  155. data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.yaml +0 -247
  156. data/maps/bgnpcgn-kir-Cyrl-Latn-1979.yaml +0 -218
  157. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +0 -253
  158. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +0 -48
  159. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +0 -48
  160. data/maps/bgnpcgn-kur-Arab-Latn-2007.yaml +0 -249
  161. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +0 -163
  162. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +0 -190
  163. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +0 -223
  164. data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +0 -230
  165. data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +0 -338
  166. data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +0 -673
  167. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +0 -459
  168. data/maps/bgnpcgn-pus-Arab-Latn-1968.yaml +0 -377
  169. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +0 -168
  170. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +0 -318
  171. data/maps/bgnpcgn-srp-Cyrl-Latn-1962.yaml +0 -73
  172. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +0 -170
  173. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +0 -220
  174. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +0 -240
  175. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +0 -166
  176. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +0 -119
  177. data/maps/bgnpcgn-urd-Arab-Latn-2007.yaml +0 -459
  178. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +0 -127
  179. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +0 -82
  180. data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +0 -7456
  181. data/maps/bis-asm-Beng-Latn-13194-1991.yaml +0 -159
  182. data/maps/bis-ben-Beng-Latn-13194-1991.yaml +0 -156
  183. data/maps/bis-dev-Deva-Latn-13194-1991.yaml +0 -184
  184. data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +0 -181
  185. data/maps/bis-kan-Kana-Latn-13194-1991.yaml +0 -173
  186. data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +0 -176
  187. data/maps/bis-ori-Orya-Latn-13194-1991.yaml +0 -175
  188. data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +0 -175
  189. data/maps/bis-tel-Telu-Latn-13194-1991.yaml +0 -170
  190. data/maps/bis-tml-Taml-Latn-13194-1991.yaml +0 -155
  191. data/maps/by-bel-Cyrl-Latn-1998.yaml +0 -172
  192. data/maps/by-bel-Cyrl-Latn-2007.yaml +0 -115
  193. data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +0 -899
  194. data/maps/din-hin-Deva-Latn-33904-2018.yaml +0 -100
  195. data/maps/din-kat-Geor-Latn-32707-2010.yaml +0 -145
  196. data/maps/din-mar-Deva-Latn-33904-2018.yaml +0 -84
  197. data/maps/din-nep-Deva-Latn-33904-2018.yaml +0 -119
  198. data/maps/din-pli-Deva-Latn-33904-2018.yaml +0 -75
  199. data/maps/din-pra-Deva-Latn-33904-2018.yaml +0 -63
  200. data/maps/din-san-Deva-Latn-33904-2018.yaml +0 -338
  201. data/maps/din-tam-Taml-Latn-33903-2016.yaml +0 -213
  202. data/maps/dos-nep-Deva-Latn-1997.yaml +0 -47
  203. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +0 -684
  204. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +0 -680
  205. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +0 -19
  206. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +0 -31
  207. data/maps/ggg-kat-Geor-Latn-2002.yaml +0 -92
  208. data/maps/gki-bel-Cyrl-Latn-1992.yaml +0 -33
  209. data/maps/gki-bel-Cyrl-Latn-2000.yaml +0 -201
  210. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +0 -190
  211. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +0 -157
  212. data/maps/hk-yue-Hani-Latn-1888.yaml +0 -38497
  213. data/maps/icao-bel-Cyrl-Latn-9303.yaml +0 -136
  214. data/maps/icao-bul-Cyrl-Latn-9303.yaml +0 -118
  215. data/maps/icao-fas-Arab-Latn-9303.yaml +0 -103
  216. data/maps/icao-heb-Hebr-Latn-9303.yaml +0 -151
  217. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +0 -117
  218. data/maps/icao-rus-Cyrl-Latn-9303.yaml +0 -117
  219. data/maps/icao-srp-Cyrl-Latn-9303.yaml +0 -117
  220. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +0 -119
  221. data/maps/iso-ara-Arab-Latn-233-1984.yaml +0 -323
  222. data/maps/iso-asm-Beng-Latn-15919-2001.yaml +0 -75
  223. data/maps/iso-ben-Beng-Latn-15919-2001.yaml +0 -175
  224. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +0 -613
  225. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +0 -44
  226. data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +0 -220
  227. data/maps/iso-hin-Deva-Latn-15919-2001.yaml +0 -87
  228. data/maps/iso-inc-Deva-Latn-15919-2001.yaml +0 -61
  229. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +0 -66
  230. data/maps/iso-kan-Kana-Latn-15919-2001.yaml +0 -220
  231. data/maps/iso-kat-Geor-Latn-9984-1996.yaml +0 -145
  232. data/maps/iso-kor-Hang-Latn-1996-method1.yaml +0 -240
  233. data/maps/iso-kor-Hang-Latn-1996-method2.yaml +0 -226
  234. data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +0 -281
  235. data/maps/iso-mar-Deva-Latn-15919-2001.yaml +0 -75
  236. data/maps/iso-nep-Deva-Latn-15919-2001.yaml +0 -87
  237. data/maps/iso-ori-Orya-Latn-15919-2001.yaml +0 -193
  238. data/maps/iso-pan-Guru-Latn-15919-2001.yaml +0 -222
  239. data/maps/iso-pli-Beng-Latn-15919-2001.yaml +0 -73
  240. data/maps/iso-pli-Deva-Latn-15919-2001.yaml +0 -74
  241. data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +0 -219
  242. data/maps/iso-pli-Thai-Latn-15919-2001.yaml +0 -55
  243. data/maps/iso-pra-Deva-Latn-15919-2001.yaml +0 -59
  244. data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +0 -366
  245. data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +0 -271
  246. data/maps/iso-san-Deva-Latn-15919-2001.yaml +0 -220
  247. data/maps/iso-tam-Taml-Latn-15919-2001.yaml +0 -159
  248. data/maps/iso-tel-Telu-Latn-15919-2001.yaml +0 -220
  249. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +0 -109
  250. data/maps/kp-kor-Hang-Latn-2002.yaml +0 -909
  251. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +0 -44820
  252. data/maps/masm-mon-Cyrl-Latn-5217-2012.yaml +0 -163
  253. data/maps/masm-mon-Latn-Cyrl-5217-2012.yaml +0 -200
  254. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +0 -411
  255. data/maps/moct-kor-Hang-Latn-2000.yaml +0 -807
  256. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +0 -541
  257. data/maps/mv-div-Thaa-Latn-1987.yaml +0 -200
  258. data/maps/mvd-bel-Cyrl-Latn-2008.yaml +0 -225
  259. data/maps/mvd-bel-Cyrl-Latn-2010.yaml +0 -63
  260. data/maps/mvd-rus-Cyrl-Latn-2008.yaml +0 -109
  261. data/maps/mvd-rus-Cyrl-Latn-2010.yaml +0 -37
  262. data/maps/odni-ara-Arab-Latn-2004.yaml +0 -137
  263. data/maps/odni-ara-Arab-Latn-2015.yaml +0 -315
  264. data/maps/odni-aze-Cyrl-Latn-2015.yaml +0 -144
  265. data/maps/odni-bel-Cyrl-Latn-2015.yaml +0 -148
  266. data/maps/odni-bul-Cyrl-Latn-2005.yaml +0 -90
  267. data/maps/odni-bul-Cyrl-Latn-2015.yaml +0 -96
  268. data/maps/odni-che-Cyrl-Latn-2015.yaml +0 -169
  269. data/maps/odni-fas-Arab-Latn-2004.yaml +0 -276
  270. data/maps/odni-fas-Arab-Latn-2015.yaml +0 -406
  271. data/maps/odni-hin-Deva-Latn-2004.yaml +0 -182
  272. data/maps/odni-hin-Deva-Latn-2015.yaml +0 -258
  273. data/maps/odni-kat-Geor-Latn-2015.yaml +0 -87
  274. data/maps/odni-kaz-Cyrl-Latn-2015.yaml +0 -148
  275. data/maps/odni-kir-Cyrl-Latn-2015.yaml +0 -136
  276. data/maps/odni-kor-Hang-Latn-2015.yaml +0 -375
  277. data/maps/odni-mkd-Cyrl-Latn-2005.yaml +0 -21
  278. data/maps/odni-mkd-Cyrl-Latn-2015.yaml +0 -122
  279. data/maps/odni-prs-Arab-Latn-2004.yaml +0 -123
  280. data/maps/odni-prs-Arab-Latn-2015.yaml +0 -228
  281. data/maps/odni-rus-Cyrl-Latn-2015.yaml +0 -77
  282. data/maps/odni-srp-Cyrl-Latn-2005.yaml +0 -36
  283. data/maps/odni-srp-Cyrl-Latn-2015.yaml +0 -129
  284. data/maps/odni-tat-Cyrl-Latn-2015.yaml +0 -142
  285. data/maps/odni-tgk-Cyrl-Latn-2015.yaml +0 -148
  286. data/maps/odni-tuk-Cyrl-Latn-2015.yaml +0 -170
  287. data/maps/odni-uig-Cyrl-Latn-2015.yaml +0 -138
  288. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +0 -161
  289. data/maps/odni-urd-Arab-Latn-2015.yaml +0 -221
  290. data/maps/odni-uzb-Cyrl-Latn-2015.yaml +0 -166
  291. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +0 -90
  292. data/maps/royin-tha-Thai-Latn-1968.yaml +0 -183
  293. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +0 -180
  294. data/maps/royin-tha-Thai-Latn-1999.yaml +0 -80
  295. data/maps/sac-zho-Hans-Latn-1979.yaml +0 -24763
  296. data/maps/sasm-mon-Mong-Latn-general-1978.yaml +0 -389
  297. data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +0 -354
  298. data/maps/ses-ara-Arab-Latn-1930.yaml +0 -283
  299. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +0 -222
  300. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +0 -197
  301. data/maps/ua-ukr-Cyrl-Latn-2007.yaml +0 -75
  302. data/maps/ua-ukr-Cyrl-Latn-2010.yaml +0 -192
  303. data/maps/un-amh-Ethi-Latn-2016.yaml +0 -602
  304. data/maps/un-ara-Arab-Latn-1971.yaml +0 -139
  305. data/maps/un-ara-Arab-Latn-1972.yaml +0 -159
  306. data/maps/un-ara-Arab-Latn-2017.yaml +0 -420
  307. data/maps/un-asm-Beng-Latn-1972.yaml +0 -223
  308. data/maps/un-bel-Cyrl-Latn-2007.yaml +0 -114
  309. data/maps/un-ben-Beng-Latn-2016.yaml +0 -534
  310. data/maps/un-ell-Grek-Latn-1987-phonetic.yaml +0 -780
  311. data/maps/un-ell-Grek-Latn-1987-tl.yaml +0 -31
  312. data/maps/un-ell-Grek-Latn-1987-ts.yaml +0 -19
  313. data/maps/un-guj-Gujr-Latn-1972.yaml +0 -229
  314. data/maps/un-hin-Deva-Latn-2016.yaml +0 -316
  315. data/maps/un-kan-Kana-Latn-2016.yaml +0 -254
  316. data/maps/un-mal-Mlym-Latn-1972.yaml +0 -251
  317. data/maps/un-mar-Deva-Latn-2016.yaml +0 -102
  318. data/maps/un-mon-Mong-Latn-general-2013.yaml +0 -264
  319. data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +0 -264
  320. data/maps/un-nep-Deva-Latn-1972.yaml +0 -269
  321. data/maps/un-nep-Deva-Latn-2013.yaml +0 -74
  322. data/maps/un-ori-Orya-Latn-1972.yaml +0 -247
  323. data/maps/un-pan-Guru-Latn-1972.yaml +0 -402
  324. data/maps/un-prs-Arab-Latn-1967.yaml +0 -236
  325. data/maps/un-rus-Cyrl-Latn-1987.yaml +0 -166
  326. data/maps/un-tam-Taml-Latn-1972.yaml +0 -194
  327. data/maps/un-tel-Telu-Latn-1972.yaml +0 -270
  328. data/maps/un-ukr-Cyrl-Latn-1998.yaml +0 -53
  329. data/maps/un-ukr-Cyrl-Latn-2012.yaml +0 -162
  330. data/maps/un-urd-Arab-Latn-1972.yaml +0 -405
  331. data/maps/var-amh-Ethi-Latn-eae-2003.yaml +0 -466
  332. data/maps/var-gez-Ethi-Latn-eae-2003.yaml +0 -76
  333. data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +0 -221
  334. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +0 -406
  335. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +0 -386
  336. data/maps/var-kor-Hang-Hang-jamo.yaml +0 -11193
  337. data/maps/var-kor-Hang-Latn-mr-1939.yaml +0 -1054
  338. data/maps/var-kor-Kore-Hang-2013.yaml +0 -59754
  339. data/maps/var-kor-Kore-Latn-mr-1939.yaml +0 -36
  340. data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +0 -43
  341. data/maps/var-mon-Mong-Latn-1930.yaml +0 -102
  342. data/maps/var-mon-Mong-Latn-lessing.yaml +0 -272
  343. data/maps/var-mon-Mong-Latn-vpmc.yaml +0 -274
  344. data/maps/var-pra-Deva-Latn-iast-1912.yaml +0 -30
  345. data/maps/var-san-Deva-Latn-iast-1912.yaml +0 -149
  346. data/maps/var-tha-Thai-Thai-phonemic.yaml +0 -59
  347. data/maps/var-tha-Thai-Zsym-ipa.yaml +0 -301
  348. data/maps/var-zho-Hani-Latn-wd-1979.yaml +0 -38912
  349. data/spec/interscript/filenames_spec.rb +0 -21
  350. data/spec/interscript/mapping_spec.rb +0 -42
  351. data/spec/interscript_spec.rb +0 -37
  352. data/spec/spec_helper.rb +0 -3
@@ -1,780 +0,0 @@
1
- ---
2
- authority_id: un
3
- id: 1987-phonetic
4
- language: iso-639-2:ell
5
- source_script: Grek
6
- destination_script: Latn
7
- name: UNGEGN Greek v1.0, Fifth United Nations Conference on the Standardization of Geographical Names. Writing Systems and Guides to Pronunciation Romanization > Conversion of the Greek alphabet into Latin characters. Paper submitted by Greece and Cyprus.
8
- url: http://www.eki.ee/wgrs/rom1_el.htm
9
- creation_date: 1987
10
- description: |
11
- UNGEGN Romanization table for Greek: Phonetic transcription
12
-
13
-
14
- note:
15
- - Also included in ISO 843:1997, Annex B, Column 5, and ELOT 743:1982, column 5.
16
- - Corrected obvious errors, which occur every time the table has reappeared: χ > x, x > ks, oï > oi.
17
- - The vowels are taken from the specification, but some are controversial: /ɑ ɛ/ but /o/.
18
- - Stress is not indicated. (To do so in IPA would require syllabification in preprocessing, since stress is positioned at syllable breaks)
19
- - Followed specification in treating final μπ as b, but final ντ as nd. That distinction is dubious. (In ELOT 743:1982, both d and nd are erroneously marked as initial, and no final is given.)
20
- - τζ is not correctly transcribed as dz: fixed
21
- - not reducing geminated consonants: fixed
22
-
23
- tests:
24
-
25
- - source: |
26
- Ένα πράμα μόνον με παρακίνησε κι εμένα να γράψω ότι τούτην την πατρίδα την έχομεν όλοι μαζί,
27
-
28
- και σοφοί κι αμαθείς και πλούσιοι και φτωχοί και πολιτικοί και στρατιωτικοί και οι πλέον μικρότεροι άνθρωποι·
29
-
30
- όσοι αγωνιστήκαμεν, αναλόγως ο καθείς, έχομεν να ζήσομεν εδώ.
31
-
32
- Το λοιπόν δουλέψαμεν όλοι μαζί, να την φυλάμεν κι όλοι μαζί και να μην λέγει ούτε ο δυνατός «εγώ» ούτε ο αδύνατος.
33
-
34
- Ξέρετε πότε να λέγει ο καθείς «εγώ»; Όταν αγωνιστεί μόνος του και φκιάσει ή χαλάσει, να λέγει «εγώ»·
35
-
36
- όταν όμως αγωνίζονται πολλοί και φκιάνουν, τότε να λένε «εμείς». Είμαστε εις το «εμείς» κι όχι εις το «εγώ».
37
-
38
- Και εις το εξής να μάθομεν γνώση, αν θέλομεν να φκιάσομεν χωριόν, να ζήσομεν όλοι μαζί.
39
-
40
- Γιάννης Μακρυγιάννης.
41
-
42
- expected: |
43
- ɛnɑ prɑmɑ monon mɛ pɑrɑkinisɛ ki ɛmɛnɑ nɑ ɣrɑpso oti tutin tin pɑtriðɑ tin ɛxomɛn oli mɑzi,
44
-
45
- kɛ sofi ki ɑmɑθis kɛ plusii kɛ ftoxi kɛ politiki kɛ strɑtiotiki kɛ i plɛon mikrotɛri ɑnθropi;
46
-
47
- osi ɑɣonistikɑmɛn, ɑnɑloɣos o kɑθis, ɛxomɛn nɑ zisomɛn ɛðo.
48
-
49
- to lipon ðulɛpsɑmɛn oli mɑzi, nɑ tin filɑmɛn ki oli mɑzi kɛ nɑ min lɛɣi utɛ o ðinɑtos «ɛɣo» utɛ o ɑðinɑtos.
50
-
51
- ksɛrɛtɛ potɛ nɑ lɛɣi o kɑθis «ɛɣo»? otɑn ɑɣonisti monos tu kɛ fkiɑsi i xɑlɑsi, nɑ lɛɣi «ɛɣo»;
52
-
53
- otɑn omos ɑɣonizondɛ poli kɛ fkiɑnun, totɛ nɑ lɛnɛ «ɛmis». imɑstɛ is to «ɛmis» ki oxi is to «ɛɣo».
54
-
55
- kɛ is to ɛksis nɑ mɑθomɛn ɣnosi, ɑn θɛlomɛn nɑ fkiɑsomɛn xorion, nɑ zisomɛn oli mɑzi.
56
-
57
- ɣiɑnis mɑkriɣiɑnis.
58
-
59
-
60
- - source: ΑΘΗΝΑ
61
- expected: ɑθinɑ
62
- - source: μπαμπάκι
63
- expected: bɑmbɑki
64
- - source: νταντά
65
- expected: dɑndɑ
66
- - source: γκέγκε
67
- expected: ɡɛŋɡɛ
68
- - source: Γκαμπόν
69
- expected: ɡɑmbon
70
- - source: Μάγχη
71
- expected: mɑnxi
72
- - source: κογξ
73
- expected: konks
74
- - source: υιός
75
- expected: ios
76
- - source: Υιός
77
- expected: ios
78
- - source: νεράντζι
79
- expected: nɛrɑndzi
80
- - source: Γοίθιος
81
- expected: ɣiθios
82
- - source: μπέικον
83
- expected: bɛikon
84
- - source: μπέϊκον
85
- expected: bɛikon
86
- - source: βόλεϊ
87
- expected: volɛi
88
- - source: αθεΐα
89
- expected: ɑθɛiɑ
90
- - source: Εϊγιαφιάτλαγιοκουτλ
91
- expected: ɛiɣiɑfiɑtlɑɣiokutl
92
- - source: Εΐτζι
93
- expected: ɛidzi
94
- - source: Μυρτώο
95
- expected: mirtoo
96
- - source: αέρας
97
- expected: ɑɛrɑs
98
- - source: γαυ γαυ
99
- expected: ɣɑf ɣɑf
100
- - source: Ταΰγετος
101
- expected: tɑiɣɛtos
102
- - source: σπρέυ
103
- expected: sprɛi
104
-
105
- - source: Αθήνα
106
- expected: ɑθinɑ
107
- - source: Άγιον Όρος
108
- expected: ɑɣion oros
109
- - source: Άγραφα
110
- expected: ɑɣrɑfɑ
111
- - source: Αγρίνιο
112
- expected: ɑɣrinio
113
- - source: Αίγινα
114
- expected: ɛɣinɑ
115
- - source: Αίγιο
116
- expected: ɛɣio
117
- - source: Αλεξανδρούπολη
118
- expected: ɑlɛksɑnðrupoli
119
- - source: Αλεποχώρι
120
- expected: ɑlɛpoxori
121
- - source: Αμοργός
122
- expected: ɑmorɣos
123
- - source: Άμφισσα
124
- expected: ɑmfisɑ
125
- - source: Αράχωβα
126
- expected: ɑrɑxovɑ
127
- - source: Άργος
128
- expected: ɑrɣos
129
- - source: Αρκαδία
130
- expected: ɑrkɑðiɑ
131
- - source: Άρτα
132
- expected: ɑrtɑ
133
- - source: Βελούχι
134
- expected: vɛluxi
135
- - source: Βέροια
136
- expected: vɛriɑ
137
- - source: Βοιωτία
138
- expected: viotiɑ
139
- - source: Βόλος
140
- expected: volos
141
- - source: Βόνιτσα
142
- expected: vonitsɑ
143
- - source: Γαλαξίδι
144
- expected: ɣɑlɑksiði
145
- - source: Γαλάτσι
146
- expected: ɣɑlɑtsi
147
- - source: Γιαννιτσά
148
- expected: ɣiɑnitsɑ
149
- - source: Γλυφάδα
150
- expected: ɣlifɑðɑ
151
- - source: Γρανίτσα
152
- expected: ɣrɑnitsɑ
153
- - source: Γρεβενά
154
- expected: ɣrɛvɛnɑ
155
- - source: Γύθειο
156
- expected: ɣiθio
157
- - source: Διόνυσος
158
- expected: ðionisos
159
- - source: Δίστομο
160
- expected: ðistomo
161
- - source: Δολιανά
162
- expected: ðoliɑnɑ
163
- - source: Δράμα
164
- expected: ðrɑmɑ
165
- - source: Δωδεκάνησα
166
- expected: ðoðɛkɑnisɑ
167
- - source: Έδεσσα
168
- expected: ɛðɛsɑ
169
- - source: Ελευσίνα
170
- expected: ɛlɛfsinɑ
171
- - source: Επίδαυρος
172
- expected: ɛpiðɑvros
173
- - source: Επτάνησα
174
- expected: ɛptɑnisɑ
175
- - source: Ερμούπολη
176
- expected: ɛrmupoli
177
- - source: Εύβοια
178
- expected: ɛviɑ
179
- - source: Ζάκυνθος
180
- expected: zɑkinθos
181
- - source: Ήπειρος
182
- expected: ipiros
183
- - source: Ηράκλειο
184
- expected: irɑklio
185
- - source: Θάσος
186
- expected: θɑsos
187
- - source: Θεσσαλονίκη
188
- expected: θɛsɑloniki
189
- - source: Θεσσαλία
190
- expected: θɛsɑliɑ
191
- - source: Θεσπρωτία
192
- expected: θɛsprotiɑ
193
- - source: Θήβα
194
- expected: θivɑ
195
- - source: Θράκη
196
- expected: θrɑki
197
- - source: Ιθάκη
198
- expected: iθɑki
199
- - source: Ίος
200
- expected: ios
201
- - source: Ιωάννινα
202
- expected: ioɑninɑ
203
- - source: Καβάλα
204
- expected: kɑvɑlɑ
205
- - source: Καλάβρυτα
206
- expected: kɑlɑvritɑ
207
- - source: Καλαμάτα
208
- expected: kɑlɑmɑtɑ
209
- - source: Καλαμπάκα
210
- expected: kɑlɑmbɑkɑ
211
- - source: Καλύβια
212
- expected: kɑliviɑ
213
- - source: Κάλυμνος
214
- expected: kɑlimnos
215
- - source: Καρδίτσα
216
- expected: kɑrðitsɑ
217
- - source: Καρπενήσι
218
- expected: kɑrpɛnisi
219
- - source: Κάρυστος
220
- expected: kɑristos
221
- - source: Καστελλόριζο
222
- expected: kɑstɛlorizo
223
- - source: Καστοριά
224
- expected: kɑstoriɑ
225
- - source: Κατερίνη
226
- expected: kɑtɛrini
227
- - source: Κάτω Αχαΐα
228
- expected: kɑto ɑxɑiɑ
229
- - source: Κερατέα
230
- expected: kɛrɑtɛɑ
231
- - source: Κέρκυρα
232
- expected: kɛrkirɑ
233
- - source: Κεφαλλονιά
234
- expected: kɛfɑloniɑ
235
- - source: Κηφισιά
236
- expected: kifisiɑ
237
- - source: Κιλκίς
238
- expected: kilkis
239
- - source: Κοζάνη
240
- expected: kozɑni
241
- - source: Κολωνός
242
- expected: kolonos
243
- - source: Κομοτηνή
244
- expected: komotini
245
- - source: Κόρινθος
246
- expected: korinθos
247
- - source: Κορώνη
248
- expected: koroni
249
- - source: Κρανίδι
250
- expected: krɑniði
251
- - source: Κρέστενα
252
- expected: krɛstɛnɑ
253
- - source: Κρήτη
254
- expected: kriti
255
- - source: Κύθηρα
256
- expected: kiθirɑ
257
- - source: Κυκλάδες
258
- expected: kiklɑðɛs
259
- - source: Κύμη
260
- expected: kimi
261
- - source: Κυψέλη
262
- expected: kipsɛli
263
- - source: Κως
264
- expected: kos
265
- - source: Λαγκαδάς
266
- expected: lɑŋɡɑðɑs
267
- - source: Λαμία
268
- expected: lɑmiɑ
269
- - source: Λάρισα
270
- expected: lɑrisɑ
271
- - source: Λαύριο
272
- expected: lɑvrio
273
- - source: Λέρος
274
- expected: lɛros
275
- - source: Λέσβος
276
- expected: lɛzvos
277
- - source: Λευκάδα
278
- expected: lɛfkɑðɑ
279
- - source: Λήμνος
280
- expected: limnos
281
- - source: Λιβαδειά
282
- expected: livɑðiɑ
283
- - source: Μακεδονία
284
- expected: mɑkɛðoniɑ
285
- - source: Μάνη
286
- expected: mɑni
287
- - source: Μαραθώνας
288
- expected: mɑrɑθonɑs
289
- - source: Μαρκόπουλο
290
- expected: mɑrkopulo
291
- - source: Μαρούσι
292
- expected: mɑrusi
293
- - source: Μέγαρα
294
- expected: mɛɣɑrɑ
295
- - source: Μεσολόγγι
296
- expected: mɛsoloŋɡi
297
- - source: Μεταξουργείο
298
- expected: mɛtɑksurɣio
299
- - source: Μέτσοβο
300
- expected: mɛtsovo
301
- - source: Μήλος
302
- expected: milos
303
- - source: Μύκονος
304
- expected: mikonos
305
- - source: Μυστράς
306
- expected: mistrɑs
307
- - source: Μυτιλήνη
308
- expected: mitilini
309
- - source: Νάξος
310
- expected: nɑksos
311
- - source: Νάουσα
312
- expected: nɑusɑ
313
- - source: Ναύπακτος
314
- expected: nɑfpɑktos
315
- - source: Ναύπλιο
316
- expected: nɑfplio
317
- - source: Νέα Σμύρνη
318
- expected: nɛɑ zmirni
319
- - source: Νίσυρος
320
- expected: nisiros
321
- - source: Ξάνθη
322
- expected: ksɑnθi
323
- - source: Όλυμπος
324
- expected: olimbos
325
- - source: Παγκράτι
326
- expected: pɑŋɡrɑti
327
- - source: Παπάγου
328
- expected: pɑpɑɣu
329
- - source: Πάρος
330
- expected: pɑros
331
- - source: Πασαλιμάνι
332
- expected: pɑsɑlimɑni
333
- - source: Πατήσια
334
- expected: pɑtisiɑ
335
- - source: Πάτμος
336
- expected: pɑtmos
337
- - source: Πάτρα
338
- expected: pɑtrɑ
339
- - source: Πειραιάς
340
- expected: pirɛɑs
341
- - source: Πελοπόννησος
342
- expected: pɛloponisos
343
- - source: Περιστέρι
344
- expected: pɛristɛri
345
- - source: Πεύκη
346
- expected: pɛfki
347
- - source: Πήλιο
348
- expected: pilio
349
- - source: Πολύγυρος
350
- expected: poliɣiros
351
- - source: Πόρος
352
- expected: poros
353
- - source: Πρέβεζα
354
- expected: prɛvɛzɑ
355
- - source: Πτολεμαΐδα
356
- expected: ptolɛmɑiðɑ
357
- - source: Πύλος
358
- expected: pilos
359
- - source: Πύργος
360
- expected: pirɣos
361
- - source: Ρέθυμνο
362
- expected: rɛθimno
363
- - source: Ρόδος
364
- expected: roðos
365
- - source: Ρούμελη
366
- expected: rumɛli
367
- - source: Σαλαμίνα
368
- expected: sɑlɑminɑ
369
- - source: Σαμοθράκη
370
- expected: sɑmoθrɑki
371
- - source: Σάμος
372
- expected: sɑmos
373
- - source: Σαντορίνη
374
- expected: sɑndorini
375
- - source: Σέρρες
376
- expected: sɛrɛs
377
- - source: Σίκινος
378
- expected: sikinos
379
- - source: Σίφνος
380
- expected: sifnos
381
- - source: Σκιάθος
382
- expected: skiɑθos
383
- - source: Σκόπελος
384
- expected: skopɛlos
385
- - source: Σούλι
386
- expected: suli
387
- - source: Σπάρτη
388
- expected: spɑrti
389
- - source: Στερεά Ελλάδα
390
- expected: stɛrɛɑ ɛlɑðɑ
391
- - source: Στύρα
392
- expected: stirɑ
393
- - source: Σύμη
394
- expected: simi
395
- - source: Σύρος
396
- expected: siros
397
- - source: Σφακιά
398
- expected: sfɑkiɑ
399
- - source: Τήλος
400
- expected: tilos
401
- - source: Τήνος
402
- expected: tinos
403
- - source: Τρίκαλα
404
- expected: trikɑlɑ
405
- - source: Τρίπολη
406
- expected: tripoli
407
- - source: Τσακωνιά
408
- expected: tsɑkoniɑ
409
- - source: Ύδρα
410
- expected: iðrɑ
411
- - source: Φάληρο
412
- expected: fɑliro
413
- - source: Φλώρινα
414
- expected: florinɑ
415
- - source: Φολέγανδρος
416
- expected: folɛɣɑnðros
417
- - source: Χάλκη
418
- expected: xɑlki
419
- - source: Χαλκίδα
420
- expected: xɑlkiðɑ
421
- - source: Χαλάνδρι
422
- expected: xɑlɑnðri
423
- - source: Χαλκιδική
424
- expected: xɑlkiðiki
425
- - source: Χανιά
426
- expected: xɑniɑ
427
- - source: Χίος
428
- expected: xios
429
- - source: Ψαρά
430
- expected: psɑrɑ
431
- - source: Αβάνα
432
- expected: ɑvɑnɑ
433
- - source: Αγγλία
434
- expected: ɑŋɡliɑ
435
- - source: Αϊβαλί
436
- expected: ɑivɑli
437
- - source: Αλεξάνδρεια
438
- expected: ɑlɛksɑnðriɑ
439
- - source: Άμστερνταμ
440
- expected: ɑmstɛrndɑm
441
- - source: Βαυαρία
442
- expected: vɑvɑriɑ
443
- - source: Βενετία
444
- expected: vɛnɛtiɑ
445
- - source: Βερολίνο
446
- expected: vɛrolino
447
- - source: Βερόνα
448
- expected: vɛronɑ
449
- - source: Βιέννη
450
- expected: viɛni
451
- - source: Γένοβα
452
- expected: ɣɛnovɑ
453
- - source: Δουβλίνο
454
- expected: ðuvlino
455
- - source: Καλαβρία
456
- expected: kɑlɑvriɑ
457
- - source: Καλιφόρνια
458
- expected: kɑliforniɑ
459
- - source: Καύκασος
460
- expected: kɑfkɑsos
461
- - source: Κονγκό
462
- expected: konŋɡo
463
- - source: Κορσική
464
- expected: korsiki
465
- - source: Κουρδιστάν
466
- expected: kurðistɑn
467
- - source: Κωνσταντινούπολη
468
- expected: konstɑndinupoli
469
- - source: Κατεχόμενη Κύπρος
470
- expected: kɑtɛxomɛni kipros
471
- - source: Λαπωνία
472
- expected: lɑponiɑ
473
- - source: Λευκωσία
474
- expected: lɛfkosiɑ
475
- - source: Λιβόρνο
476
- expected: livorno
477
- - source: Λονδίνο
478
- expected: lonðino
479
- - source: Λυών
480
- expected: lion
481
- - source: Μάλαγα
482
- expected: mɑlɑɣɑ
483
- - source: Μασσαλία
484
- expected: mɑsɑliɑ
485
- - source: Μικρονησία
486
- expected: mikronisiɑ
487
- - source: Μιλάνο
488
- expected: milɑno
489
- - source: Μόσχα
490
- expected: mosxɑ
491
- - source: Μπολόνια
492
- expected: boloniɑ
493
- - source: Νάπολη
494
- expected: nɑpoli
495
- - source: Νταγκεστάν
496
- expected: dɑŋɡɛstɑn
497
- - source: Νέα Υόρκη
498
- expected: nɛɑ iorki
499
- - source: Οξφόρδη
500
- expected: oksforði
501
- - source: Ουαλία
502
- expected: uɑliɑ
503
- - source: Παρίσι
504
- expected: pɑrisi
505
- - source: Πάφος
506
- expected: pɑfos
507
- - source: Πολυνησία
508
- expected: polinisiɑ
509
- - source: Ρώμη
510
- expected: romi
511
- - source: Σαμάρεια
512
- expected: sɑmɑriɑ
513
- - source: Σικελία
514
- expected: sikɛliɑ
515
- - source: Σκανδιναβία
516
- expected: skɑnðinɑviɑ
517
- - source: Σκόπια
518
- expected: skopiɑ
519
- - source: Σκωτία
520
- expected: skotiɑ
521
- - source: Σμύρνη
522
- expected: zmirni
523
- - source: Ταϊτή
524
- expected: tɑiti
525
- - source: Ταταρστάν
526
- expected: tɑtɑrstɑn
527
- - source: Τζαμάικα
528
- expected: dzɑmɑikɑ
529
- - source: Τηλλυρία
530
- expected: tiliriɑ
531
- - source: Τιρόλο
532
- expected: tirolo
533
- - source: Τορίνο
534
- expected: torino
535
- - source: Φανάρι
536
- expected: fɑnɑri
537
- - source: Φλωρεντία
538
- expected: florɛndiɑ
539
- - source: Χαβάη
540
- expected: xɑvɑi
541
- - source: Χονγκ Κονγκ
542
- expected: xonŋɡ konŋɡ
543
-
544
- map:
545
- downcase: True
546
-
547
- # https://en.wikipedia.org/wiki/Romanization_of_Greek
548
- rules:
549
- - pattern: (?<=[ΑαΕεΗη])\u03A5(?=[θΘκΚξΞπΠσΣςτΤφΦχΧψΨ]) # Υ (after Α, Ε, Η)
550
- result: f
551
- - pattern: (?<=[ΑαΕεΗη])\u03A5(?=\b) # Υ (after Α, Ε, Η)
552
- result: f
553
- - pattern: (?<=[ΑαΕεΗη])\u03C5(?=[θΘκΚξΞπΠσΣςτΤφΦχΧψΨ]) # υ (after Α, Ε, Η)
554
- result: f
555
- - pattern: (?<=[ΑαΕεΗη])\u03C5(?=\b) # υ (after Α, Ε, Η)
556
- result: f
557
- - pattern: (?<=[ΑαΕεΗη])\u03A5 # Υ (after Α, Ε, Η)
558
- result: v
559
- - pattern: (?<=[ΑαΕεΗη])\u03C5 # υ (after Α, Ε, Η)
560
- result: v
561
- - pattern: \u0391\u03CD(?=[θΘκΚξΞπΠσΣςτΤφΦχΧψΨ]) # Αύ
562
- result: ɑf
563
- - pattern: \u0391\u03CD(?=\b) # Αύ
564
- result: ɑf
565
- - pattern: \u0391\u03CD # Αύ
566
- result: ɑv
567
- - pattern: \u03B1\u03CD(?=[θΘκΚξΞπΠσΣςτΤφΦχΧψΨ]) # αύ
568
- result: ɑf
569
- - pattern: \u03B1\u03CD(?=\b) # αύ
570
- result: ɑf
571
- - pattern: \u03B1\u03CD # αύ
572
- result: ɑv
573
- - pattern: \u0395\u03CD(?=[θΘκΚξΞπΠσΣςτΤφΦχΧψΨ]) # Εύ
574
- result: ɛf
575
- - pattern: \u0395\u03CD(?=\b) # Εύ
576
- result: ɛf
577
- - pattern: \u0395\u03CD # Εύ
578
- result: ɛv
579
- - pattern: \u03B5\u03CD(?=[θΘκΚξΞπΠσΣςτΤφΦχΧψΨ]) # εύ
580
- result: ɛf
581
- - pattern: \u03B5\u03CD(?=\b) # εύ
582
- result: ɛf
583
- - pattern: \u03B5\u03CD # εύ
584
- result: ɛv
585
- - pattern: \u0397\u03CD(?=[θΘκΚξΞπΠσΣςτΤφΦχΧψΨ]) # Ηύ
586
- result: if
587
- - pattern: \u0397\u03CD(?=\b) # Ηύ
588
- result: if
589
- - pattern: \u0397\u03CD # Ηύ
590
- result: iv
591
- - pattern: \u03B7\u03CD(?=[θΘκΚξΞπΠσΣςτΤφΦχΧψΨ]) # ηύ
592
- result: if
593
- - pattern: \u03B7\u03CD(?=\b) # ηύ
594
- result: if
595
- - pattern: \u03B7\u03CD # ηύ
596
- result: iv
597
- - pattern: \u039F[υΥύ] # Υ (after Ο)
598
- result: u
599
- - pattern: \u03BF[υΥύ] # υ (after Ο)
600
- result: u
601
- - pattern: (?<=[ΆάΈέΉήΌό])\u03A5 # Άυ, Έυ, Ήυ, Όυ
602
- result: i
603
- - pattern: (?<=[ΆάΈέΉήΌό])\u03C5 # Άυ, Έυ, Ήυ, Όυ
604
- result: i
605
- - pattern: \u0393(?=[ξΞχΧ]) # Γ (before Ξ, Χ)
606
- result: n
607
- - pattern: \u03B3(?=[ξΞχΧ]) # γ (before Ξ, Χ)
608
- result: n
609
- - pattern: (?<!\b)\u0393[Γγ] # Γ (before Γ)
610
- result: ŋɡ
611
- - pattern: (?<!\b)\u03B3\u03B3 # γ (before γ)
612
- result: ŋɡ
613
- - pattern: (?<!\b)\u0393[Κκ] # Γ (before Κ)
614
- result: ŋɡ
615
- - pattern: (?<!\b)\u03B3[Κκ] # γ (before Κ)
616
- result: ŋɡ
617
- - pattern: (?<=\b)\u0393[Γγ] # Γ (before Γ)
618
- result: ɡ
619
- - pattern: (?<=\b)\u03B3\u03B3 # γ (before γ)
620
- result: ɡ
621
- - pattern: (?<=\b)\u0393[Κκ] # Γ (before Κ)
622
- result: ɡ
623
- - pattern: (?<=\b)\u03B3[Κκ] # γ (before Κ)
624
- result: ɡ
625
- - pattern: (?<=\b)\u039C[πΠ] # ΜΠ (initially)
626
- result: b
627
- - pattern: (?<=\b)\u03BC[πΠ] # μπ (initially)
628
- result: b
629
- - pattern: \u039C[πΠ](?=\b) # ΜΠ (finally)
630
- result: b
631
- - pattern: \u03BC[πΠ](?=\b) # μπ (finally)
632
- result: b
633
- - pattern: (?<!\b)\u039C[πΠ](?!\b) # ΜΠ (medially)
634
- result: mb
635
- - pattern: (?<!\b)\u03BC[πΠ](?!\b) # μπ (medially)
636
- result: mb
637
- - pattern: (?<=\b)[Νν][ττ] # Ντ (initial)
638
- result: d
639
- - pattern: (?<!\b)[Νν][ττ] # Ντ (medial, final)
640
- result: nd
641
- - pattern: \u03A3(?=[ΒβΓγΔδΖζΛλΜμΝνΡρ]) # Σ (before voiced consonants)
642
- result: z
643
- - pattern: \u03C3(?=[ΒβΓγΔδΖζΛλΜμΝνΡρ]) # σ (before voiced consonants)
644
- result: z
645
- - pattern: \u0391[Ιιί] # Αι
646
- result: ɛ
647
- - pattern: \u03B1[Ιιί] # αι
648
- result: ɛ
649
- - pattern: \u03A5[Ιιί] # Υι
650
- result: i
651
- - pattern: \u03C5[Ιιί] # υι
652
- result: i
653
- - pattern: \u0395[Ιιί] # Ει
654
- result: i
655
- - pattern: \u03B5[Ιιί] # ει
656
- result: i
657
- - pattern: \u039F[Ιιί] # Οι
658
- result: i
659
- - pattern: \u03BF[Ιιί] # οι
660
- result: i
661
- - pattern: \u03A4[ζΖ] # Τζ
662
- result: dz
663
- - pattern: \u03c4[ζΖ] # τζ
664
- result: dz
665
- - pattern: \u037E # ; (U+037E, Greek question mark)
666
- result: "?"
667
- - pattern: \u003B # ; (U+003B, ASCII semicolon used as the Greek question mark)
668
- result: "?"
669
-
670
- characters:
671
- "\u0027": ""
672
- "\u0386": "ɑ" # Ά
673
- "\u0391": "ɑ" # Α
674
- "\u0392": "v" # Β
675
- "\u0393": "ɣ" # Γ
676
- "\u0394": "ð" # Δ
677
- "\u0395": "ɛ" # Ε
678
- "\u0395\u03AA": "ɛi" # ΕΪ
679
- "\u0395\u03CA": "ɛi" # Εϊ
680
- "\u0388\u03CA": "ɛi" # Έϊ
681
- "\u0396": "z" # Ζ
682
- "\u0397": "i" # Η
683
- "\u0398": "θ" # Θ
684
- "\u0399": "i" # Ι
685
- "\u039A": "k" # Κ
686
- "\u039B": "l" # Λ
687
- "\u039C": "m" # Μ
688
- "\u039D": "n" # Ν
689
- "\u039E": "ks" # Ξ
690
- "\u039F": "o" # Ο
691
- "\u03A0": "p" # Π
692
- "\u03A1": "r" # Ρ
693
- "\u03A3": "s" # Σ
694
- "\u03A4": "t" # Τ
695
- "\u03A5": "i" # Υ
696
- "\u03A6": "f" # Φ
697
- "\u03A7": "x" # Χ
698
- "\u03A8": "ps" # Ψ
699
- "\u03A9": "o" # Ω
700
- "\u0388": "ɛ" # Έ
701
- "\u0389": "i" # Ή
702
- "\u038A": "i" # Ί
703
- "\u038C": "o" # Ό
704
- "\u038E": "i" # Ύ
705
- "\u038F": "o" # Ώ
706
- "\u03AA": "i" # Ϊ
707
- "\u03AB": "i" # Ϋ
708
-
709
- "\u03AC": "ɑ" # ά
710
- "\u03B1": "ɑ" # α
711
- "\u03B2": "v" # β
712
- "\u03B3": "ɣ" # γ
713
- "\u03B4": "ð" # δ
714
- "\u03B5": "ɛ" # ε
715
- "\u03B5\u03CA": "ɛi" # εϊ
716
- "\u03AD\u03CA": "ɛi" # έϊ
717
- "\u03AD\u03B9": "ɛi" # έι
718
- "\u03B6": "z" # ζ
719
- "\u03B7": "i" # η
720
- #"\u03B8": "θ" # θ
721
- "\u03B9": "i" # ι
722
- "\u03BA": "k" # κ
723
- "\u03BB": "l" # λ
724
- "\u03BC": "m" # μ
725
- "\u03BD": "n" # ν
726
- "\u03BE": "ks" # ξ
727
- "\u03BF": "o" # ο
728
- "\u03C0": "p" # π
729
- "\u03C1": "r" # ρ
730
- "\u03C3": "s" # σ
731
- "\u03C2": "s" # ς
732
- "\u03C4": "t" # τ
733
- "\u03C5": "i" # υ
734
- "\u03C6": "f" # φ
735
- "\u03C7": "x" # χ
736
- "\u03C8": "ps" # ψ
737
- "\u03C9": "o" # ω
738
- "\u03AD": "ɛ" # έ
739
- "\u03AE": "i" # ή
740
- "\u03AF": "i" # ί
741
- "\u03CC": "o" # ό
742
- "\u03CD": "i" # ύ
743
- "\u03CE": "o" # ώ
744
- "\u03CA": "i" # ϊ
745
- "\u03CB": "i" # ϋ
746
- "\u0390": "i" # ΐ
747
- "\u03B0": "i" # ΰ
748
-
749
- "\u0387": ";" # ·
750
- "\u00B7": ";" # ·
751
-
752
- postrules:
753
- - pattern: vv
754
- result: "v"
755
- - pattern: ðð
756
- result: "ð"
757
- - pattern: zz
758
- result: "z"
759
- - pattern: θθ
760
- result: "θ"
761
- - pattern: kk
762
- result: "k"
763
- - pattern: ll
764
- result: "l"
765
- - pattern: mm
766
- result: "m"
767
- - pattern: nn
768
- result: "n"
769
- - pattern: pp
770
- result: "p"
771
- - pattern: rr
772
- result: "r"
773
- - pattern: ss
774
- result: "s"
775
- - pattern: tt
776
- result: "t"
777
- - pattern: ff
778
- result: "f"
779
- - pattern: xx
780
- result: "x"