interscript 0.1.9 → 2.0.5

Sign up to get free protection for your applications and to get access to all the features.
Files changed (352) hide show
  1. checksums.yaml +4 -4
  2. data/.gitignore +11 -0
  3. data/.rspec +3 -0
  4. data/Gemfile +29 -0
  5. data/LICENSE.adoc +31 -0
  6. data/README.md +3 -0
  7. data/Rakefile +53 -0
  8. data/bin/console +14 -0
  9. data/bin/interscript +5 -0
  10. data/bin/maps_analyze_staging +168 -0
  11. data/bin/maps_debug_compilers +58 -0
  12. data/bin/maps_debug_ordering +88 -0
  13. data/bin/maps_debug_ruby_compile +24 -0
  14. data/bin/maps_debug_step_by_step +44 -0
  15. data/bin/maps_optimize_order +112 -0
  16. data/bin/maps_v1_analyze_regexps +45 -0
  17. data/bin/maps_v1_to_v2 +426 -0
  18. data/bin/setup +8 -0
  19. data/exe/interscript +6 -0
  20. data/interscript.gemspec +31 -0
  21. data/lib/interscript.rb +80 -135
  22. data/lib/interscript/command.rb +5 -5
  23. data/lib/interscript/compiler.rb +22 -0
  24. data/lib/interscript/compiler/javascript.rb +292 -0
  25. data/lib/interscript/compiler/ruby.rb +262 -0
  26. data/lib/interscript/dsl.rb +67 -0
  27. data/lib/interscript/dsl/aliases.rb +23 -0
  28. data/lib/interscript/dsl/document.rb +46 -0
  29. data/lib/interscript/dsl/group.rb +45 -0
  30. data/lib/interscript/dsl/group/parallel.rb +6 -0
  31. data/lib/interscript/dsl/items.rb +89 -0
  32. data/lib/interscript/dsl/metadata.rb +26 -0
  33. data/lib/interscript/dsl/stage.rb +6 -0
  34. data/lib/interscript/dsl/symbol_mm.rb +11 -0
  35. data/lib/interscript/dsl/tests.rb +12 -0
  36. data/lib/interscript/interpreter.rb +251 -0
  37. data/lib/interscript/node.rb +25 -0
  38. data/lib/interscript/node/alias_def.rb +15 -0
  39. data/lib/interscript/node/dependency.rb +13 -0
  40. data/lib/interscript/node/document.rb +45 -0
  41. data/lib/interscript/node/group.rb +34 -0
  42. data/lib/interscript/node/group/parallel.rb +9 -0
  43. data/lib/interscript/node/group/sequential.rb +2 -0
  44. data/lib/interscript/node/item.rb +52 -0
  45. data/lib/interscript/node/item/alias.rb +42 -0
  46. data/lib/interscript/node/item/any.rb +61 -0
  47. data/lib/interscript/node/item/capture.rb +50 -0
  48. data/lib/interscript/node/item/group.rb +51 -0
  49. data/lib/interscript/node/item/repeat.rb +40 -0
  50. data/lib/interscript/node/item/stage.rb +23 -0
  51. data/lib/interscript/node/item/string.rb +51 -0
  52. data/lib/interscript/node/metadata.rb +18 -0
  53. data/lib/interscript/node/rule.rb +6 -0
  54. data/lib/interscript/node/rule/funcall.rb +18 -0
  55. data/lib/interscript/node/rule/run.rb +15 -0
  56. data/lib/interscript/node/rule/sub.rb +65 -0
  57. data/lib/interscript/node/stage.rb +19 -0
  58. data/lib/interscript/node/tests.rb +15 -0
  59. data/lib/interscript/stdlib.rb +211 -0
  60. data/lib/interscript/utils/regexp_converter.rb +283 -0
  61. data/lib/interscript/version.rb +1 -1
  62. data/requirements.txt +1 -0
  63. metadata +73 -458
  64. data/README.adoc +0 -296
  65. data/aliases.json +0 -1
  66. data/lib/g2pwrapper.py +0 -34
  67. data/lib/interscript/fs.rb +0 -96
  68. data/lib/interscript/mapping.rb +0 -144
  69. data/lib/interscript/opal.rb +0 -196
  70. data/lib/interscript/opal/entrypoint.rb +0 -20
  71. data/lib/interscript/opal/exports.rb +0 -11
  72. data/lib/interscript/opal/maps.js.erb +0 -8
  73. data/lib/model-7 +0 -0
  74. data/lib/tha-pt-b-7 +0 -0
  75. data/maps/acadsin-zho-Hani-Latn-2002.yaml +0 -38916
  76. data/maps/alalc-amh-Ethi-Latn-1997.yaml +0 -513
  77. data/maps/alalc-amh-Ethi-Latn-2011.yaml +0 -138
  78. data/maps/alalc-ara-Arab-Latn-1997.yaml +0 -1287
  79. data/maps/alalc-asm-Deva-Latn-1997.yaml +0 -259
  80. data/maps/alalc-asm-Deva-Latn-2012.yaml +0 -55
  81. data/maps/alalc-aze-Arab-Latn-1997.yaml +0 -376
  82. data/maps/alalc-aze-Cyrl-Latn-1997.yaml +0 -145
  83. data/maps/alalc-bel-Cyrl-Latn-1997.yaml +0 -129
  84. data/maps/alalc-ben-Beng-Latn-1997.yaml +0 -291
  85. data/maps/alalc-ben-Beng-Latn-2017.yaml +0 -130
  86. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +0 -98
  87. data/maps/alalc-div-Thaa-Latn-1997.yaml +0 -211
  88. data/maps/alalc-ell-Grek-Latn-1997.yaml +0 -628
  89. data/maps/alalc-ell-Grek-Latn-2010.yaml +0 -626
  90. data/maps/alalc-guj-Gujr-Latn-1997.yaml +0 -266
  91. data/maps/alalc-guj-Gujr-Latn-2011.yaml +0 -64
  92. data/maps/alalc-hin-Deva-Latn-1997.yaml +0 -303
  93. data/maps/alalc-hin-Deva-Latn-2011.yaml +0 -65
  94. data/maps/alalc-kan-Kana-Latn-1997.yaml +0 -274
  95. data/maps/alalc-kan-Kana-Latn-2011.yaml +0 -63
  96. data/maps/alalc-kat-Geok-Latn-1997.yaml +0 -111
  97. data/maps/alalc-kat-Geor-Latn-1997.yaml +0 -150
  98. data/maps/alalc-kor-Hang-Latn-1997.yaml +0 -98
  99. data/maps/alalc-mal-Mlym-Latn-1997.yaml +0 -303
  100. data/maps/alalc-mal-Mlym-Latn-2012.yaml +0 -73
  101. data/maps/alalc-mar-Deva-Latn-1997.yaml +0 -189
  102. data/maps/alalc-mar-Deva-Latn-2011.yaml +0 -45
  103. data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +0 -114
  104. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +0 -103
  105. data/maps/alalc-mon-Cyrl-Latn-1997.yaml +0 -220
  106. data/maps/alalc-ori-Orya-Latn-1997.yaml +0 -284
  107. data/maps/alalc-ori-Orya-Latn-2011.yaml +0 -67
  108. data/maps/alalc-pan-Guru-Latn-1997.yaml +0 -256
  109. data/maps/alalc-pan-Guru-Latn-2011.yaml +0 -78
  110. data/maps/alalc-per-Arab-Latn-1997.yaml +0 -375
  111. data/maps/alalc-pli-Deva-Latn-2012.yaml +0 -144
  112. data/maps/alalc-pra-Deva-Latn-2012.yaml +0 -47
  113. data/maps/alalc-rus-Cyrl-Latn-1997.yaml +0 -225
  114. data/maps/alalc-rus-Cyrl-Latn-2012.yaml +0 -162
  115. data/maps/alalc-san-Deva-Latn-2012.yaml +0 -241
  116. data/maps/alalc-sin-Sinh-Latn-1997.yaml +0 -292
  117. data/maps/alalc-sin-Sinh-Latn-2011.yaml +0 -71
  118. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +0 -118
  119. data/maps/alalc-srp-Cyrl-Latn-2013.yaml +0 -135
  120. data/maps/alalc-tam-Taml-Latn-1997.yaml +0 -62
  121. data/maps/alalc-tam-Taml-Latn-2011.yaml +0 -58
  122. data/maps/alalc-tel-Telu-Latn-1997.yaml +0 -284
  123. data/maps/alalc-tel-Telu-Latn-2011.yaml +0 -64
  124. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +0 -145
  125. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +0 -16
  126. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +0 -283
  127. data/maps/az-aze-Cyrl-Latn-1939.yaml +0 -105
  128. data/maps/az-aze-Cyrl-Latn-1958.yaml +0 -45
  129. data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +0 -174
  130. data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +0 -169
  131. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +0 -292
  132. data/maps/bgn-kor-Hang-Latn-1943.yaml +0 -35
  133. data/maps/bgn-kor-Kore-Latn-1943.yaml +0 -31
  134. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +0 -208
  135. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +0 -208
  136. data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +0 -532
  137. data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +0 -598
  138. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +0 -108
  139. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +0 -111
  140. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +0 -188
  141. data/maps/bgnpcgn-bal-Arab-Latn-2008.yaml +0 -329
  142. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +0 -289
  143. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +0 -119
  144. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +0 -42
  145. data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +0 -184
  146. data/maps/bgnpcgn-div-Thaa-Latn-1988.yaml +0 -75
  147. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +0 -705
  148. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +0 -23
  149. data/maps/bgnpcgn-far-Latn-Latn-1964.yaml +0 -28
  150. data/maps/bgnpcgn-fas-Arab-Latn-1956.yaml +0 -96
  151. data/maps/bgnpcgn-isl-Latn-Latn-1964.yaml +0 -37
  152. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +0 -257
  153. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +0 -131
  154. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +0 -42
  155. data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.yaml +0 -247
  156. data/maps/bgnpcgn-kir-Cyrl-Latn-1979.yaml +0 -218
  157. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +0 -253
  158. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +0 -48
  159. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +0 -48
  160. data/maps/bgnpcgn-kur-Arab-Latn-2007.yaml +0 -249
  161. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +0 -163
  162. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +0 -190
  163. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +0 -223
  164. data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +0 -230
  165. data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +0 -338
  166. data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +0 -673
  167. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +0 -459
  168. data/maps/bgnpcgn-pus-Arab-Latn-1968.yaml +0 -377
  169. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +0 -168
  170. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +0 -318
  171. data/maps/bgnpcgn-srp-Cyrl-Latn-1962.yaml +0 -73
  172. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +0 -170
  173. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +0 -220
  174. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +0 -240
  175. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +0 -166
  176. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +0 -119
  177. data/maps/bgnpcgn-urd-Arab-Latn-2007.yaml +0 -459
  178. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +0 -127
  179. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +0 -82
  180. data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +0 -7456
  181. data/maps/bis-asm-Beng-Latn-13194-1991.yaml +0 -159
  182. data/maps/bis-ben-Beng-Latn-13194-1991.yaml +0 -156
  183. data/maps/bis-dev-Deva-Latn-13194-1991.yaml +0 -184
  184. data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +0 -181
  185. data/maps/bis-kan-Kana-Latn-13194-1991.yaml +0 -173
  186. data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +0 -176
  187. data/maps/bis-ori-Orya-Latn-13194-1991.yaml +0 -175
  188. data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +0 -175
  189. data/maps/bis-tel-Telu-Latn-13194-1991.yaml +0 -170
  190. data/maps/bis-tml-Taml-Latn-13194-1991.yaml +0 -155
  191. data/maps/by-bel-Cyrl-Latn-1998.yaml +0 -172
  192. data/maps/by-bel-Cyrl-Latn-2007.yaml +0 -115
  193. data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +0 -899
  194. data/maps/din-hin-Deva-Latn-33904-2018.yaml +0 -100
  195. data/maps/din-kat-Geor-Latn-32707-2010.yaml +0 -145
  196. data/maps/din-mar-Deva-Latn-33904-2018.yaml +0 -84
  197. data/maps/din-nep-Deva-Latn-33904-2018.yaml +0 -119
  198. data/maps/din-pli-Deva-Latn-33904-2018.yaml +0 -75
  199. data/maps/din-pra-Deva-Latn-33904-2018.yaml +0 -63
  200. data/maps/din-san-Deva-Latn-33904-2018.yaml +0 -338
  201. data/maps/din-tam-Taml-Latn-33903-2016.yaml +0 -213
  202. data/maps/dos-nep-Deva-Latn-1997.yaml +0 -47
  203. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +0 -684
  204. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +0 -680
  205. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +0 -19
  206. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +0 -31
  207. data/maps/ggg-kat-Geor-Latn-2002.yaml +0 -92
  208. data/maps/gki-bel-Cyrl-Latn-1992.yaml +0 -33
  209. data/maps/gki-bel-Cyrl-Latn-2000.yaml +0 -201
  210. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +0 -190
  211. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +0 -157
  212. data/maps/hk-yue-Hani-Latn-1888.yaml +0 -38497
  213. data/maps/icao-bel-Cyrl-Latn-9303.yaml +0 -136
  214. data/maps/icao-bul-Cyrl-Latn-9303.yaml +0 -118
  215. data/maps/icao-fas-Arab-Latn-9303.yaml +0 -103
  216. data/maps/icao-heb-Hebr-Latn-9303.yaml +0 -151
  217. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +0 -117
  218. data/maps/icao-rus-Cyrl-Latn-9303.yaml +0 -117
  219. data/maps/icao-srp-Cyrl-Latn-9303.yaml +0 -117
  220. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +0 -119
  221. data/maps/iso-ara-Arab-Latn-233-1984.yaml +0 -323
  222. data/maps/iso-asm-Beng-Latn-15919-2001.yaml +0 -75
  223. data/maps/iso-ben-Beng-Latn-15919-2001.yaml +0 -175
  224. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +0 -613
  225. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +0 -44
  226. data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +0 -220
  227. data/maps/iso-hin-Deva-Latn-15919-2001.yaml +0 -87
  228. data/maps/iso-inc-Deva-Latn-15919-2001.yaml +0 -61
  229. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +0 -66
  230. data/maps/iso-kan-Kana-Latn-15919-2001.yaml +0 -220
  231. data/maps/iso-kat-Geor-Latn-9984-1996.yaml +0 -145
  232. data/maps/iso-kor-Hang-Latn-1996-method1.yaml +0 -240
  233. data/maps/iso-kor-Hang-Latn-1996-method2.yaml +0 -226
  234. data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +0 -281
  235. data/maps/iso-mar-Deva-Latn-15919-2001.yaml +0 -75
  236. data/maps/iso-nep-Deva-Latn-15919-2001.yaml +0 -87
  237. data/maps/iso-ori-Orya-Latn-15919-2001.yaml +0 -193
  238. data/maps/iso-pan-Guru-Latn-15919-2001.yaml +0 -222
  239. data/maps/iso-pli-Beng-Latn-15919-2001.yaml +0 -73
  240. data/maps/iso-pli-Deva-Latn-15919-2001.yaml +0 -74
  241. data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +0 -219
  242. data/maps/iso-pli-Thai-Latn-15919-2001.yaml +0 -55
  243. data/maps/iso-pra-Deva-Latn-15919-2001.yaml +0 -59
  244. data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +0 -366
  245. data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +0 -271
  246. data/maps/iso-san-Deva-Latn-15919-2001.yaml +0 -220
  247. data/maps/iso-tam-Taml-Latn-15919-2001.yaml +0 -159
  248. data/maps/iso-tel-Telu-Latn-15919-2001.yaml +0 -220
  249. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +0 -109
  250. data/maps/kp-kor-Hang-Latn-2002.yaml +0 -909
  251. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +0 -44820
  252. data/maps/masm-mon-Cyrl-Latn-5217-2012.yaml +0 -163
  253. data/maps/masm-mon-Latn-Cyrl-5217-2012.yaml +0 -200
  254. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +0 -411
  255. data/maps/moct-kor-Hang-Latn-2000.yaml +0 -807
  256. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +0 -541
  257. data/maps/mv-div-Thaa-Latn-1987.yaml +0 -200
  258. data/maps/mvd-bel-Cyrl-Latn-2008.yaml +0 -225
  259. data/maps/mvd-bel-Cyrl-Latn-2010.yaml +0 -63
  260. data/maps/mvd-rus-Cyrl-Latn-2008.yaml +0 -109
  261. data/maps/mvd-rus-Cyrl-Latn-2010.yaml +0 -37
  262. data/maps/odni-ara-Arab-Latn-2004.yaml +0 -137
  263. data/maps/odni-ara-Arab-Latn-2015.yaml +0 -315
  264. data/maps/odni-aze-Cyrl-Latn-2015.yaml +0 -144
  265. data/maps/odni-bel-Cyrl-Latn-2015.yaml +0 -148
  266. data/maps/odni-bul-Cyrl-Latn-2005.yaml +0 -90
  267. data/maps/odni-bul-Cyrl-Latn-2015.yaml +0 -96
  268. data/maps/odni-che-Cyrl-Latn-2015.yaml +0 -169
  269. data/maps/odni-fas-Arab-Latn-2004.yaml +0 -276
  270. data/maps/odni-fas-Arab-Latn-2015.yaml +0 -406
  271. data/maps/odni-hin-Deva-Latn-2004.yaml +0 -182
  272. data/maps/odni-hin-Deva-Latn-2015.yaml +0 -258
  273. data/maps/odni-kat-Geor-Latn-2015.yaml +0 -87
  274. data/maps/odni-kaz-Cyrl-Latn-2015.yaml +0 -148
  275. data/maps/odni-kir-Cyrl-Latn-2015.yaml +0 -136
  276. data/maps/odni-kor-Hang-Latn-2015.yaml +0 -375
  277. data/maps/odni-mkd-Cyrl-Latn-2005.yaml +0 -21
  278. data/maps/odni-mkd-Cyrl-Latn-2015.yaml +0 -122
  279. data/maps/odni-prs-Arab-Latn-2004.yaml +0 -123
  280. data/maps/odni-prs-Arab-Latn-2015.yaml +0 -228
  281. data/maps/odni-rus-Cyrl-Latn-2015.yaml +0 -77
  282. data/maps/odni-srp-Cyrl-Latn-2005.yaml +0 -36
  283. data/maps/odni-srp-Cyrl-Latn-2015.yaml +0 -129
  284. data/maps/odni-tat-Cyrl-Latn-2015.yaml +0 -142
  285. data/maps/odni-tgk-Cyrl-Latn-2015.yaml +0 -148
  286. data/maps/odni-tuk-Cyrl-Latn-2015.yaml +0 -170
  287. data/maps/odni-uig-Cyrl-Latn-2015.yaml +0 -138
  288. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +0 -161
  289. data/maps/odni-urd-Arab-Latn-2015.yaml +0 -221
  290. data/maps/odni-uzb-Cyrl-Latn-2015.yaml +0 -166
  291. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +0 -90
  292. data/maps/royin-tha-Thai-Latn-1968.yaml +0 -183
  293. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +0 -180
  294. data/maps/royin-tha-Thai-Latn-1999.yaml +0 -80
  295. data/maps/sac-zho-Hans-Latn-1979.yaml +0 -24763
  296. data/maps/sasm-mon-Mong-Latn-general-1978.yaml +0 -389
  297. data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +0 -354
  298. data/maps/ses-ara-Arab-Latn-1930.yaml +0 -283
  299. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +0 -222
  300. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +0 -197
  301. data/maps/ua-ukr-Cyrl-Latn-2007.yaml +0 -75
  302. data/maps/ua-ukr-Cyrl-Latn-2010.yaml +0 -192
  303. data/maps/un-amh-Ethi-Latn-2016.yaml +0 -602
  304. data/maps/un-ara-Arab-Latn-1971.yaml +0 -139
  305. data/maps/un-ara-Arab-Latn-1972.yaml +0 -159
  306. data/maps/un-ara-Arab-Latn-2017.yaml +0 -420
  307. data/maps/un-asm-Beng-Latn-1972.yaml +0 -223
  308. data/maps/un-bel-Cyrl-Latn-2007.yaml +0 -114
  309. data/maps/un-ben-Beng-Latn-2016.yaml +0 -534
  310. data/maps/un-ell-Grek-Latn-1987-phonetic.yaml +0 -780
  311. data/maps/un-ell-Grek-Latn-1987-tl.yaml +0 -31
  312. data/maps/un-ell-Grek-Latn-1987-ts.yaml +0 -19
  313. data/maps/un-guj-Gujr-Latn-1972.yaml +0 -229
  314. data/maps/un-hin-Deva-Latn-2016.yaml +0 -316
  315. data/maps/un-kan-Kana-Latn-2016.yaml +0 -254
  316. data/maps/un-mal-Mlym-Latn-1972.yaml +0 -251
  317. data/maps/un-mar-Deva-Latn-2016.yaml +0 -102
  318. data/maps/un-mon-Mong-Latn-general-2013.yaml +0 -264
  319. data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +0 -264
  320. data/maps/un-nep-Deva-Latn-1972.yaml +0 -269
  321. data/maps/un-nep-Deva-Latn-2013.yaml +0 -74
  322. data/maps/un-ori-Orya-Latn-1972.yaml +0 -247
  323. data/maps/un-pan-Guru-Latn-1972.yaml +0 -402
  324. data/maps/un-prs-Arab-Latn-1967.yaml +0 -236
  325. data/maps/un-rus-Cyrl-Latn-1987.yaml +0 -166
  326. data/maps/un-tam-Taml-Latn-1972.yaml +0 -194
  327. data/maps/un-tel-Telu-Latn-1972.yaml +0 -270
  328. data/maps/un-ukr-Cyrl-Latn-1998.yaml +0 -53
  329. data/maps/un-ukr-Cyrl-Latn-2012.yaml +0 -162
  330. data/maps/un-urd-Arab-Latn-1972.yaml +0 -405
  331. data/maps/var-amh-Ethi-Latn-eae-2003.yaml +0 -466
  332. data/maps/var-gez-Ethi-Latn-eae-2003.yaml +0 -76
  333. data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +0 -221
  334. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +0 -406
  335. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +0 -386
  336. data/maps/var-kor-Hang-Hang-jamo.yaml +0 -11193
  337. data/maps/var-kor-Hang-Latn-mr-1939.yaml +0 -1054
  338. data/maps/var-kor-Kore-Hang-2013.yaml +0 -59754
  339. data/maps/var-kor-Kore-Latn-mr-1939.yaml +0 -36
  340. data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +0 -43
  341. data/maps/var-mon-Mong-Latn-1930.yaml +0 -102
  342. data/maps/var-mon-Mong-Latn-lessing.yaml +0 -272
  343. data/maps/var-mon-Mong-Latn-vpmc.yaml +0 -274
  344. data/maps/var-pra-Deva-Latn-iast-1912.yaml +0 -30
  345. data/maps/var-san-Deva-Latn-iast-1912.yaml +0 -149
  346. data/maps/var-tha-Thai-Thai-phonemic.yaml +0 -59
  347. data/maps/var-tha-Thai-Zsym-ipa.yaml +0 -301
  348. data/maps/var-zho-Hani-Latn-wd-1979.yaml +0 -38912
  349. data/spec/interscript/filenames_spec.rb +0 -21
  350. data/spec/interscript/mapping_spec.rb +0 -42
  351. data/spec/interscript_spec.rb +0 -37
  352. data/spec/spec_helper.rb +0 -3
@@ -1,184 +0,0 @@
1
- ---
2
- authority_id: bgnpcgn
3
- id: 2008
4
- language: iso-639-2:che
5
- source_script: Cyrl
6
- destination_script: Latn
7
- name: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/835782/TABLE_OF_CORRESPONDENCES_FOR_CHECHEN.pdf
8
- creation_date: 2008
9
- confirmation_date: 2019-07
10
- description: |
11
- Chechen is an official language within Chechnya, one of the republics of the Russian Federation.
12
- It will normally be encountered in Cyrillic script, in which case it should be romanized by means of
13
- the Cyrillic-Roman table of correspondences given below.
14
-
15
- notes:
16
- - The letter ə is used to represent short a; a is used for long a.
17
- - Ye is used word- and syllable-initially. This Cyrillic letter may be encountered as the ligature ie in Chechen-Roman sources.
18
- - This character occurs only in loan words.
19
- - q in the combination ккх (qq) and q̇ in the combination ккъ (q̇q̇)
20
- - ŋ when preceding vowel is nasalized.
21
- - This Cyrillic letter may be encountered as the ligature ꭣ [U+AB63] or the diphthong oa in Chechen Roman sources.
22
- - Unless in the combinations гӀ, кӀ, пӀ, тӀ, хӀ, цӀ and чӀ.
23
- - |
24
- An inventory of letter-diacritic combinations, with their Unicode encoding, in addition to the
25
- unmodified letters of the basic Roman script is:
26
-
27
- All apostrophes appearing in romanization are U+2019
28
-
29
- Ə (U+018F) ə (U+0259)
30
- Ä (U+00C4) ä (U+00E4)
31
- Ġ (U+0047+0307) ġ (U+0067+0307)
32
- Z̵ (U+005A+0335) z̵ (U+007A+0335)
33
- Q̇ (U+0051+0307) q̇ (U+0071+0307)
34
- Ŋ (U+014A) ŋ (U+014B)
35
- Ö (U+00D6) ö (U+00F6)
36
- Ü (U+00DC) ü (U+00FC)
37
- Ẋ (U+0058+0307) ẋ (U+0078+0307)
38
- Ċ (U+0043+0307) ċ (U+0063+0307)
39
- Ç (U+00C7) ç (U+00E7)
40
- Ç̇ (U+00C7+0307) ç̇ (U+00E7+0307)
41
- Ş (U+015E) ş (U+015F)
42
-
43
- - The Roman-script columns show only lowercase forms but, when applying the table, uppercase and lowercase Roman letters as appropriate should be used.
44
-
45
- tests:
46
- - source: кӏант
47
- expected: khant
48
- - source: зуда
49
- expected: zuda
50
- - source: пхьагал
51
- expected: pẋagal
52
- - source: наж
53
- expected: naz̵
54
- - source: мангал
55
- expected: mangal
56
- - source: Ӏаж
57
- expected: Jaz̵
58
- - source: Нохчийн Википеди
59
- expected: Noxçiyn Vikipedi
60
- - source: сагӏадаккхар
61
- expected: saġadaqqar
62
- - source: йеза
63
- expected: yeza
64
- - source: еара
65
- expected: yeara
66
- - source: елха
67
- expected: yelxa
68
-
69
- map:
70
- rules:
71
- # note[2]
72
- - pattern: (?<!\b\u2019)\b\u0415 # Е in initial position -> Ye
73
- result: Ye
74
- - pattern: (?<!\b\u2019)\b\u0435 # е in initial position -> ye
75
- result: ye
76
- # note[4]
77
- - pattern: \u043A\u043A\u0445
78
- result: qq
79
- - pattern: \u043A\u043A\u042A
80
- result: q̇q̇
81
- - pattern: \u041A\u041A\u0445
82
- result: QQ
83
- - pattern: \u041A\u041A\u042A
84
- result: Q̇Q̇
85
-
86
- characters:
87
- '\u0410' : ['A', 'Ə'] # А note[1]
88
- '\u0410\u044C' : "A\u0308" # Аь -> Ä
89
- '\u0411' : 'B' # Б
90
- '\u0412' : 'V' # В
91
- '\u0413' : 'G' # Г
92
- '\u0413\u04C0' : "G\u0307" # ГӀ -> Ġ
93
- '\u0414' : 'D' # Д
94
- '\u0415' : 'E' # Е note[2]
95
- '\u0401' : 'Yo' # Ё note[3]
96
- '\u0416' : "Z\u0335" # Ж -> Ƶ
97
- '\u0417' : 'Z' # З
98
- '\u0418' : 'I' # И
99
- '\u042B' : 'Y' # Й
100
- '\u041A' : 'K' # К note[4]
101
- '\u041A\u0445' : 'Q' # Кх note[4]
102
- '\u041A\u044A' : "Q\u0307" # Къ -> Q̇ note[4]
103
- '\u041A\u04C0' : 'Kh' # КӀ note[4]
104
- '\u041B' : 'L' # Л
105
- '\u041C' : 'M' # М
106
- '\u041D' : ['N', 'Ŋ'] # Н note[5]
107
- '\u041E' : 'O' # О note[6]
108
- '\u041E\u044C' : "O\u0308" # Оь -> Ö
109
- '\u041F' : 'P' # П
110
- '\u041F\u04C0' : 'Ph' # ПӀ
111
- '\u0420' : 'R' # Р
112
- '\u0421' : 'S' # С
113
- '\u0422' : 'T' # Т
114
- '\u0422\u04C0' : 'Th' # TӀ
115
- '\u0423' : 'U' # У
116
- '\u0423\u044C' : "U\u0308" # Уь -> Ü
117
- '\u0424' : 'F' # Ф
118
- '\u0425' : 'X' # Х
119
- '\u0425\u044C' : "X\u0307" # Хь -> Ẋ
120
- '\u0425\u04C0' : "H" # ХӀ
121
- '\u04B8' : 'C' # Ц
122
- '\u04B8\u04C0' : "C\u0307" # ЦӀ -> Ċ
123
- '\u0427' : "C\u0327" # Ч -> Ç
124
- '\u0427\u04C0' : "\u00C7\u0307" # ЧӀ -> Ç̇
125
- '\u0428' : "S\u0327" # Ш -> Ş
126
- '\u0429' : "S\u0327C\u0327" # Щ -> ŞÇ note[3]
127
- '\u042A' : "’" # Ъ note[3]
128
- '\u042B' : "Y" # Ы
129
- '\u042C' : "" # Ь note[3]
130
- '\u042D' : "E" # Э
131
- '\u042E' : "Yu" # Ю
132
- '\u042E\u044C' : "Yu\u0308" # Юь -> Yü
133
- '\u042F' : "Ya" # Я
134
- '\u042F\u044C' : "Ya\u0308" # Яь -> Yä
135
- '\u04C0' : "J" # Ӏ note[7]
136
-
137
- '\u0430' : ['a', 'ə'] # а note[1]
138
- '\u0430\u044C' : "a\u0308" # аь -> ä
139
- '\u0431' : 'b' # б
140
- '\u0432' : 'v' # в
141
- '\u0433' : 'g' # г
142
- '\u0433\u04CF' : "g\u0307" # гӏ -> ġ
143
- '\u0434' : 'd' # д
144
- '\u0435' : 'e' # е note[2]
145
- '\u0451' : 'yo' # ё note[3]
146
- '\u0436' : "z\u0335" # ж -> ƶ
147
- '\u0437' : 'z' # з
148
- '\u0438' : 'i' # и
149
- '\u0439' : 'y' # й
150
- '\u043A' : 'k' # к note[4]
151
- '\u043A\u0445' : 'q' # кх note[4]
152
- '\u043A\u044A' : "q\u0307" # къ -> q̇ note[4]
153
- '\u043A\u04CF' : 'kh' # кӏ note[4]
154
- '\u043B' : 'l' # л
155
- '\u043C' : 'm' # м
156
- '\u043D' : ['n', 'ŋ'] # н note[5]
157
- '\u043E' : 'o' # о note[6]
158
- '\u043E\u044C' : "o\u0308" # оь -> ö
159
- '\u043F' : 'p' # п
160
- '\u0440' : 'r' # р
161
- '\u0441' : 's' # с
162
- '\u0442' : 't' # т
163
- '\u0442\u04CF' : 'th' # тӏ
164
- '\u0443' : 'u' # у
165
- '\u0443\u044C' : "u\u0308" # Уь -> ü
166
- '\u0444' : 'f' # ф
167
- '\u0445' : 'x' # х
168
- '\u0445\u044C' : "x\u0307" # хь -> ẋ
169
- '\u0445\u04CF' : "h" # хӏ
170
- '\u04B9' : 'c' # ц
171
- '\u04B9\u04CF' : "с\u0307" # цӏ -> ċ
172
- '\u0447' : "c\u0327" # ч -> ç
173
- '\u0447\u04CF' : "c\u00E7\u0307" # чӏ -> ç̇
174
- '\u0448' : "s\u0327" # ш -> ş
175
- '\u0449' : "s\u0327c\u0327" # щ -> şç note[3]
176
- '\u044A' : "’" # ъ note[3]
177
- '\u044B' : "y" # ы
178
- '\u044C' : '' # ь note[3]
179
- '\u044D' : "e" # э
180
- '\u044E' : "yu" # ю
181
- '\u044E' : "yu\u0308" # юь -> yü
182
- '\u044F' : "ya" # я
183
- '\u044F' : "ya\u0308" # яь -> yä
184
- '\u04CF' : "j" # ӏ note[7]
@@ -1,75 +0,0 @@
1
- ---
2
- authority_id: bgnpcgn
3
- id: 1988
4
- language: iso-639-2:div
5
- source_script: Thaa
6
- destination_script: Latn
7
- name: ROMANIZATION OF MALDIVIAN BGN/PCGN 1988 Agreement, with modifications 2009
8
- alias:
9
- ogc11122:
10
- code: div_Thaa2Latn_GMV_1988
11
- description: Maldivian (Divehi) 1988 system
12
- url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/816778/ROMANIZATION_OF_MALDIVIAN.pdf
13
- creation_date: 1988
14
- confirmation_date: 2019
15
- description: |
16
- This romanization system supersedes the one that was approved by BGN and PCGN in 1972. An
17
- official system was submitted to PCGN by the Maldivian government in 1987 and approved by BGN and
18
- PCGN in 1988. The system presented here reflects the 1988 Agreement with minor modifications introduced by the government of the Maldives in 2009
19
-
20
- notes:
21
- - Maldivian is read from right to left.
22
- - The symbol ◌ appearing in the Vowel Characters table represents any Maldivian consonant character.
23
- - The character އ is not romanized. If it bears a vowel character, that vowel character alone is romanized (e.g. އެނބޫދޫ En’boodhoo).
24
- - |
25
- When characters ށ and އ appear in combination with a supercircle (the ‘sukun’, which usually marks
26
- the absence of a vowel, see the Diacritical Mark table): ށ ; އ , these characters are not romanized
27
- but the following consonant is doubled (e.g. ކަޅުހުރާ Kalhehuttaa), unless the following consonant is a digraph in the
28
- romanized form, in which case they are romanized h (e.g. ކެރެށްދޫ Kerehdhoo). ށ and އ appearing at the end of a word are romanized h (e.g. ވޭވައް Veyvah).
29
- - Noonu (ނ) is romanized n’ when appearing without any vowel or auxiliary sign (e.g. ކަނޑުފުށި Kan’dufushi)
30
- - Thaa (ތ) is romanized iy when appearing in combination with a supercircle (ތ) ,( e.g. ޒިޔާރަތްފުށި Ziyaaraiyfushi).
31
- - The Roman-script columns show only lowercase forms but, when applying the table, uppercase and
32
- lowercase Roman letters as appropriate should be used.
33
-
34
-
35
- tests:
36
- - source: "އިރުގައި"
37
- expected: "irugai"
38
- - source: "ޒިޔާރަތްފުށި"
39
- expected: "ziyaaraiyfushi"
40
- - source: "ރައްކާތެރިކުރުމާއި"
41
- expected: "rakkaatherikurumaai"
42
- - source: "ޝަހީދުންގެ ދުވަސް"
43
- expected: "sh’aheedhun’ge dhuvas"
44
- - source: "މަރުޙަބާ"
45
- expected: "maruh’abaa"
46
- - source: "ކިހިނެހް"
47
- expected: "kihin’eh"
48
- - source: "ކޮން ނަމެއް ކިޔަނީ"
49
- expected: "kon’ n’ameh kiyan’ee"
50
- - source: "ބައްއަޖޖެވުރި ހެނދުނެހް"
51
- expected: "baajjevuri hen’dhun’eh"
52
- - source: "މެނދުރެހް"
53
- expected: "men’dhureh"
54
- - source: "ހަވީރެހް"
55
- expected: "haveereh"
56
-
57
- map:
58
- inherit: mv-div-Thaa-Latn-1987
59
- characters:
60
- #Consonants with diacritical marks (used mainly in words of Arabic origin, corresponding
61
- # Arabic characters and their romanizations are shown in parentheses)
62
- "ޘ": "th’"
63
- "ޙ": "h’"
64
- "ޚ": "kh"
65
- "ޛ": "dh’"
66
- "ޜ": "x"
67
- "ޝ": "sh’"
68
- "ޞ": "s’"
69
- "ޟ": "l’"
70
- "ޠ": "t’"
71
- "ޡ": "z’"
72
- "ޢ": "’"
73
- "ޣ": "gh"
74
- "ޤ": "q"
75
- "ޥ": "w"
@@ -1,705 +0,0 @@
1
- ---
2
- authority_id: bgnpcgn
3
- id: 1962
4
- language: iso-639-2:ell
5
- source_script: Grek
6
- destination_script: Latn
7
- name: BGN/PCGN 1962 System
8
- alias:
9
- ogc11122:
10
- code: ell_Grek2Latn_BGN_1962
11
- description: US Board on Geographic Names(BGN)/Permanent Committee on Geographical Names for British Official Use(PCGN) Greek 1962 System (out of date)
12
- url: https://github.com/riboseinc/interscript/files/4225556/BGN_Romanization_Guide_1962_greek.pdf
13
- creation_date: 1962
14
- description: |
15
- BGN/PCGN Romanization table for Greek
16
-
17
- note:
18
- - Original specification is for polytonic Greek; this has been adapted for monotonic Greek
19
- - The treatment of έι in https://transliteration.eki.ee/pdf/Greek.pdf is incorrect; although
20
- not explicitly discussed in the original specification, έι is phonetically equivalent to
21
- έϊ, and is to be transliterated as eï, not í (like εί). The same applies to other diphthongs
22
- accented on the first syllable.
23
-
24
- tests:
25
-
26
- - source: |
27
- Ένα πράμα μόνον με παρακίνησε κι εμένα να γράψω ότι τούτην την πατρίδα την έχομεν όλοι μαζί, και σοφοί κι αμαθείς και πλούσιοι και φτωχοί και πολιτικοί και στρατιωτικοί και οι πλέον μικρότεροι άνθρωποι· όσοι αγωνιστήκαμεν, αναλόγως ο καθείς, έχομεν να ζήσομεν εδώ. Το λοιπόν δουλέψαμεν όλοι μαζί, να την φυλάμεν κι όλοι μαζί και να μην λέγει ούτε ο δυνατός «εγώ» ούτε ο αδύνατος. Ξέρετε πότε να λέγει ο καθείς «εγώ»; Όταν αγωνιστεί μόνος του και φκιάσει ή χαλάσει, να λέγει «εγώ»· όταν όμως αγωνίζονται πολλοί και φκιάνουν, τότε να λένε «εμείς». Είμαστε εις το «εμείς» κι όχι εις το «εγώ». Και εις το εξής να μάθομεν γνώση, αν θέλομεν να φκιάσομεν χωριόν, να ζήσομεν όλοι μαζί.
28
-
29
- Γιάννης Μακρυγιάννης.
30
-
31
- expected: |
32
- Éna práma mónon me parakínise ki eména na grápso óti toútin tin patrídha tin ékhomen óloi mazí, kai sofoí ki amathís kai ploúsioi kai ftokhoí kai politikoí kai stratiotikoí kai oi pléon mikróteroi ánthropoi; ósoi agonistíkamen, analógos o kathís, ékhomen na zísomen edhó. To loipón dhoulépsamen óloi mazí, na tin filámen ki óloi mazí kai na min léyi oúte o dhinatós «egó» oúte o adhínatos. Xérete póte na léyi o kathís «egó»? Ótan agonistí mónos tou kai fkiási í khalási, na léyi «egó»; ótan ómos agonízondai polloí kai fkiánoun, tóte na léne «emís». Ímaste is to «emís» ki ókhi is to «egó». Kai is to exís na máthomen gnósi, an thélomen na fkiásomen khorión, na zísomen óloi mazí.
33
-
34
- Yiánnis Makriyiánnis.
35
-
36
-
37
- - source: ΑΘΗΝΑ
38
- expected: ATHINA
39
- - source: μπαμπάκι
40
- expected: bambáki
41
- - source: νταντά
42
- expected: dandá
43
- - source: γκέγκε
44
- expected: génge
45
- - source: Γκαμπόν
46
- expected: Gambón
47
- - source: Μάγχη
48
- expected: Mánkhi
49
- - source: κογξ
50
- expected: konx
51
- - source: υιός
52
- expected: iós
53
- - source: Υιός
54
- expected: Iós
55
- - source: νεράντζι
56
- expected: nerántzi
57
- - source: Γοίθιος
58
- expected: Goíthios
59
- - source: μπέικον
60
- expected: béïkon
61
- - source: μπέϊκον
62
- expected: béïkon
63
- - source: βόλεϊ
64
- expected: vóleï
65
- - source: αθεΐα
66
- expected: atheḯa
67
- - source: Εϊγιαφιάτλαγιοκουτλ
68
- expected: Eïyiafiátlayiokoutl
69
- - source: Εΐτζι
70
- expected: Eḯtzi
71
- - source: Μυρτώο
72
- expected: Mirtóö
73
- - source: αέρας
74
- expected: aë́ras
75
- - source: γαυ γαυ
76
- expected: gav gav
77
- - source: Ταΰγετος
78
- expected: Taḯyetos
79
- - source: σπρέυ
80
- expected: spréi
81
-
82
- - source: Αθήνα
83
- expected: Athína
84
- - source: Άγιον Όρος
85
- expected: Áyion Óros
86
- - source: Άγραφα
87
- expected: Ágrafa
88
- - source: Αγρίνιο
89
- expected: Agrínio
90
- - source: Αίγινα
91
- expected: Aíyina
92
- - source: Αίγιο
93
- expected: Aíyio
94
- - source: Αλεξανδρούπολη
95
- expected: Alexandroúpoli
96
- - source: Αλεποχώρι
97
- expected: Alepokhóri
98
- - source: Αμοργός
99
- expected: Amorgós
100
- - source: Άμφισσα
101
- expected: Ámfissa
102
- - source: Αράχωβα
103
- expected: Arákhova
104
- - source: Άργος
105
- expected: Árgos
106
- - source: Αρκαδία
107
- expected: Arkadhía
108
- - source: Άρτα
109
- expected: Árta
110
- - source: Βελούχι
111
- expected: Veloúkhi
112
- - source: Βέροια
113
- expected: Véroia
114
- - source: Βοιωτία
115
- expected: Voiotía
116
- - source: Βόλος
117
- expected: Vólos
118
- - source: Βόνιτσα
119
- expected: Vónitsa
120
- - source: Γαλαξίδι
121
- expected: Galaxídhi
122
- - source: Γαλάτσι
123
- expected: Galátsi
124
- - source: Γιαννιτσά
125
- expected: Yiannitsá
126
- - source: Γλυφάδα
127
- expected: Glifádha
128
- - source: Γρανίτσα
129
- expected: Granítsa
130
- - source: Γρεβενά
131
- expected: Grevená
132
- - source: Γύθειο
133
- expected: Yíthio
134
- - source: Διόνυσος
135
- expected: Dhiónisos
136
- - source: Δίστομο
137
- expected: Dhístomo
138
- - source: Δολιανά
139
- expected: Dholianá
140
- - source: Δράμα
141
- expected: Dhráma
142
- - source: Δωδεκάνησα
143
- expected: Dhodhekánisa
144
- - source: Έδεσσα
145
- expected: Édhessa
146
- - source: Ελευσίνα
147
- expected: Elevsína
148
- - source: Επίδαυρος
149
- expected: Epídhavros
150
- - source: Επτάνησα
151
- expected: Eptánisa
152
- - source: Ερμούπολη
153
- expected: Ermoúpoli
154
- - source: Εύβοια
155
- expected: Évvoia
156
- - source: Ζάκυνθος
157
- expected: Zákinthos
158
- - source: Ήπειρος
159
- expected: Ípiros
160
- - source: Ηράκλειο
161
- expected: Iráklio
162
- - source: Θάσος
163
- expected: Thásos
164
- - source: Θεσσαλονίκη
165
- expected: Thessaloníki
166
- - source: Θεσσαλία
167
- expected: Thessalía
168
- - source: Θεσπρωτία
169
- expected: Thesprotía
170
- - source: Θήβα
171
- expected: Thíva
172
- - source: Θράκη
173
- expected: Thráki
174
- - source: Ιθάκη
175
- expected: Itháki
176
- - source: Ίος
177
- expected: Íos
178
- - source: Ιωάννινα
179
- expected: Ioánnina
180
- - source: Καβάλα
181
- expected: Kavála
182
- - source: Καλάβρυτα
183
- expected: Kalávrita
184
- - source: Καλαμάτα
185
- expected: Kalamáta
186
- - source: Καλαμπάκα
187
- expected: Kalambáka
188
- - source: Καλύβια
189
- expected: Kalívia
190
- - source: Κάλυμνος
191
- expected: Kálimnos
192
- - source: Καρδίτσα
193
- expected: Kardhítsa
194
- - source: Καρπενήσι
195
- expected: Karpenísi
196
- - source: Κάρυστος
197
- expected: Káristos
198
- - source: Καστελλόριζο
199
- expected: Kastellórizo
200
- - source: Καστοριά
201
- expected: Kastoriá
202
- - source: Κατερίνη
203
- expected: Kateríni
204
- - source: Κάτω Αχαΐα
205
- expected: Káto Akhaḯa
206
- - source: Κερατέα
207
- expected: Keratéa
208
- - source: Κέρκυρα
209
- expected: Kérkira
210
- - source: Κεφαλλονιά
211
- expected: Kefalloniá
212
- - source: Κηφισιά
213
- expected: Kifisiá
214
- - source: Κιλκίς
215
- expected: Kilkís
216
- - source: Κοζάνη
217
- expected: Kozáni
218
- - source: Κολωνός
219
- expected: Kolonós
220
- - source: Κομοτηνή
221
- expected: Komotiní
222
- - source: Κόρινθος
223
- expected: Kórinthos
224
- - source: Κορώνη
225
- expected: Koróni
226
- - source: Κρανίδι
227
- expected: Kranídhi
228
- - source: Κρέστενα
229
- expected: Kréstena
230
- - source: Κρήτη
231
- expected: Kríti
232
- - source: Κύθηρα
233
- expected: Kíthira
234
- - source: Κυκλάδες
235
- expected: Kikládhes
236
- - source: Κύμη
237
- expected: Kími
238
- - source: Κυψέλη
239
- expected: Kipséli
240
- - source: Κως
241
- expected: Kos
242
- - source: Λαγκαδάς
243
- expected: Langadhás
244
- - source: Λαμία
245
- expected: Lamía
246
- - source: Λάρισα
247
- expected: Lárisa
248
- - source: Λαύριο
249
- expected: Lávrio
250
- - source: Λέρος
251
- expected: Léros
252
- - source: Λέσβος
253
- expected: Lésvos
254
- - source: Λευκάδα
255
- expected: Levkádha
256
- - source: Λήμνος
257
- expected: Límnos
258
- - source: Λιβαδειά
259
- expected: Livadhiá
260
- - source: Μακεδονία
261
- expected: Makedhonía
262
- - source: Μάνη
263
- expected: Máni
264
- - source: Μαραθώνας
265
- expected: Marathónas
266
- - source: Μαρκόπουλο
267
- expected: Markópoulo
268
- - source: Μαρούσι
269
- expected: Maroúsi
270
- - source: Μέγαρα
271
- expected: Mégara
272
- - source: Μεσολόγγι
273
- expected: Mesolóngi
274
- - source: Μεταξουργείο
275
- expected: Metaxouryío
276
- - source: Μέτσοβο
277
- expected: Métsovo
278
- - source: Μήλος
279
- expected: Mílos
280
- - source: Μύκονος
281
- expected: Míkonos
282
- - source: Μυστράς
283
- expected: Mistrás
284
- - source: Μυτιλήνη
285
- expected: Mitilíni
286
- - source: Νάξος
287
- expected: Náxos
288
- - source: Νάουσα
289
- expected: Náousa
290
- - source: Ναύπακτος
291
- expected: Návpaktos
292
- - source: Ναύπλιο
293
- expected: Návplio
294
- - source: Νέα Σμύρνη
295
- expected: Néa Smírni
296
- - source: Νίσυρος
297
- expected: Nísiros
298
- - source: Ξάνθη
299
- expected: Xánthi
300
- - source: Όλυμπος
301
- expected: Ólimbos
302
- - source: Παγκράτι
303
- expected: Pangráti
304
- - source: Παπάγου
305
- expected: Papágou
306
- - source: Πάρος
307
- expected: Páros
308
- - source: Πασαλιμάνι
309
- expected: Pasalimáni
310
- - source: Πατήσια
311
- expected: Patísia
312
- - source: Πάτμος
313
- expected: Pátmos
314
- - source: Πάτρα
315
- expected: Pátra
316
- - source: Πειραιάς
317
- expected: Piraiás
318
- - source: Πελοπόννησος
319
- expected: Pelopónnisos
320
- - source: Περιστέρι
321
- expected: Peristéri
322
- - source: Πεύκη
323
- expected: Pévki
324
- - source: Πήλιο
325
- expected: Pílio
326
- - source: Πολύγυρος
327
- expected: Políyiros
328
- - source: Πόρος
329
- expected: Póros
330
- - source: Πρέβεζα
331
- expected: Préveza
332
- - source: Πτολεμαΐδα
333
- expected: Ptolemaḯdha
334
- - source: Πύλος
335
- expected: Pílos
336
- - source: Πύργος
337
- expected: Pírgos
338
- - source: Ρέθυμνο
339
- expected: Réthimno
340
- - source: Ρόδος
341
- expected: Ródhos
342
- - source: Ρούμελη
343
- expected: Roúmeli
344
- - source: Σαλαμίνα
345
- expected: Salamína
346
- - source: Σαμοθράκη
347
- expected: Samothráki
348
- - source: Σάμος
349
- expected: Sámos
350
- - source: Σαντορίνη
351
- expected: Sandoríni
352
- - source: Σέρρες
353
- expected: Sérres
354
- - source: Σίκινος
355
- expected: Síkinos
356
- - source: Σίφνος
357
- expected: Sífnos
358
- - source: Σκιάθος
359
- expected: Skiáthos
360
- - source: Σκόπελος
361
- expected: Skópelos
362
- - source: Σούλι
363
- expected: Soúli
364
- - source: Σπάρτη
365
- expected: Spárti
366
- - source: Στερεά Ελλάδα
367
- expected: Stereá Elládha
368
- - source: Στύρα
369
- expected: Stíra
370
- - source: Σύμη
371
- expected: Sími
372
- - source: Σύρος
373
- expected: Síros
374
- - source: Σφακιά
375
- expected: Sfakiá
376
- - source: Τήλος
377
- expected: Tílos
378
- - source: Τήνος
379
- expected: Tínos
380
- - source: Τρίκαλα
381
- expected: Tríkala
382
- - source: Τρίπολη
383
- expected: Trípoli
384
- - source: Τσακωνιά
385
- expected: Tsakoniá
386
- - source: Ύδρα
387
- expected: Ídhra
388
- - source: Φάληρο
389
- expected: Fáliro
390
- - source: Φλώρινα
391
- expected: Flórina
392
- - source: Φολέγανδρος
393
- expected: Folégandros
394
- - source: Χάλκη
395
- expected: Khálki
396
- - source: Χαλκίδα
397
- expected: Khalkídha
398
- - source: Χαλάνδρι
399
- expected: Khalándri
400
- - source: Χαλκιδική
401
- expected: Khalkidhikí
402
- - source: Χανιά
403
- expected: Khaniá
404
- - source: Χίος
405
- expected: Khíos
406
- - source: Ψαρά
407
- expected: Psará
408
- - source: Αβάνα
409
- expected: Avána
410
- - source: Αγγλία
411
- expected: Anglía
412
- - source: Αϊβαλί
413
- expected: Aïvalí
414
- - source: Αλεξάνδρεια
415
- expected: Alexándria
416
- - source: Άμστερνταμ
417
- expected: Ámsterndam
418
- - source: Βαυαρία
419
- expected: Vavaría
420
- - source: Βενετία
421
- expected: Venetía
422
- - source: Βερολίνο
423
- expected: Verolíno
424
- - source: Βερόνα
425
- expected: Veróna
426
- - source: Βιέννη
427
- expected: Viénni
428
- - source: Γένοβα
429
- expected: Yénova
430
- - source: Δουβλίνο
431
- expected: Dhouvlíno
432
- - source: Καλαβρία
433
- expected: Kalavría
434
- - source: Καλιφόρνια
435
- expected: Kalifórnia
436
- - source: Καύκασος
437
- expected: Kávkasos
438
- - source: Κονγκό
439
- expected: Konngó
440
- - source: Κορσική
441
- expected: Korsikí
442
- - source: Κουρδιστάν
443
- expected: Kourdhistán
444
- - source: Κωνσταντινούπολη
445
- expected: Konstandinoúpoli
446
- - source: Κατεχόμενη Κύπρος
447
- expected: Katekhómeni Kípros
448
- - source: Λαπωνία
449
- expected: Laponía
450
- - source: Λευκωσία
451
- expected: Levkosía
452
- - source: Λιβόρνο
453
- expected: Livórno
454
- - source: Λονδίνο
455
- expected: Londhíno
456
- - source: Λυών
457
- expected: Lión
458
- - source: Μάλαγα
459
- expected: Málaga
460
- - source: Μασσαλία
461
- expected: Massalía
462
- - source: Μικρονησία
463
- expected: Mikronisía
464
- - source: Μιλάνο
465
- expected: Miláno
466
- - source: Μόσχα
467
- expected: Móskha
468
- - source: Μπολόνια
469
- expected: Bolónia
470
- - source: Νάπολη
471
- expected: Nápoli
472
- - source: Νταγκεστάν
473
- expected: Dangestán
474
- - source: Νέα Υόρκη
475
- expected: Néa Iórki
476
- - source: Οξφόρδη
477
- expected: Oxfórdhi
478
- - source: Ουαλία
479
- expected: Oualía
480
- - source: Παρίσι
481
- expected: Parísi
482
- - source: Πάφος
483
- expected: Páfos
484
- - source: Πολυνησία
485
- expected: Polinisía
486
- - source: Ρώμη
487
- expected: Rómi
488
- - source: Σαμάρεια
489
- expected: Samária
490
- - source: Σικελία
491
- expected: Sikelía
492
- - source: Σκανδιναβία
493
- expected: Skandhinavía
494
- - source: Σκόπια
495
- expected: Skópia
496
- - source: Σκωτία
497
- expected: Skotía
498
- - source: Σμύρνη
499
- expected: Smírni
500
- - source: Ταϊτή
501
- expected: Taïtí
502
- - source: Ταταρστάν
503
- expected: Tatarstán
504
- - source: Τζαμάικα
505
- expected: Tzamáika
506
- - source: Τηλλυρία
507
- expected: Tilliría
508
- - source: Τιρόλο
509
- expected: Tirólo
510
- - source: Τορίνο
511
- expected: Toríno
512
- - source: Φανάρι
513
- expected: Fanári
514
- - source: Φλωρεντία
515
- expected: Florendía
516
- - source: Χαβάη
517
- expected: Khaváï
518
- - source: Χονγκ Κονγκ
519
- expected: Khonng Konng
520
-
521
- map:
522
- # https://en.wikipedia.org/wiki/Romanization_of_Greek
523
- rules:
524
- - pattern: (?<=[ΑαΕεΗη])\u03A5 # Υ (after Α, Ε, Η)
525
- result: V
526
- - pattern: (?<=[ΑαΕεΗη])\u03C5 # υ (after Α, Ε, Η)
527
- result: v
528
- - pattern: (?<=[Οο])\u03A5 # Υ (after Ο)
529
- result: U
530
- - pattern: (?<=[Οο])\u03C5 # υ (after Ο)
531
- result: u
532
- - pattern: (?<=[Οο])\u03CD # ύ (after Ο)
533
- result: ú
534
- - pattern: \u03A5[Ιιί] # ΥΙ
535
- result: I
536
- - pattern: \u03C5[Ιιί] # υι
537
- result: i
538
- - pattern: \u03A5[ί] # Υί
539
- result: Í
540
- - pattern: \u03C5[ί] # υί
541
- result: í
542
- - pattern: \u0393(?=[ξΞχΧ]) # Γ (before Ξ, Χ)
543
- result: N
544
- - pattern: \u03B3(?=[ξΞχΧ]) # γ (before Ξ, Χ)
545
- result: n
546
- - pattern: \u0393[Γγ] # ΓΓ, Γγ
547
- result: Ng
548
- - pattern: \u03B3\u03B3 # γγ
549
- result: ng
550
- - pattern: (?<=\b)\u0393[Κκ] # Γ (before Κ initially)
551
- result: G
552
- - pattern: (?<=\b)\u03B3[Κκ] # γ (before Κ initially)
553
- result: g
554
- - pattern: (?<!\b)\u0393[Κκ] # Γ (before Κ medially)
555
- result: Ng
556
- - pattern: (?<!\b)\u03B3[Κκ] # γ (before Κ medially)
557
- result: ng
558
- - pattern: \u0393(?=[ΕεέΗηήΙιίΥυύ]) # Γ (before front vowels)
559
- result: Y
560
- - pattern: \u03B3(?=[ΕεέΗηήΙιίΥυύ]) # γ (before front vowels)
561
- result: y
562
- - pattern: \u0393(?=[Oo][Ιιί]) # Γ (before front vowels)
563
- result: Y
564
- - pattern: \u03B3(?=[Oo][Ιιί]) # γ (before front vowels)
565
- result: y
566
- - pattern: (?<=\b)\u039D[τΤ] # ΝΤ (initially)
567
- result: D
568
- - pattern: (?<=\b)\u03BD[τΤ] # ντ (initially)
569
- result: d
570
- - pattern: \u039D[τΤ][ζΖ] # ΝΤΖ
571
- result: NTZ
572
- - pattern: \u03BD[τΤ][ζΖ] # ντζ
573
- result: ntz
574
- - pattern: (?<!\b)\u039D[τΤ] # ΝΤ (medially)
575
- result: Nd
576
- - pattern: (?<!\b)\u03BD[τΤ] # ντ (medially)
577
- result: nd
578
- - pattern: (?<=\b)\u039C[πΠ] # ΜΠ (initially)
579
- result: B
580
- - pattern: (?<=\b)\u03BC[πΠ] # μπ (initially)
581
- result: b
582
- - pattern: \u039C[πΠ] # ΜΠ (medially)
583
- result: Mb
584
- - pattern: \u03BC[πΠ] # μπ (medially)
585
- result: mb
586
- - pattern: (?<=[νΝ])\u0394(?=[ρΡ]) # νδρ
587
- result: d
588
- - pattern: (?<=[νΝ])\u03B4(?=[ρΡ]) # νδρ
589
- result: d
590
- - pattern: (?<=[ΑΆαά])\u0395 # ΑΕ
591
- result: Ë
592
- - pattern: (?<=[ΑΆαά])\u03B5 # αε
593
- result: ë
594
- - pattern: (?<=[ΑΆαά])\u03AD # αέ
595
- result: ë́
596
- - pattern: (?<=[ΩΏωώ])\u039F # ΩΟ
597
- result: Ö
598
- - pattern: (?<=[ΩΏωώ])\u03BF # ωο
599
- result: ö
600
- - pattern: (?<=[ΩΏωώ])\u03CC # ωό
601
- result: ö́
602
- - pattern: (?<=[ΑΆαάΟΌοό])\u0397 # ΑΗ, ΟΗ
603
- result: Ï
604
- - pattern: (?<=[ΑΆαάΟΌοό])\u03B7 # αη, οη
605
- result: ï
606
- - pattern: (?<=[ΑΆαάΟΌοό])\u03AE # αή, οή
607
- result: ḯ
608
- - pattern: \u037E # ;
609
- result: "?"
610
- - pattern: \u003B # ;
611
- result: "?"
612
-
613
- characters:
614
- "\u0027": ""
615
- "\u0386": "Á" # Ά
616
- "\u0391": "A" # Α
617
- "\u0392": "V" # Β
618
- "\u0393": "G" # Γ
619
- "\u0394": "Dh" # Δ
620
- "\u0395": "E" # Ε
621
- "\u0395\u0399": "I" # ΕΙ
622
- "\u0395\u03B9": "I" # Ει
623
- "\u0395\u03AF": "Í" # Εί
624
- "\u0395\u03AA": "Εï" # ΕΪ
625
- "\u0395\u03CA": "Εï" # Εϊ
626
- "\u0388\u03CA": "Éï" # Έϊ
627
- "\u0388\u03B9": "Éï" # Έι
628
- "\u0391\u03CD": "Áv" # Αύ
629
- "\u0395\u03CD": "Év" # Εύ
630
- "\u0397\u03CD": "Ív" # Ηύ
631
- "\u0396": "Z" # Ζ
632
- "\u0397": "I" # Η
633
- "\u0398": "Th" # Θ
634
- "\u0399": "I" # Ι
635
- "\u039A": "K" # Κ
636
- "\u039B": "L" # Λ
637
- "\u039C": "M" # Μ
638
- "\u039D": "N" # Ν
639
- "\u039E": "X" # Ξ
640
- "\u039F": "O" # Ο
641
- "\u03A0": "P" # Π
642
- "\u03A1": "R" # Ρ
643
- "\u03A3": "S" # Σ
644
- "\u03A4": "T" # Τ
645
- "\u03A5": "I" # Υ
646
- "\u03A6": "F" # Φ
647
- "\u03A7": "Kh" # Χ
648
- "\u03A8": "Ps" # Ψ
649
- "\u03A9": "O" # Ω
650
- "\u0388": "É" # Έ
651
- "\u0389": "Í" # Ή
652
- "\u038A": "Í" # Ί
653
- "\u038C": "Ó" # Ό
654
- "\u038E": "Í" # Ύ
655
- "\u038F": "Ó" # Ώ
656
- "\u03AA": "Ï" # Ϊ
657
- "\u03AB": "Ï" # Ϋ
658
-
659
- "\u03AC": "á" # ά
660
- "\u03B1": "a" # α
661
- "\u03B2": "v" # β
662
- "\u03B3": "g" # γ
663
- "\u03B4": "dh" # δ
664
- "\u03B5": "e" # ε
665
- "\u03B5\u03B9": "i" # ει
666
- "\u03B5\u03AF": "í" # εί
667
- "\u03B5\u03CA": "eï" # εϊ
668
- "\u03AD\u03CA": "éï" # έϊ
669
- "\u03AD\u03B9": "éï" # έι
670
- "\u03B1\u03CD": "áv" # αύ
671
- "\u03B5\u03CD": "év" # εύ
672
- "\u03B7\u03CD": "ív" # ηύ
673
- "\u03B6": "z" # ζ
674
- "\u03B7": "i" # η
675
- "\u03B8": "th" # θ
676
- "\u03B9": "i" # ι
677
- "\u03BA": "k" # κ
678
- "\u03BB": "l" # λ
679
- "\u03BC": "m" # μ
680
- "\u03BD": "n" # ν
681
- "\u03BE": "x" # ξ
682
- "\u03BF": "o" # ο
683
- "\u03C0": "p" # π
684
- "\u03C1": "r" # ρ
685
- "\u03C3": "s" # σ
686
- "\u03C2": "s" # ς
687
- "\u03C4": "t" # τ
688
- "\u03C5": "i" # υ
689
- "\u03C6": "f" # φ
690
- "\u03C7": "kh" # χ
691
- "\u03C8": "ps" # ψ
692
- "\u03C9": "o" # ω
693
- "\u03AD": "é" # έ
694
- "\u03AE": "í" # ή
695
- "\u03AF": "í" # ί
696
- "\u03CC": "ó" # ό
697
- "\u03CD": "í" # ύ
698
- "\u03CE": "ó" # ώ
699
- "\u03CA": "ï" # ϊ
700
- "\u03CB": "ï" # ϋ
701
- "\u0390": "ḯ" # ΐ
702
- "\u03B0": "ḯ" # ΰ
703
-
704
- "\u0387": ";" # ·
705
- "\u00B7": ";" # ·