interscript 0.1.6 → 2.1.0a9

Sign up to get free protection for your applications and to get access to all the features.
Files changed (226) hide show
  1. checksums.yaml +4 -4
  2. data/.gitignore +11 -0
  3. data/.rspec +3 -0
  4. data/Gemfile +29 -0
  5. data/LICENSE.adoc +31 -0
  6. data/README.md +3 -0
  7. data/Rakefile +53 -0
  8. data/bin/console +14 -0
  9. data/bin/interscript +3 -39
  10. data/bin/maps_analyze_staging +168 -0
  11. data/bin/maps_debug_compilers +58 -0
  12. data/bin/maps_debug_ordering +88 -0
  13. data/bin/maps_debug_ruby_compile +24 -0
  14. data/bin/maps_debug_step_by_step +44 -0
  15. data/bin/maps_optimize_order +112 -0
  16. data/bin/maps_v1_analyze_regexps +45 -0
  17. data/bin/maps_v1_to_v2 +426 -0
  18. data/exe/interscript +6 -0
  19. data/interscript.gemspec +31 -0
  20. data/lib/interscript.rb +81 -127
  21. data/lib/interscript/command.rb +5 -5
  22. data/lib/interscript/compiler.rb +22 -0
  23. data/lib/interscript/compiler/javascript.rb +292 -0
  24. data/lib/interscript/compiler/ruby.rb +262 -0
  25. data/lib/interscript/dsl.rb +67 -0
  26. data/lib/interscript/dsl/aliases.rb +23 -0
  27. data/lib/interscript/dsl/document.rb +46 -0
  28. data/lib/interscript/dsl/group.rb +45 -0
  29. data/lib/interscript/dsl/group/parallel.rb +6 -0
  30. data/lib/interscript/dsl/items.rb +89 -0
  31. data/lib/interscript/dsl/metadata.rb +26 -0
  32. data/lib/interscript/dsl/stage.rb +6 -0
  33. data/lib/interscript/dsl/symbol_mm.rb +11 -0
  34. data/lib/interscript/dsl/tests.rb +12 -0
  35. data/lib/interscript/interpreter.rb +251 -0
  36. data/lib/interscript/node.rb +25 -0
  37. data/lib/interscript/node/alias_def.rb +15 -0
  38. data/lib/interscript/node/dependency.rb +13 -0
  39. data/lib/interscript/node/document.rb +45 -0
  40. data/lib/interscript/node/group.rb +34 -0
  41. data/lib/interscript/node/group/parallel.rb +9 -0
  42. data/lib/interscript/node/group/sequential.rb +2 -0
  43. data/lib/interscript/node/item.rb +52 -0
  44. data/lib/interscript/node/item/alias.rb +42 -0
  45. data/lib/interscript/node/item/any.rb +61 -0
  46. data/lib/interscript/node/item/capture.rb +50 -0
  47. data/lib/interscript/node/item/group.rb +51 -0
  48. data/lib/interscript/node/item/repeat.rb +40 -0
  49. data/lib/interscript/node/item/stage.rb +23 -0
  50. data/lib/interscript/node/item/string.rb +51 -0
  51. data/lib/interscript/node/metadata.rb +18 -0
  52. data/lib/interscript/node/rule.rb +6 -0
  53. data/lib/interscript/node/rule/funcall.rb +18 -0
  54. data/lib/interscript/node/rule/run.rb +15 -0
  55. data/lib/interscript/node/rule/sub.rb +65 -0
  56. data/lib/interscript/node/stage.rb +19 -0
  57. data/lib/interscript/node/tests.rb +15 -0
  58. data/lib/interscript/stdlib.rb +211 -0
  59. data/lib/interscript/utils/regexp_converter.rb +283 -0
  60. data/lib/interscript/version.rb +1 -1
  61. data/requirements.txt +1 -0
  62. metadata +75 -339
  63. data/README.adoc +0 -298
  64. data/bin/rspec +0 -29
  65. data/lib/__pycache__/g2pwrapper.cpython-38.pyc +0 -0
  66. data/lib/g2pwrapper.py +0 -34
  67. data/lib/interscript-opal.rb +0 -2
  68. data/lib/interscript/fs.rb +0 -71
  69. data/lib/interscript/mapping.rb +0 -142
  70. data/lib/interscript/opal.rb +0 -27
  71. data/lib/interscript/opal/maps.js.erb +0 -10
  72. data/lib/interscript/opal_map_translate.rb +0 -12
  73. data/lib/model-7 +0 -0
  74. data/lib/tha-pt-b-7 +0 -0
  75. data/maps/acadsin-zho-Hani-Latn-2002.yaml +0 -38912
  76. data/maps/alalc-amh-Ethi-Latn-1997.yaml +0 -509
  77. data/maps/alalc-amh-Ethi-Latn-2011.yaml +0 -138
  78. data/maps/alalc-ara-Arab-Latn-1997.yaml +0 -1283
  79. data/maps/alalc-asm-Deva-Latn-1997.yaml +0 -159
  80. data/maps/alalc-aze-Cyrl-Latn-1997.yaml +0 -141
  81. data/maps/alalc-bel-Cyrl-Latn-1997.yaml +0 -125
  82. data/maps/alalc-ben-Beng-Latn-2017.yaml +0 -130
  83. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +0 -94
  84. data/maps/alalc-ell-Grek-Latn-1997.yaml +0 -624
  85. data/maps/alalc-ell-Grek-Latn-2010.yaml +0 -627
  86. data/maps/alalc-hin-Deva-Latn-2020.yaml +0 -159
  87. data/maps/alalc-kat-Geok-Latn-1997.yaml +0 -111
  88. data/maps/alalc-kat-Geor-Latn-1997.yaml +0 -146
  89. data/maps/alalc-kor-Hang-Latn-1997.yaml +0 -94
  90. data/maps/alalc-mar-Deva-Latn-1997.yaml +0 -170
  91. data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +0 -114
  92. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +0 -103
  93. data/maps/alalc-pan-Deva-Latn-1997.yaml +0 -237
  94. data/maps/alalc-rus-Cyrl-Latn-1997.yaml +0 -221
  95. data/maps/alalc-rus-Cyrl-Latn-2012.yaml +0 -162
  96. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +0 -114
  97. data/maps/alalc-srp-Cyrl-Latn-2013.yaml +0 -135
  98. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +0 -141
  99. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +0 -16
  100. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +0 -283
  101. data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +0 -174
  102. data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +0 -169
  103. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +0 -292
  104. data/maps/bgn-kor-Hang-Latn-1943.yaml +0 -31
  105. data/maps/bgn-kor-Kore-Latn-1943.yaml +0 -31
  106. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +0 -208
  107. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +0 -208
  108. data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +0 -528
  109. data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +0 -592
  110. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +0 -108
  111. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +0 -104
  112. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +0 -184
  113. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +0 -285
  114. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +0 -115
  115. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +0 -38
  116. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +0 -701
  117. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +0 -19
  118. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +0 -257
  119. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +0 -127
  120. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +0 -42
  121. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +0 -253
  122. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +0 -48
  123. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +0 -48
  124. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +0 -159
  125. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +0 -190
  126. data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +0 -200
  127. data/maps/bgnpcgn-per-Arab-Latn-1956.yaml +0 -92
  128. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +0 -314
  129. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +0 -166
  130. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +0 -162
  131. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +0 -208
  132. data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +0 -7456
  133. data/maps/bis-asm-Beng-Latn-13194-1991.yaml +0 -159
  134. data/maps/bis-ben-Beng-Latn-13194-1991.yaml +0 -156
  135. data/maps/bis-dev-Deva-Latn-13194-1991.yaml +0 -184
  136. data/maps/bis-gjr-Gujr-Latn-13194-1991.yaml +0 -166
  137. data/maps/bis-knd-Knda-Latn-13194-1991.yaml +0 -173
  138. data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +0 -176
  139. data/maps/bis-ori-Orya-Latn-13194-1991.yaml +0 -160
  140. data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +0 -175
  141. data/maps/bis-tel-Telu-Latn-13194-1991.yaml +0 -170
  142. data/maps/bis-tml-Taml-Latn-13194-1991.yaml +0 -155
  143. data/maps/by-bel-Cyrl-Latn-1998.yaml +0 -168
  144. data/maps/by-bel-Cyrl-Latn-2007.yaml +0 -115
  145. data/maps/dos-nep-Deva-Latn-1997.yaml +0 -33
  146. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +0 -684
  147. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +0 -680
  148. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +0 -19
  149. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +0 -31
  150. data/maps/ggg-kat-Geor-Latn-2002.yaml +0 -88
  151. data/maps/gki-bel-Cyrl-Latn-1992.yaml +0 -33
  152. data/maps/gki-bel-Cyrl-Latn-2000.yaml +0 -201
  153. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +0 -186
  154. data/maps/hk-yue-Hani-Latn-1888.yaml +0 -38497
  155. data/maps/icao-bel-Cyrl-Latn-9303.yaml +0 -136
  156. data/maps/icao-bul-Cyrl-Latn-9303.yaml +0 -118
  157. data/maps/icao-heb-Hebr-Latn-9303.yaml +0 -151
  158. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +0 -117
  159. data/maps/icao-per-Arab-Latn-9303.yaml +0 -103
  160. data/maps/icao-rus-Cyrl-Latn-9303.yaml +0 -117
  161. data/maps/icao-srp-Cyrl-Latn-9303.yaml +0 -117
  162. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +0 -119
  163. data/maps/iso-ara-Arab-Latn-233-1984.yaml +0 -323
  164. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +0 -609
  165. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +0 -40
  166. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +0 -62
  167. data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +0 -271
  168. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +0 -109
  169. data/maps/kp-kor-Hang-Latn-2002.yaml +0 -901
  170. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +0 -44820
  171. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +0 -411
  172. data/maps/moct-kor-Hang-Latn-2000.yaml +0 -803
  173. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +0 -541
  174. data/maps/mvd-bel-Cyrl-Latn-2008.yaml +0 -225
  175. data/maps/mvd-bel-Cyrl-Latn-2010.yaml +0 -63
  176. data/maps/mvd-rus-Cyrl-Latn-2008.yaml +0 -109
  177. data/maps/mvd-rus-Cyrl-Latn-2010.yaml +0 -37
  178. data/maps/nil-kor-Hang-Hang-jamo.yaml +0 -11193
  179. data/maps/odni-aze-Cyrl-Latn-2015.yaml +0 -144
  180. data/maps/odni-bel-Cyrl-Latn-2015.yaml +0 -148
  181. data/maps/odni-bul-Cyrl-Latn-2015.yaml +0 -96
  182. data/maps/odni-hin-Deva-Latn-2015.yaml +0 -258
  183. data/maps/odni-kat-Geor-Latn-2015.yaml +0 -87
  184. data/maps/odni-kaz-Cyrl-Latn-2015.yaml +0 -148
  185. data/maps/odni-kir-Cyrl-Latn-2015.yaml +0 -136
  186. data/maps/odni-mkd-Cyrl-Latn-2015.yaml +0 -122
  187. data/maps/odni-rus-Cyrl-Latn-2015.yaml +0 -77
  188. data/maps/odni-srp-Cyrl-Latn-2015.yaml +0 -129
  189. data/maps/odni-tat-Cyrl-Latn-2015.yaml +0 -142
  190. data/maps/odni-tgk-Cyrl-Latn-2015.yaml +0 -148
  191. data/maps/odni-uig-Cyrl-Latn-2015.yaml +0 -138
  192. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +0 -157
  193. data/maps/odni-urd-Arab-Latn-2015.yaml +0 -221
  194. data/maps/odni-uzb-Cyrl-Latn-2015.yaml +0 -166
  195. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +0 -90
  196. data/maps/royin-tha-Thai-Latn-1968.yaml +0 -179
  197. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +0 -180
  198. data/maps/royin-tha-Thai-Latn-1999.yaml +0 -76
  199. data/maps/sac-zho-Hans-Latn-1979.yaml +0 -24759
  200. data/maps/ses-ara-Arab-Latn-1930.yaml +0 -279
  201. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +0 -222
  202. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +0 -193
  203. data/maps/un-ara-Arab-Latn-1971.yaml +0 -139
  204. data/maps/un-ara-Arab-Latn-1972.yaml +0 -159
  205. data/maps/un-ara-Arab-Latn-2017.yaml +0 -420
  206. data/maps/un-bel-Cyrl-Latn-2007.yaml +0 -114
  207. data/maps/un-ben-Beng-Latn-2016.yaml +0 -534
  208. data/maps/un-ell-Grek-Latn-1987-tl.yaml +0 -31
  209. data/maps/un-ell-Grek-Latn-1987-ts.yaml +0 -19
  210. data/maps/un-ell-Grek-Latn-phonetic-1987.yaml +0 -780
  211. data/maps/un-mon-Mong-Latn-2013.yaml +0 -99
  212. data/maps/un-nep-Deva-Latn-1972.yaml +0 -163
  213. data/maps/un-rus-Cyrl-Latn-1987.yaml +0 -166
  214. data/maps/un-ukr-Cyrl-Latn-1998.yaml +0 -30
  215. data/maps/ungegn-amh-Ethi-Latn-2016.yaml +0 -575
  216. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +0 -406
  217. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +0 -386
  218. data/maps/var-kor-Hang-Latn-mr-1939.yaml +0 -1054
  219. data/maps/var-kor-Kore-Hang-2013.yaml +0 -59754
  220. data/maps/var-kor-Kore-Latn-mr-1939.yaml +0 -36
  221. data/maps/var-tha-Thai-Thai-phonemic.yaml +0 -59
  222. data/maps/var-tha-Thai-Zsym-ipa.yaml +0 -301
  223. data/maps/var-zho-Hani-Latn-1979.yaml +0 -38908
  224. data/spec/interscript/mapping_spec.rb +0 -42
  225. data/spec/interscript_spec.rb +0 -26
  226. data/spec/spec_helper.rb +0 -3
@@ -1,323 +0,0 @@
1
- ---
2
- authority_id: iso
3
- id: 233-1984
4
- language: ara
5
- source_script: Arab
6
- destination_script: Latn
7
- name: ISO 233:1984 Documentation — Transliteration of Arabic characters into Latin characters
8
- url:
9
- - https://www.iso.org/standard/4117.html
10
- - http://transliteration.eki.ee/pdf/Arabic_2.2.pdf
11
- - http://www.eki.ee/wgrs/rom1_ar.pdf
12
- creation_date: 1984
13
- confirmation date: 2018-06
14
- description: |
15
- Is one of a series of International Standards dealing with
16
- the conversion of systems of writing, following the
17
- principles of stringent conversion in order to permit
18
- international information exchange. Its aim is to provide a
19
- means for international communication of written messages
20
- in a form which permits the automatic transmission and
21
- reconstitution of these by men or machines. Cancels and
22
- replaces ISO Recommendation R 233-1961
23
- notes:
24
- - |
25
- The transliteration ISO 233:1984, with respect to ara-arab-latn-2017, gives every character and diacritical mark a unique
26
- equivalent and e.g. long vowels in Arabic ā, ī and ū are consequently written a’, iy and uw
27
- respectively in the ISO transliteration. Other main correspondences:
28
- ث is ṯ instead of th
29
- ج is ǧ instead of j
30
- ح is ḥ instead of ẖ
31
- خ is ẖ instead of kh
32
- ذ is ḏ instead of dh
33
- ش is š instead of sh
34
- ص is ṣ instead of s̱
35
- ض is ḍ instead of ḏ
36
- ط is ṭ instead of ṯ
37
- ظ is ẓ instead of d͟h
38
- غ is ġ instead of gh
39
- ة is ẗ instead of h/t
40
- ى is ỳ
41
- ـِي is iy instead of ī
42
- ـُو is uw instead of ū
43
- ـَا is a’ instead of ā
44
- ـَى is aỳ instead of á
45
-
46
- tests:
47
-
48
- - source: مِصر
49
- expected: Miṣr
50
-
51
- - source: قَطَر
52
- expected: Qaṭar
53
-
54
- - source: الجُمهُورِيَّة العِرَاقِيَّة
55
- expected: Al Ǧumhuwriyaẗ al ‘Ira’qiyaẗ
56
-
57
- - source: جُمهُورِيَّة مِصر العَرَبِيَّة
58
- expected: Ǧumhuwriyaẗ Miṣr al ‘Arabiyaẗ
59
-
60
- - source: الرِيَاض
61
- expected: Ar Riya’ḍ
62
-
63
- - source: الشارِقة
64
- expected: Aš Šâriqaẗ
65
-
66
- map:
67
- postrules:
68
- - pattern: (?<=\b)(?<!\b[‘|’|'])[\u0061-\uFFFF]
69
- result: "upcase"
70
- # don't capitalize the definite article in the middle of a sentence
71
- - pattern : ' At T' # الت
72
- result: ' at T'
73
- - pattern : ' Aṯ Ṯ' # الث
74
- result: ' aṯ Ṯ'
75
- - pattern : ' Ad D' # الد
76
- result: ' ad D'
77
- - pattern : ' Aḏ Ḏ' # الذ
78
- result: ' aḏ Ḏ'
79
- - pattern : ' Ar R' # الر
80
- result: ' ar R'
81
- - pattern : ' Az Z' # الز
82
- result: ' az Z'
83
- - pattern : ' As S' # الس
84
- result: ' as S'
85
- - pattern : ' Aš Š' # الش
86
- result: ' aš Š'
87
- - pattern : ' Aṣ Ṣ' # الص
88
- result: ' aṣ Ṣ'
89
- - pattern : ' Aḍ Ḍ' # الض
90
- result: ' aḍ Ḍ'
91
- - pattern : ' Aṭ Ṭ' # الط
92
- result: ' aṭ Ṭ'
93
- - pattern : ' Aẓ Ẓ' # الظ
94
- result: ' aẓ Ẓ'
95
- - pattern : ' Al L' # الل
96
- result: ' al L'
97
- - pattern : ' an n' # الن
98
- result: ' an N'
99
- - pattern: " Al " # ال
100
- result: " al "
101
-
102
- characters:
103
-
104
- # pointing
105
- '\u064e' : 'a' # َ fatha
106
- '\u064e(?=\u0629)' : '' # َ fatha followed by ta' marboota
107
- '\u0650' : 'i' # ِ kasra
108
- '\u064f' : 'u' # ُ damma
109
- '\u0652' : '' # ْ sokoon, see note A below
110
-
111
- # special pointed letters
112
- # special pointed letters
113
- '\u0639\u064e' : '‘a' # عَ
114
- '\u0639\u0650' : '‘i' # عِ
115
- '\u0639\u064f' : '‘ū' # عُ
116
- # handle MacOS regex difference
117
- '\u0639\u064f\u0648' : '‘ū' # عُو damma followed by و
118
-
119
- '\u0650\u064a' : 'iy' # ـِي kasra followed by ي
120
- '\u0650\u064a\u0651\u064e' : 'iy' # ـِيَّ
121
- '\u0650\u064a(?=\u064e|u064f)' : 'iy' # ـِي kasra followed by ي
122
- '\u064e\u0627' : 'a’' # ـَا fatha followed by ا
123
- '\u064e\u0649' : 'aỳ' # ـَى fatha followed by ى which is ا not ي
124
- '\u064f\u0648' : 'uw' # ـُو damma followed by و
125
- '\u064e\u0648\u0652' : 'aw' # ـَوْ
126
- '\u064e\u064a\u0652' : 'ay' # ـَيْ
127
-
128
- # Sun letters
129
-
130
- '\b\u0627\u0644\u062a' : 'at t' # الت
131
- '\b\u0627\u0644\u062b' : 'aṯ ṯ' # الث
132
- '\b\u0627\u0644\u062f' : 'ad d' # الد
133
- '\b\u0627\u0644\u0630' : 'aḏ ḏ' # الذ
134
- '\b\u0627\u0644\u0631' : 'ar r' # الر
135
- '\b\u0627\u0644\u0632' : 'az z' # الز
136
- '\b\u0627\u0644\u0633' : 'as s' # الس
137
- '\b\u0627\u0644\u0634' : 'aš š' # الش
138
- '\b\u0627\u0644\u0635' : 'aṣ ṣ' # الص
139
- '\b\u0627\u0644\u0636' : 'aḍ ḍ' # الض
140
- '\b\u0627\u0644\u0637' : 'aṭ ṭ' # الط
141
- '\b\u0627\u0644\u0638' : 'aẓ ẓ' # الظ
142
- '\b\u0627\u0644\u0644' : 'al l' # الل
143
- '\b\u0627\u0644\u0646' : 'an n' # الن
144
-
145
- # ta' marboota in iso-233-1984 is all the same `aẗ`
146
- '\u0629' : 'aẗ' # ة in the middle of the sentence
147
-
148
- # Shadda
149
-
150
-
151
- '\u0628\u0651' : 'bb' # ب
152
- '\u062a\u0651' : 'tt' # ت
153
- '\u062b\u0651' : 'ṯṯ' # ث
154
- '\u062c\u0651' : 'ǧǧ' # ج
155
- '\u062d\u0651' : 'ḥḥ' # ح
156
- '\u062e\u0651' : 'ẖẖ' # خ
157
- '\u062f\u0651' : 'dd' # د
158
- '\u0630\u0651' : 'ḏḏ' # ذ
159
- '\u0631\u0651' : 'rr' # ر
160
- '\u0632\u0651' : 'zz' # ز
161
- '\u0633\u0651' : 'ss' # س
162
- '\u0634\u0651' : 'šš' # ش
163
- '\u0635\u0651' : 'ṣṣ' # ص
164
- '\u0636\u0651' : 'ḍḍ' # ض
165
- '\u0637\u0651' : 'ṭṭ' # ط
166
- '\u0638\u0651' : 'ẓẓ' # ظ
167
- '\u063a\u0651' : 'ġġ' # غ
168
- '\u0641\u0651' : 'ff' # ف
169
- '\u0642\u0651' : 'qq' # ق
170
- '\u0643\u0651' : 'kk' # ك
171
- '\u0644\u0651' : 'll' # ل
172
- '\u0645\u0651' : 'mm' # م
173
- '\u0646\u0651' : 'nn' # ن
174
- '\u0647\u0651' : 'hh' # ه
175
- '\u0648\u0651' : 'ww' # و
176
- '\u064a\u0651' : 'yy' # ي
177
-
178
-
179
- '\u0622' : '’â' # آ
180
-
181
- '\u0627' : 'â' # ا
182
-
183
- '\u0649' : 'ỳ' # ى
184
-
185
- '\u0626' : "'" # ئ
186
-
187
-
188
- '\u0621' : # ء
189
- - '’'
190
- - '' # see note A
191
-
192
- '\u0623' : 'a' # أ
193
-
194
- # See note B
195
- '\b\u0627\u0644' : 'al ' # ال
196
- # '\uFE8E' : '' # ﺎ
197
-
198
- '\u0628' : 'b' # ب
199
- '\uFE91' : 'b' # ﺑ
200
- '\uFE92' : 'b' # ﺒ
201
- '\uFE90' : 'b' # ﺐ
202
-
203
- # See note C
204
- '\u062a' : 't' # ت
205
- '\ufe97' : 't' # ﺗ
206
- '\ufe98' : 't' # ﺘ
207
- '\ufe96' : 't' # ﺖ
208
-
209
- '\u062b' : 'ṯ' # ث
210
- '\ufe9b' : 'ṯ' # ﺛ
211
- '\ufe9c' : 'ṯ' # ﺜ
212
- '\ufe9a' : 'ṯ' # ﺚ
213
-
214
- '\u062c' : 'ǧ' # ج
215
- '\ufe9f' : 'ǧ' # ﺟ
216
- '\ufea0' : 'ǧ' # ﺠ
217
- '\ufe9e' : 'ǧ' # ﺞ
218
-
219
- '\u062d' : 'ḥ' # ح
220
- '\ufea3' : 'ḥ' # ﺣ
221
- '\ufea4' : 'ḥ' # ﺤ
222
- '\ufea2' : 'ḥ' # ﺢ
223
-
224
- '\u062e' : 'ẖ' # خ
225
- '\ufea7' : 'ẖ' # ﺧ
226
- '\ufea8' : 'ẖ' # ﺨ
227
- '\ufea6' : 'ẖ' # ﺦ
228
-
229
- '\u062f' : 'd' # د
230
- '\ufeaa' : 'd' # ﺪ
231
-
232
- '\u0630' : 'ḏ' # ذ
233
- '\ufeac' : 'ḏ' # ﺬ
234
-
235
- '\u0631' : 'r' # ر
236
- '\ufeae' : 'r' # ﺮ
237
-
238
- '\u0632' : 'z' # ز
239
- '\ufeb0' : 'z' # ﺰ
240
-
241
- '\u0633' : 's' # س
242
- '\ufeb3' : 's' # ﺳ
243
- '\ufeb4' : 's' # ﺴ
244
- '\ufeb2' : 's' # ﺲ
245
-
246
- '\u0634' : 'š' # ش
247
- '\ufeb7' : 'š' # ﺷ
248
- '\ufeb8' : 'š' # ﺸ
249
- '\ufeb6' : 'š' # ﺶ
250
-
251
- '\u0635' : 'ṣ' # ص
252
- '\ufebb' : 'ṣ' # ﺻ
253
- '\ufebc' : 'ṣ' # ﺼ
254
- '\ufeba' : 'ṣ' # ﺺ
255
-
256
- '\u0636' : 'ḍ' # ض
257
- '\ufebf' : 'ḍ' # ﺿ
258
- '\ufec0' : 'ḍ' # ﻀ
259
- '\ufebe' : 'ḍ' # ﺾ
260
-
261
- '\u0637' : 'ṭ' # ط
262
- '\ufec3' : 'ṭ' # ﻃ
263
- '\ufec4' : 'ṭ' # ﻄ
264
- '\ufec2' : 'ṭ' # ﻂ
265
-
266
- '\u0638' : 'ẓ' # ظ
267
- '\ufec7' : 'ẓ' # ﻇ
268
- '\ufec8' : 'ẓ' # ﻈ
269
- '\ufec6' : 'ẓ' # ﻆ
270
-
271
- '\u0639' : '‘' # ع
272
- '\ufecb' : '‘' # ﻋ
273
- '\ufecc' : '‘' # ﻌ
274
- '\ufeca' : '‘' # ﻊ
275
-
276
- '\u063a' : 'ġ' # غ
277
- '\ufecf' : 'ġ' # ﻏ
278
- '\ufed0' : 'ġ' # ﻐ
279
- '\ufece' : 'ġ' # ﻎ
280
-
281
- '\u0641' : 'f' # ف
282
- '\ufed3' : 'f' # ﻓ
283
- '\ufed4' : 'f' # ﻔ
284
- '\ufed2' : 'f' # ﻒ
285
-
286
- '\u0642' : 'q' # ق
287
- '\ufed7' : 'q' # ﻗ
288
- '\ufed8' : 'q' # ﻘ
289
- '\ufed6' : 'q' # ﻖ
290
-
291
- '\u0643' : 'k' # ك
292
- '\ufedb' : 'k' # ﻛ
293
- '\ufedc' : 'k' # ﻜ
294
- '\ufeda' : 'k' # ﻚ
295
-
296
- '\u0644' : 'l' # ل
297
- '\ufedf' : 'l' # ﻟ
298
- '\ufee0' : 'l' # ﻠ
299
- '\ufede' : 'l' # ﻞ
300
-
301
- '\u0645' : 'm' # م
302
- '\ufee3' : 'm' # ﻣ
303
- '\ufee4' : 'm' # ﻤ
304
- '\ufee2' : 'm' # ﻢ
305
-
306
- '\u0646' : 'n' # ن
307
- '\ufee7' : 'n' # ﻧ
308
- '\ufee8' : 'n' # ﻨ
309
- '\ufee6' : 'n' # ﻦ
310
-
311
- # See note C
312
- '\u0647' : 'h' # ه
313
- '\ufeeb' : 'h' # ﻫ
314
- '\ufeec' : 'h' # ﻬ
315
- '\ufeea' : 'h' # ﻪ
316
-
317
- '\u0648' : 'w' # و
318
- '\ufeee' : 'w' # ﻮ
319
-
320
- '\u064a' : 'y' # ي
321
- '\ufef3' : 'y' # ﻳ
322
- '\ufef4' : 'y' # ﻴ
323
- '\ufef1' : 'y' # ﻱ
@@ -1,609 +0,0 @@
1
- ---
2
- authority_id: iso
3
- id: 1997
4
- language: ell
5
- source_script: Grek
6
- destination_script: Latn
7
- name: ISO 843:1997
8
- url:
9
- creation_date: 1997
10
- description: |
11
- ISO Transliteration table for Greek
12
-
13
- note:
14
- - Transliteration of Greek into Latin: Type 1, Clause 3 Table 1
15
- - Equivalent to elot-ell-Grek-Latn-743-2001-ts, the transliteration table of ELOT 743:2001
16
- - Assuming that ou, au, eu transliterations are only intended for historical diphthongs /u, av, ev/, and that όυ, άυ, έυ are not to be transliterated as ou, au, eu
17
- - Introduced casing to digamma and lunate sigma. (Casing was a late introduction to character sets for those characters.)
18
-
19
- tests:
20
-
21
- - source: |
22
- Ένα πράμα μόνον με παρακίνησε κι εμένα να γράψω ότι τούτην την πατρίδα την έχομεν όλοι μαζί, και σοφοί κι αμαθείς και πλούσιοι και φτωχοί και πολιτικοί και στρατιωτικοί και οι πλέον μικρότεροι άνθρωποι· όσοι αγωνιστήκαμεν, αναλόγως ο καθείς, έχομεν να ζήσομεν εδώ. Το λοιπόν δουλέψαμεν όλοι μαζί, να την φυλάμεν κι όλοι μαζί και να μην λέγει ούτε ο δυνατός «εγώ» ούτε ο αδύνατος. Ξέρετε πότε να λέγει ο καθείς «εγώ»; Όταν αγωνιστεί μόνος του και φκιάσει ή χαλάσει, να λέγει «εγώ»· όταν όμως αγωνίζονται πολλοί και φκιάνουν, τότε να λένε «εμείς». Είμαστε εις το «εμείς» κι όχι εις το «εγώ». Και εις το εξής να μάθομεν γνώση, αν θέλομεν να φκιάσομεν χωριόν, να ζήσομεν όλοι μαζί.
23
-
24
- Γιάννης Μακρυγιάννης.
25
-
26
- expected: |
27
- Éna práma mónon me parakínīse ki eména na grápsō óti toútīn tīn patrída tīn échomen óloi mazí, kai sofoí ki amatheís kai ploúsioi kai ftōchoí kai politikoí kai stratiōtikoí kai oi pléon mikróteroi ánthrōpoi; ósoi agōnistī́kamen, analógōs o katheís, échomen na zī́somen edṓ. To loipón doulépsamen óloi mazí, na tīn fylámen ki óloi mazí kai na mīn légei oúte o dynatós «egṓ» oúte o adýnatos. Xérete póte na légei o katheís «egṓ»? Ótan agōnisteí mónos tou kai fkiásei ī́ chalásei, na légei «egṓ»; ótan ómōs agōnízontai polloí kai fkiánoun, tóte na léne «emeís». Eímaste eis to «emeís» ki óchi eis to «egṓ». Kai eis to exī́s na máthomen gnṓsī, an thélomen na fkiásomen chōrión, na zī́somen óloi mazí.
28
-
29
- Giánnīs Makrygiánnīs.
30
-
31
-
32
- - source: ΑΘΗΝΑ
33
- expected: ATHĪNA
34
- - source: μπαμπάκι
35
- expected: mpampáki
36
- - source: νταντά
37
- expected: ntantá
38
- - source: γκέγκε
39
- expected: gkégke
40
- - source: Γκαμπόν
41
- expected: Gkampón
42
- - source: Μάγχη
43
- expected: Mágchī
44
- - source: κογξ
45
- expected: kogx
46
- - source: υιός
47
- expected: yiós
48
- - source: Υιός
49
- expected: Yiós
50
- - source: νεράντζι
51
- expected: nerántzi
52
- - source: Γοίθιος
53
- expected: Goíthios
54
- - source: μπέικον
55
- expected: mpéikon
56
- - source: μπέϊκον
57
- expected: mpéïkon
58
- - source: βόλεϊ
59
- expected: vóleï
60
- - source: αθεΐα
61
- expected: atheḯa
62
- - source: Εϊγιαφιάτλαγιοκουτλ
63
- expected: Eïgiafiátlagiokoutl
64
- - source: Εΐτζι
65
- expected: Eḯtzi
66
- - source: Μυρτώο
67
- expected: Myrtṓo
68
- - source: αέρας
69
- expected: aéras
70
- - source: γαυ γαυ
71
- expected: gau gau
72
- - source: Ταΰγετος
73
- expected: Taÿ́getos
74
- - source: σπρέυ
75
- expected: spréy
76
-
77
- - source: Αθήνα
78
- expected: Athī́na
79
- - source: Άγιον Όρος
80
- expected: Ágion Óros
81
- - source: Άγραφα
82
- expected: Ágrafa
83
- - source: Αγρίνιο
84
- expected: Agrínio
85
- - source: Αίγινα
86
- expected: Aígina
87
- - source: Αίγιο
88
- expected: Aígio
89
- - source: Αλεξανδρούπολη
90
- expected: Alexandroúpolī
91
- - source: Αλεποχώρι
92
- expected: Alepochṓri
93
- - source: Αμοργός
94
- expected: Amorgós
95
- - source: Άμφισσα
96
- expected: Ámfissa
97
- - source: Αράχωβα
98
- expected: Aráchōva
99
- - source: Άργος
100
- expected: Árgos
101
- - source: Αρκαδία
102
- expected: Arkadía
103
- - source: Άρτα
104
- expected: Árta
105
- - source: Βελούχι
106
- expected: Veloúchi
107
- - source: Βέροια
108
- expected: Véroia
109
- - source: Βοιωτία
110
- expected: Voiōtía
111
- - source: Βόλος
112
- expected: Vólos
113
- - source: Βόνιτσα
114
- expected: Vónitsa
115
- - source: Γαλαξίδι
116
- expected: Galaxídi
117
- - source: Γαλάτσι
118
- expected: Galátsi
119
- - source: Γιαννιτσά
120
- expected: Giannitsá
121
- - source: Γλυφάδα
122
- expected: Glyfáda
123
- - source: Γρανίτσα
124
- expected: Granítsa
125
- - source: Γρεβενά
126
- expected: Grevená
127
- - source: Γύθειο
128
- expected: Gýtheio
129
- - source: Διόνυσος
130
- expected: Diónysos
131
- - source: Δίστομο
132
- expected: Dístomo
133
- - source: Δολιανά
134
- expected: Dolianá
135
- - source: Δράμα
136
- expected: Dráma
137
- - source: Δωδεκάνησα
138
- expected: Dōdekánīsa
139
- - source: Έδεσσα
140
- expected: Édessa
141
- - source: Ελευσίνα
142
- expected: Eleusína
143
- - source: Επίδαυρος
144
- expected: Epídauros
145
- - source: Επτάνησα
146
- expected: Eptánīsa
147
- - source: Ερμούπολη
148
- expected: Ermoúpolī
149
- - source: Εύβοια
150
- expected: Eúvoia
151
- - source: Ζάκυνθος
152
- expected: Zákynthos
153
- - source: Ήπειρος
154
- expected: Ī́peiros
155
- - source: Ηράκλειο
156
- expected: Īrákleio
157
- - source: Θάσος
158
- expected: Thásos
159
- - source: Θεσσαλονίκη
160
- expected: Thessaloníkī
161
- - source: Θεσσαλία
162
- expected: Thessalía
163
- - source: Θεσπρωτία
164
- expected: Thesprōtía
165
- - source: Θήβα
166
- expected: Thī́va
167
- - source: Θράκη
168
- expected: Thrákī
169
- - source: Ιθάκη
170
- expected: Ithákī
171
- - source: Ίος
172
- expected: Íos
173
- - source: Ιωάννινα
174
- expected: Iōánnina
175
- - source: Καβάλα
176
- expected: Kavála
177
- - source: Καλάβρυτα
178
- expected: Kalávryta
179
- - source: Καλαμάτα
180
- expected: Kalamáta
181
- - source: Καλαμπάκα
182
- expected: Kalampáka
183
- - source: Καλύβια
184
- expected: Kalývia
185
- - source: Κάλυμνος
186
- expected: Kálymnos
187
- - source: Καρδίτσα
188
- expected: Kardítsa
189
- - source: Καρπενήσι
190
- expected: Karpenī́si
191
- - source: Κάρυστος
192
- expected: Kárystos
193
- - source: Καστελλόριζο
194
- expected: Kastellórizo
195
- - source: Καστοριά
196
- expected: Kastoriá
197
- - source: Κατερίνη
198
- expected: Katerínī
199
- - source: Κάτω Αχαΐα
200
- expected: Kátō Achaḯa
201
- - source: Κερατέα
202
- expected: Keratéa
203
- - source: Κέρκυρα
204
- expected: Kérkyra
205
- - source: Κεφαλλονιά
206
- expected: Kefalloniá
207
- - source: Κηφισιά
208
- expected: Kīfisiá
209
- - source: Κιλκίς
210
- expected: Kilkís
211
- - source: Κοζάνη
212
- expected: Kozánī
213
- - source: Κολωνός
214
- expected: Kolōnós
215
- - source: Κομοτηνή
216
- expected: Komotīnī́
217
- - source: Κόρινθος
218
- expected: Kórinthos
219
- - source: Κορώνη
220
- expected: Korṓnī
221
- - source: Κρανίδι
222
- expected: Kranídi
223
- - source: Κρέστενα
224
- expected: Kréstena
225
- - source: Κρήτη
226
- expected: Krī́tī
227
- - source: Κύθηρα
228
- expected: Kýthīra
229
- - source: Κυκλάδες
230
- expected: Kykládes
231
- - source: Κύμη
232
- expected: Kýmī
233
- - source: Κυψέλη
234
- expected: Kypsélī
235
- - source: Κως
236
- expected: Kōs
237
- - source: Λαγκαδάς
238
- expected: Lagkadás
239
- - source: Λαμία
240
- expected: Lamía
241
- - source: Λάρισα
242
- expected: Lárisa
243
- - source: Λαύριο
244
- expected: Laúrio
245
- - source: Λέρος
246
- expected: Léros
247
- - source: Λέσβος
248
- expected: Lésvos
249
- - source: Λευκάδα
250
- expected: Leukáda
251
- - source: Λήμνος
252
- expected: Lī́mnos
253
- - source: Λιβαδειά
254
- expected: Livadeiá
255
- - source: Μακεδονία
256
- expected: Makedonía
257
- - source: Μάνη
258
- expected: Mánī
259
- - source: Μαραθώνας
260
- expected: Marathṓnas
261
- - source: Μαρκόπουλο
262
- expected: Markópoulo
263
- - source: Μαρούσι
264
- expected: Maroúsi
265
- - source: Μέγαρα
266
- expected: Mégara
267
- - source: Μεσολόγγι
268
- expected: Mesológgi
269
- - source: Μεταξουργείο
270
- expected: Metaxourgeío
271
- - source: Μέτσοβο
272
- expected: Métsovo
273
- - source: Μήλος
274
- expected: Mī́los
275
- - source: Μύκονος
276
- expected: Mýkonos
277
- - source: Μυστράς
278
- expected: Mystrás
279
- - source: Μυτιλήνη
280
- expected: Mytilī́nī
281
- - source: Νάξος
282
- expected: Náxos
283
- - source: Νάουσα
284
- expected: Náousa
285
- - source: Ναύπακτος
286
- expected: Naúpaktos
287
- - source: Ναύπλιο
288
- expected: Naúplio
289
- - source: Νέα Σμύρνη
290
- expected: Néa Smýrnī
291
- - source: Νίσυρος
292
- expected: Nísyros
293
- - source: Ξάνθη
294
- expected: Xánthī
295
- - source: Όλυμπος
296
- expected: Ólympos
297
- - source: Παγκράτι
298
- expected: Pagkráti
299
- - source: Παπάγου
300
- expected: Papágou
301
- - source: Πάρος
302
- expected: Páros
303
- - source: Πασαλιμάνι
304
- expected: Pasalimáni
305
- - source: Πατήσια
306
- expected: Patī́sia
307
- - source: Πάτμος
308
- expected: Pátmos
309
- - source: Πάτρα
310
- expected: Pátra
311
- - source: Πειραιάς
312
- expected: Peiraiás
313
- - source: Πελοπόννησος
314
- expected: Pelopónnīsos
315
- - source: Περιστέρι
316
- expected: Peristéri
317
- - source: Πεύκη
318
- expected: Peúkī
319
- - source: Πήλιο
320
- expected: Pī́lio
321
- - source: Πολύγυρος
322
- expected: Polýgyros
323
- - source: Πόρος
324
- expected: Póros
325
- - source: Πρέβεζα
326
- expected: Préveza
327
- - source: Πτολεμαΐδα
328
- expected: Ptolemaḯda
329
- - source: Πύλος
330
- expected: Pýlos
331
- - source: Πύργος
332
- expected: Pýrgos
333
- - source: Ρέθυμνο
334
- expected: Réthymno
335
- - source: Ρόδος
336
- expected: Ródos
337
- - source: Ρούμελη
338
- expected: Roúmelī
339
- - source: Σαλαμίνα
340
- expected: Salamína
341
- - source: Σαμοθράκη
342
- expected: Samothrákī
343
- - source: Σάμος
344
- expected: Sámos
345
- - source: Σαντορίνη
346
- expected: Santorínī
347
- - source: Σέρρες
348
- expected: Sérres
349
- - source: Σίκινος
350
- expected: Síkinos
351
- - source: Σίφνος
352
- expected: Sífnos
353
- - source: Σκιάθος
354
- expected: Skiáthos
355
- - source: Σκόπελος
356
- expected: Skópelos
357
- - source: Σούλι
358
- expected: Soúli
359
- - source: Σπάρτη
360
- expected: Spártī
361
- - source: Στερεά Ελλάδα
362
- expected: Stereá Elláda
363
- - source: Στύρα
364
- expected: Stýra
365
- - source: Σύμη
366
- expected: Sýmī
367
- - source: Σύρος
368
- expected: Sýros
369
- - source: Σφακιά
370
- expected: Sfakiá
371
- - source: Τήλος
372
- expected: Tī́los
373
- - source: Τήνος
374
- expected: Tī́nos
375
- - source: Τρίκαλα
376
- expected: Tríkala
377
- - source: Τρίπολη
378
- expected: Trípolī
379
- - source: Τσακωνιά
380
- expected: Tsakōniá
381
- - source: Ύδρα
382
- expected: Ýdra
383
- - source: Φάληρο
384
- expected: Fálīro
385
- - source: Φλώρινα
386
- expected: Flṓrina
387
- - source: Φολέγανδρος
388
- expected: Folégandros
389
- - source: Χάλκη
390
- expected: Chálkī
391
- - source: Χαλκίδα
392
- expected: Chalkída
393
- - source: Χαλάνδρι
394
- expected: Chalándri
395
- - source: Χαλκιδική
396
- expected: Chalkidikī́
397
- - source: Χανιά
398
- expected: Chaniá
399
- - source: Χίος
400
- expected: Chíos
401
- - source: Ψαρά
402
- expected: Psará
403
- - source: Αβάνα
404
- expected: Avána
405
- - source: Αγγλία
406
- expected: Agglía
407
- - source: Αϊβαλί
408
- expected: Aïvalí
409
- - source: Αλεξάνδρεια
410
- expected: Alexándreia
411
- - source: Άμστερνταμ
412
- expected: Ámsterntam
413
- - source: Βαυαρία
414
- expected: Vauaría
415
- - source: Βενετία
416
- expected: Venetía
417
- - source: Βερολίνο
418
- expected: Verolíno
419
- - source: Βερόνα
420
- expected: Veróna
421
- - source: Βιέννη
422
- expected: Viénnī
423
- - source: Γένοβα
424
- expected: Génova
425
- - source: Δουβλίνο
426
- expected: Douvlíno
427
- - source: Καλαβρία
428
- expected: Kalavría
429
- - source: Καλιφόρνια
430
- expected: Kalifórnia
431
- - source: Καύκασος
432
- expected: Kaúkasos
433
- - source: Κονγκό
434
- expected: Kongkó
435
- - source: Κορσική
436
- expected: Korsikī́
437
- - source: Κουρδιστάν
438
- expected: Kourdistán
439
- - source: Κωνσταντινούπολη
440
- expected: Kōnstantinoúpolī
441
- - source: Κατεχόμενη Κύπρος
442
- expected: Katechómenī Kýpros
443
- - source: Λαπωνία
444
- expected: Lapōnía
445
- - source: Λευκωσία
446
- expected: Leukōsía
447
- - source: Λιβόρνο
448
- expected: Livórno
449
- - source: Λονδίνο
450
- expected: Londíno
451
- - source: Λυών
452
- expected: Lyṓn
453
- - source: Μάλαγα
454
- expected: Málaga
455
- - source: Μασσαλία
456
- expected: Massalía
457
- - source: Μικρονησία
458
- expected: Mikronīsía
459
- - source: Μιλάνο
460
- expected: Miláno
461
- - source: Μόσχα
462
- expected: Móscha
463
- - source: Μπολόνια
464
- expected: Mpolónia
465
- - source: Νάπολη
466
- expected: Nápolī
467
- - source: Νταγκεστάν
468
- expected: Ntagkestán
469
- - source: Νέα Υόρκη
470
- expected: Néa Yórkī
471
- - source: Οξφόρδη
472
- expected: Oxfórdī
473
- - source: Ουαλία
474
- expected: Oualía
475
- - source: Παρίσι
476
- expected: Parísi
477
- - source: Πάφος
478
- expected: Páfos
479
- - source: Πολυνησία
480
- expected: Polynīsía
481
- - source: Ρώμη
482
- expected: Rṓmī
483
- - source: Σαμάρεια
484
- expected: Samáreia
485
- - source: Σικελία
486
- expected: Sikelía
487
- - source: Σκανδιναβία
488
- expected: Skandinavía
489
- - source: Σκόπια
490
- expected: Skópia
491
- - source: Σκωτία
492
- expected: Skōtía
493
- - source: Σμύρνη
494
- expected: Smýrnī
495
- - source: Ταϊτή
496
- expected: Taïtī́
497
- - source: Ταταρστάν
498
- expected: Tatarstán
499
- - source: Τζαμάικα
500
- expected: Tzamáika
501
- - source: Τηλλυρία
502
- expected: Tīllyría
503
- - source: Τιρόλο
504
- expected: Tirólo
505
- - source: Τορίνο
506
- expected: Toríno
507
- - source: Φανάρι
508
- expected: Fanári
509
- - source: Φλωρεντία
510
- expected: Flōrentía
511
- - source: Χαβάη
512
- expected: Chaváī
513
- - source: Χονγκ Κονγκ
514
- expected: Chongk Kongk
515
-
516
- map:
517
- # https://en.wikipedia.org/wiki/Romanization_of_Greek
518
- rules:
519
- - pattern: (?<=[ΑαΕεΟο])\u03A5 # Υ (after Α, Ε, Ο)
520
- result: U
521
- - pattern: (?<=[ΑαΕεΟο])\u03C5 # υ (after Α, Ε, Ο)
522
- result: u
523
- - pattern: (?<=[ΑαΕεΟο])\u03CD # ύ (after Α, Ε, Ο)
524
- result: ú
525
- - pattern: \u037E # ; (Greek question mark)
526
- result: "?"
527
- - pattern: \u003B # ; (ASCII semicolon, treated as a Greek question mark)
528
- result: "?"
529
-
530
- characters:
531
- "\u0027": ""
532
- "\u0386": "Á" # Ά
533
- "\u0391": "A" # Α
534
- "\u0392": "V" # Β
535
- "\u0393": "G" # Γ
536
- "\u0394": "D" # Δ
537
- "\u0395": "E" # Ε
538
- "\u0396": "Z" # Ζ
539
- "\u0397": "Ī" # Η
540
- "\u0398": "Th" # Θ
541
- "\u0399": "I" # Ι
542
- "\u039A": "K" # Κ
543
- "\u039B": "L" # Λ
544
- "\u039C": "M" # Μ
545
- "\u039D": "N" # Ν
546
- "\u039E": "X" # Ξ
547
- "\u039F": "O" # Ο
548
- "\u03A0": "P" # Π
549
- "\u03A1": "R" # Ρ
550
- "\u03A3": "S" # Σ
551
- "\u03A4": "T" # Τ
552
- "\u03A5": "Y" # Υ
553
- "\u03A6": "F" # Φ
554
- "\u03A7": "Ch" # Χ
555
- "\u03A8": "Ps" # Ψ
556
- "\u03A9": "Ō" # Ω
557
- "\u0388": "É" # Έ
558
- "\u0389": "Ī́" # Ή
559
- "\u038A": "Í" # Ί
560
- "\u038C": "Ó" # Ό
561
- "\u038E": "Ý" # Ύ
562
- "\u038F": "Ṓ" # Ώ
563
- "\u03AA": "Ï" # Ϊ
564
- "\u03AB": "Ÿ" # Ϋ
565
-
566
- "\u03AC": "á" # ά
567
- "\u03B1": "a" # α
568
- "\u03B2": "v" # β
569
- "\u03B3": "g" # γ
570
- "\u03B4": "d" # δ
571
- "\u03B5": "e" # ε
572
- "\u03B6": "z" # ζ
573
- "\u03B7": "ī" # η
574
- "\u03B8": "th" # θ
575
- "\u03B9": "i" # ι
576
- "\u03BA": "k" # κ
577
- "\u03BB": "l" # λ
578
- "\u03BC": "m" # μ
579
- "\u03BD": "n" # ν
580
- "\u03BE": "x" # ξ
581
- "\u03BF": "o" # ο
582
- "\u03C0": "p" # π
583
- "\u03C1": "r" # ρ
584
- "\u03C3": "s" # σ
585
- "\u03C2": "s" # ς
586
- "\u03C4": "t" # τ
587
- "\u03C5": "y" # υ
588
- "\u03C6": "f" # φ
589
- "\u03C7": "ch" # χ
590
- "\u03C8": "ps" # ψ
591
- "\u03C9": "ō" # ω
592
- "\u03AD": "é" # έ
593
- "\u03AE": "ī́" # ή
594
- "\u03AF": "í" # ί
595
- "\u03CC": "ó" # ό
596
- "\u03CD": "ý" # ύ
597
- "\u03CE": "ṓ" # ώ
598
- "\u03CA": "ï" # ϊ
599
- "\u03CB": "ÿ" # ϋ
600
- "\u0390": "ḯ" # ΐ
601
- "\u03B0": "ÿ́" # ΰ
602
-
603
- "\u03DC": "W" # Ϝ
604
- "\u03DD": "w" # ϝ
605
- "\u03F2": "s" # ϲ
606
- "\u03F9": "S" # Ϲ
607
-
608
- "\u0387": ";" # ·
609
- "\u00B7": ";" # ·