interscript 0.1.2 → 0.1.3

Sign up to get free protection for your applications and to get access to all the features.
Files changed (120) hide show
  1. checksums.yaml +4 -4
  2. data/README.adoc +246 -14
  3. data/bin/interscript +38 -17
  4. data/bin/setup +8 -0
  5. data/lib/g2pwrapper.py +34 -0
  6. data/lib/interscript.rb +140 -16
  7. data/lib/interscript/command.rb +27 -0
  8. data/lib/interscript/mapping.rb +125 -0
  9. data/lib/interscript/version.rb +1 -1
  10. data/lib/model-7 +0 -0
  11. data/lib/tha-pt-b-7 +0 -0
  12. data/maps/acadsin-zho-Hani-Latn-2002.yaml +38912 -0
  13. data/maps/alalc-bel-cyrl-latn-1997.yaml +125 -0
  14. data/maps/alalc-ben-Beng-Latn-2017.yaml +130 -0
  15. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +94 -0
  16. data/maps/alalc-ell-Grek-Latn-1997.yaml +625 -0
  17. data/maps/alalc-ell-Grek-Latn-2010.yaml +628 -0
  18. data/maps/alalc-kat-Geok-Latn-1997.yaml +112 -0
  19. data/maps/alalc-kat-Geor-Latn-1997.yaml +146 -0
  20. data/maps/alalc-kor-Hang-Latn-1997.yaml +94 -0
  21. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +103 -0
  22. data/maps/alalc-mkd-cyrl-latn-1997.yaml +114 -0
  23. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +114 -0
  24. data/maps/alalc-srp-cyrl-latn-2013.yaml +135 -0
  25. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +141 -0
  26. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +16 -0
  27. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +283 -0
  28. data/maps/{bas-rus-Cyrl-Latn-bss.yaml → bas-rus-Cyrl-Latn-2017-bss.yaml} +57 -31
  29. data/maps/{bas-rus-Cyrl-Latn-oss.yaml → bas-rus-Cyrl-Latn-2017-oss.yaml} +54 -34
  30. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +294 -0
  31. data/maps/bgn-kor-Hang-Latn-1943.yaml +31 -0
  32. data/maps/bgn-kor-Kore-Latn-1943.yaml +31 -0
  33. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +208 -0
  34. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +208 -0
  35. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +1 -2
  36. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +104 -0
  37. data/maps/bgnpcgn-bel-cyrl-latn-1979.yaml +285 -0
  38. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +115 -0
  39. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +10 -64
  40. data/maps/bgnpcgn-chn-Hans-Latn-1979.yaml +7456 -0
  41. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +702 -0
  42. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +20 -0
  43. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +257 -0
  44. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +127 -0
  45. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +43 -0
  46. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +253 -0
  47. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +48 -0
  48. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +48 -0
  49. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +159 -0
  50. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +190 -0
  51. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +145 -64
  52. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +166 -0
  53. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +75 -2
  54. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +208 -0
  55. data/maps/by-bel-Cyrl-Latn-1998.yaml +168 -0
  56. data/maps/by-bel-Cyrl-Latn-2007.yaml +115 -0
  57. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +685 -0
  58. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +681 -0
  59. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +20 -0
  60. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +32 -0
  61. data/maps/ggg-kat-Geor-Latn-2002.yaml +89 -0
  62. data/maps/gki-bel-cyrl-latn-1992.yaml +33 -0
  63. data/maps/gki-bel-cyrl-latn-2000.yaml +201 -0
  64. data/maps/gost-rus-cyrl-latn-16876-71-1983.yaml +186 -0
  65. data/maps/hk-yue-Hani-Latn-1888.yaml +38497 -0
  66. data/maps/icao-bel-Cyrl-Latn-9303.yaml +108 -92
  67. data/maps/icao-bul-Cyrl-Latn-9303.yaml +1 -2
  68. data/maps/icao-heb-Hebr-Latn-9303.yaml +118 -124
  69. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +1 -2
  70. data/maps/icao-per-Arab-Latn-9303.yaml +5 -6
  71. data/maps/icao-rus-Cyrl-Latn-9303.yaml +1 -2
  72. data/maps/icao-srp-Cyrl-Latn-9303.yaml +1 -2
  73. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +1 -2
  74. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +610 -0
  75. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +41 -0
  76. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +62 -0
  77. data/maps/{iso-rus-Cyrl-Latn-iso9.yaml → iso-rus-Cyrl-Latn-9-1995.yaml} +2 -3
  78. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +109 -0
  79. data/maps/kp-kor-Hang-Latn-2002.yaml +901 -0
  80. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +44820 -0
  81. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +411 -0
  82. data/maps/moct-kor-Hang-Latn-2000.yaml +803 -0
  83. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +541 -0
  84. data/maps/nil-kor-Hang-Hang-jamo.yaml +11193 -0
  85. data/maps/odni-kat-Geor-Latn-2015.yaml +88 -0
  86. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +157 -0
  87. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +90 -0
  88. data/maps/royin-tha-Thai-Latn-1968.yaml +179 -0
  89. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +180 -0
  90. data/maps/royin-tha-Thai-Latn-1999.yaml +76 -0
  91. data/maps/{cn-chn-Hans-Latn-pinyin.yaml → sac-zho-Hans-Latn-1979.yaml} +6 -7
  92. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +222 -0
  93. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +193 -0
  94. data/maps/un-bel-Cyrl-Latn-2007.yaml +114 -0
  95. data/maps/un-ben-Beng-Latn-2016.yaml +534 -0
  96. data/maps/un-ell-Grek-Latn-1987-tl.yaml +32 -0
  97. data/maps/un-ell-Grek-Latn-1987-ts.yaml +20 -0
  98. data/maps/un-ell-Grek-Latn-phonetic-1987.yaml +780 -0
  99. data/maps/un-mon-Mong-Latn-2013.yaml +19 -6
  100. data/maps/un-rus-Cyrl-Latn-1987.yaml +166 -0
  101. data/maps/un-ukr-cyrl-latn-1998.yaml +30 -0
  102. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +406 -0
  103. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +386 -0
  104. data/maps/var-kor-Hang-Latn-mr-1939.yaml +1054 -0
  105. data/maps/var-kor-Kore-Hang-2013.yaml +59754 -0
  106. data/maps/var-kor-Kore-Latn-mr-1939.yaml +37 -0
  107. data/maps/var-tha-Thai-Thai-phonemic.yaml +59 -0
  108. data/maps/var-tha-Thai-Zsym-ipa.yaml +301 -0
  109. data/maps/var-zho-Hani-Latn-1979.yaml +38908 -0
  110. data/spec/interscript/mapping_spec.rb +42 -0
  111. data/spec/interscript_spec.rb +20 -5
  112. data/spec/spec_helper.rb +3 -1
  113. metadata +149 -24
  114. data/maps/bgnpcgn-chn-Hans-Latn-pinyin.yaml +0 -7503
  115. data/maps/historic-jpn-Hrkt-Latn-hepburn.yaml +0 -336
  116. data/maps/icao-gre-Grek-Latn-9303.yaml +0 -101
  117. data/maps/mext-jpn-Hrkt-Latn-hepburn.yaml +0 -330
  118. data/maps/mext-jpn-Hrkt-Latn-kunrei.yaml +0 -308
  119. data/maps/un-jpn-Hrkt-Latn-hepburn.yaml +0 -313
  120. data/maps/un-jpn-Hrkt-Latn-kunrei.yaml +0 -354
@@ -0,0 +1,115 @@
1
+ ---
2
+ authority_id: by
3
+ id: 2007
4
+ language: bel
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: REGULATORY LEGAL ACTS OF THE NATIONAL BANK, NATIONAL ACADEMY OF SCIENCES OF BELARUS, MINISTRIES, OTHER REPUBLICAN GOVERNMENT BODIES 8/16668
8
+ url: http://www.pravo.by/pdf/2007-159/2007-159(027-028).pdf
9
+ creation_date: 2007
10
+ description: |
11
+ RESOLUTION OF THE STATE COMMITTEE
12
+ ON PROPERTY OF THE REPUBLIC OF BELARUS June 11, 2007 No. 38
13
+
14
+ 8/16668 (06/18/2007) On amendments and additions to the Instructions
15
+ for the transliteration of geographical names of the
16
+ Republic of Belarus in letters of the Latin alphabet
17
+
18
+ Based on the Regulation on the State Property Committee of the Republic of Belarus,
19
+ approved by the Decree of the Council of Ministers of the Republic of Belarus dated July 29, 2006
20
+ No. 958 "Issues of the State Committee on Property of the Republic of Belarus"
21
+
22
+ tests:
23
+ - source: Аршанскi
24
+ expected: Aršanski
25
+ - source: Бешанковічы
26
+ expected: Biešankovičy
27
+ - source: Віцебск
28
+ expected: Viciebsk
29
+ - source: Гомель
30
+ expected: Homieĺ
31
+ - source: Гаўя
32
+ expected: Haŭja
33
+ - source: Добруш
34
+ expected: Dobruš
35
+ - source: Ельск
36
+ expected: Jeĺsk
37
+ - source: Бабаедава
38
+ expected: Babajedava
39
+ - source: Венцавічы
40
+ expected: Viencavičy
41
+ - source: Ёды
42
+ expected: Jody
43
+ - source: Вераб'ёвічы
44
+ expected: Vierabjovičy
45
+ - source: Мёры
46
+ expected: Miory
47
+ - source: Зэльва
48
+ expected: Zeĺva
49
+ - source: Iванава
50
+ expected: Ivanava
51
+ - source: Iўе
52
+ expected: Iŭje
53
+ - source: Лагойск
54
+ expected: Lahojsk
55
+ - source: Круглае
56
+ expected: Kruhlaje
57
+ - source: Лошыца
58
+ expected: Lošyca
59
+ - source: Любань
60
+ expected: Liubań
61
+ - source: Магілёў
62
+ expected: Mahilioŭ
63
+ - source: Нясвіж
64
+ expected: Niasviž
65
+ - source: Орша
66
+ expected: Orša
67
+ - source: Паставы
68
+ expected: Pastavy
69
+ - source: Рагачоў
70
+ expected: Rahačoŭ
71
+ - source: Смаргонь
72
+ expected: Smarhoń
73
+ - source: Талачын
74
+ expected: Talačyn
75
+ - source: Узда
76
+ expected: Uzda
77
+ - source: Шаркаўшчына
78
+ expected: Šarkaŭščyna
79
+ - source: Фаніпаль
80
+ expected: Fanipaĺ
81
+ - source: Хоцімск
82
+ expected: Chocimsk
83
+ - source: Цёмны Лес
84
+ expected: Ciomny Lies
85
+ - source: Чавусы
86
+ expected: Čavusy
87
+ - source: Шумілiна
88
+ expected: Šumilina
89
+ - source: Чыгірынка
90
+ expected: Čyhirynka
91
+ - source: Чэрвень
92
+ expected: Červień
93
+ - source: Друць
94
+ expected: Druć
95
+ - source: Чачэрск
96
+ expected: Čačersk
97
+ - source: Юхнаўка
98
+ expected: Juchnaŭka
99
+ - source: Гаюціна
100
+ expected: Hajucina
101
+ - source: Цюрлі
102
+ expected: Ciurli
103
+ - source: Любонічы
104
+ expected: Liuboničy
105
+ - source: Ямнае
106
+ expected: Jamnaje
107
+ - source: Баяры
108
+ expected: Bajary
109
+ - source: Валяр'яны
110
+ expected: Valiarjany
111
+ - source: Вязынка
112
+ expected: Viazynka
113
+
114
+ map:
115
+ inherit: by-bel-Cyrl-Latn-1998
@@ -0,0 +1,685 @@
1
+ ---
2
+ authority_id: elot
3
+ id: 1982
4
+ language: ell
5
+ source_script: Grek
6
+ destination_script: Latn
7
+ name: ELOT 743:1982 (transliteration)
8
+ url:
9
+ creation_date: 1982
10
+ description: |
11
+ ELOT 743:1982 transliteration table for Greek
12
+
13
+ note:
14
+ - This was the intended system in ELOT 743:1982 for transliteration, as is apparent from un-ell-Grek-Latn-1987-tl and iso-ell-Grek-Latn-843-1997-t2, and ELOT 743:2001, Annex B; but the reversible character diacritics are missing from the currently available document, and the document does not indicate what they were supposed to be.
15
+ - "\"Transliteration\" as used in this specification and its inheritors refers to reversible transliteration, as distinct from \"transcription\", which is a simpler transliteration and which is intended for default use."
16
+
17
+ tests:
18
+ - source: |
19
+ Ένα πράμα μόνον με παρακίνησε κι εμένα να γράψω ότι τούτην την πατρίδα την έχομεν όλοι μαζί, και σοφοί κι αμαθείς και πλούσιοι και φτωχοί και πολιτικοί και στρατιωτικοί και οι πλέον μικρότεροι άνθρωποι· όσοι αγωνιστήκαμεν, αναλόγως ο καθείς, έχομεν να ζήσομεν εδώ. Το λοιπόν δουλέψαμεν όλοι μαζί, να την φυλάμεν κι όλοι μαζί και να μην λέγει ούτε ο δυνατός «εγώ» ούτε ο αδύνατος. Ξέρετε πότε να λέγει ο καθείς «εγώ»; Όταν αγωνιστεί μόνος του και φκιάσει ή χαλάσει, να λέγει «εγώ»· όταν όμως αγωνίζονται πολλοί και φκιάνουν, τότε να λένε «εμείς». Είμαστε εις το «εμείς» κι όχι εις το «εγώ». Και εις το εξής να μάθομεν γνώση, αν θέλομεν να φκιάσομεν χωριόν, να ζήσομεν όλοι μαζί.
20
+
21
+ Γιάννης Μακρυγιάννης.
22
+
23
+ expected: |
24
+ Éna práma mónon me parakíni̱se ki eména na grápso̱ óti toúti̱n ti̱n patrída ti̱n échomen óloi mazí, kai sofoí ki amatheís kai ploúsioi kai fto̱choí kai politikoí kai stratio̱tikoí kai oi pléon mikróteroi ánthro̱poi; ósoi ago̱nistí̱kamen, analógo̱s o katheís, échomen na zí̱somen edó̱. To loipón doulépsamen óloi mazí, na ti̱n fylámen ki óloi mazí kai na mi̱n légei oúte o dynatós «egó̱» oúte o adýnatos. Xérete póte na légei o katheís «egó̱»? Ótan ago̱nisteí mónos tou kai fkiásei í̱ chalásei, na légei «egó̱»; ótan ómo̱s ago̱nízontai polloí kai fkiánoun, tóte na léne «emeís». Eímaste eis to «emeís» ki óchi eis to «egó̱». Kai eis to exí̱s na máthomen gnó̱si̱, an thélomen na fkiásomen cho̱rión, na zí̱somen óloi mazí.
25
+
26
+ Giánni̱s Makrygiánni̱s.
27
+
28
+
29
+ - source: ΑΘΗΝΑ
30
+ expected: ATHI̱NA
31
+ - source: μπαμπάκι
32
+ expected: bampáki
33
+ - source: νταντά
34
+ expected: ntantá
35
+ - source: γκέγκε
36
+ expected: gkégke
37
+ - source: Γκαμπόν
38
+ expected: Gkampón
39
+ - source: Μάγχη
40
+ expected: Máṉchi̱
41
+ - source: κογξ
42
+ expected: koṉx
43
+ - source: υιός
44
+ expected: yiós
45
+ - source: Υιός
46
+ expected: Yiós
47
+ - source: νεράντζι
48
+ expected: nerántzi
49
+ - source: Γοίθιος
50
+ expected: Goíthios
51
+ - source: μπέικον
52
+ expected: béïkon
53
+ - source: μπέϊκον
54
+ expected: béïkon
55
+ - source: βόλεϊ
56
+ expected: vóleï
57
+ - source: αθεΐα
58
+ expected: atheḯa
59
+ - source: Εϊγιαφιάτλαγιοκουτλ
60
+ expected: Eïgiafiátlagiokoutl
61
+ - source: Εΐτζι
62
+ expected: Eḯtzi
63
+ - source: Μυρτώο
64
+ expected: Myrtó̱o
65
+ - source: αέρας
66
+ expected: aéras
67
+ - source: γαυ γαυ
68
+ expected: gaf̱ gaf̱
69
+ - source: Ταΰγετος
70
+ expected: Taÿ́getos
71
+ - source: σπρέυ
72
+ expected: spréy
73
+
74
+ - source: Αθήνα
75
+ expected: Athí̱na
76
+ - source: Άγιον Όρος
77
+ expected: Ágion Óros
78
+ - source: Άγραφα
79
+ expected: Ágrafa
80
+ - source: Αγρίνιο
81
+ expected: Agrínio
82
+ - source: Αίγινα
83
+ expected: Aígina
84
+ - source: Αίγιο
85
+ expected: Aígio
86
+ - source: Αλεξανδρούπολη
87
+ expected: Alexandroúpoli̱
88
+ - source: Αλεποχώρι
89
+ expected: Alepochó̱ri
90
+ - source: Αμοργός
91
+ expected: Amorgós
92
+ - source: Άμφισσα
93
+ expected: Ámfissa
94
+ - source: Αράχωβα
95
+ expected: Arácho̱va
96
+ - source: Άργος
97
+ expected: Árgos
98
+ - source: Αρκαδία
99
+ expected: Arkadía
100
+ - source: Άρτα
101
+ expected: Árta
102
+ - source: Βελούχι
103
+ expected: Veloúchi
104
+ - source: Βέροια
105
+ expected: Véroia
106
+ - source: Βοιωτία
107
+ expected: Voio̱tía
108
+ - source: Βόλος
109
+ expected: Vólos
110
+ - source: Βόνιτσα
111
+ expected: Vónitsa
112
+ - source: Γαλαξίδι
113
+ expected: Galaxídi
114
+ - source: Γαλάτσι
115
+ expected: Galátsi
116
+ - source: Γιαννιτσά
117
+ expected: Giannitsá
118
+ - source: Γλυφάδα
119
+ expected: Glyfáda
120
+ - source: Γρανίτσα
121
+ expected: Granítsa
122
+ - source: Γρεβενά
123
+ expected: Grevená
124
+ - source: Γύθειο
125
+ expected: Gýtheio
126
+ - source: Διόνυσος
127
+ expected: Diónysos
128
+ - source: Δίστομο
129
+ expected: Dístomo
130
+ - source: Δολιανά
131
+ expected: Dolianá
132
+ - source: Δράμα
133
+ expected: Dráma
134
+ - source: Δωδεκάνησα
135
+ expected: Do̱dekáni̱sa
136
+ - source: Έδεσσα
137
+ expected: Édessa
138
+ - source: Ελευσίνα
139
+ expected: Elef̱sína
140
+ - source: Επίδαυρος
141
+ expected: Epídav̱ros
142
+ - source: Επτάνησα
143
+ expected: Eptáni̱sa
144
+ - source: Ερμούπολη
145
+ expected: Ermoúpoli̱
146
+ - source: Εύβοια
147
+ expected: Év̱voia
148
+ - source: Ζάκυνθος
149
+ expected: Zákynthos
150
+ - source: Ήπειρος
151
+ expected: Í̱peiros
152
+ - source: Ηράκλειο
153
+ expected: I̱rákleio
154
+ - source: Θάσος
155
+ expected: Thásos
156
+ - source: Θεσσαλονίκη
157
+ expected: Thessaloníki̱
158
+ - source: Θεσσαλία
159
+ expected: Thessalía
160
+ - source: Θεσπρωτία
161
+ expected: Thespro̱tía
162
+ - source: Θήβα
163
+ expected: Thí̱va
164
+ - source: Θράκη
165
+ expected: Thráki̱
166
+ - source: Ιθάκη
167
+ expected: Itháki̱
168
+ - source: Ίος
169
+ expected: Íos
170
+ - source: Ιωάννινα
171
+ expected: Io̱ánnina
172
+ - source: Καβάλα
173
+ expected: Kavála
174
+ - source: Καλάβρυτα
175
+ expected: Kalávryta
176
+ - source: Καλαμάτα
177
+ expected: Kalamáta
178
+ - source: Καλαμπάκα
179
+ expected: Kalampáka
180
+ - source: Καλύβια
181
+ expected: Kalývia
182
+ - source: Κάλυμνος
183
+ expected: Kálymnos
184
+ - source: Καρδίτσα
185
+ expected: Kardítsa
186
+ - source: Καρπενήσι
187
+ expected: Karpení̱si
188
+ - source: Κάρυστος
189
+ expected: Kárystos
190
+ - source: Καστελλόριζο
191
+ expected: Kastellórizo
192
+ - source: Καστοριά
193
+ expected: Kastoriá
194
+ - source: Κατερίνη
195
+ expected: Kateríni̱
196
+ - source: Κάτω Αχαΐα
197
+ expected: Káto̱ Achaḯa
198
+ - source: Κερατέα
199
+ expected: Keratéa
200
+ - source: Κέρκυρα
201
+ expected: Kérkyra
202
+ - source: Κεφαλλονιά
203
+ expected: Kefalloniá
204
+ - source: Κηφισιά
205
+ expected: Ki̱fisiá
206
+ - source: Κιλκίς
207
+ expected: Kilkís
208
+ - source: Κοζάνη
209
+ expected: Kozáni̱
210
+ - source: Κολωνός
211
+ expected: Kolo̱nós
212
+ - source: Κομοτηνή
213
+ expected: Komoti̱ní̱
214
+ - source: Κόρινθος
215
+ expected: Kórinthos
216
+ - source: Κορώνη
217
+ expected: Koró̱ni̱
218
+ - source: Κρανίδι
219
+ expected: Kranídi
220
+ - source: Κρέστενα
221
+ expected: Kréstena
222
+ - source: Κρήτη
223
+ expected: Krí̱ti̱
224
+ - source: Κύθηρα
225
+ expected: Kýthi̱ra
226
+ - source: Κυκλάδες
227
+ expected: Kykládes
228
+ - source: Κύμη
229
+ expected: Kými̱
230
+ - source: Κυψέλη
231
+ expected: Kypséli̱
232
+ - source: Κως
233
+ expected: Ko̱s
234
+ - source: Λαγκαδάς
235
+ expected: Lagkadás
236
+ - source: Λαμία
237
+ expected: Lamía
238
+ - source: Λάρισα
239
+ expected: Lárisa
240
+ - source: Λαύριο
241
+ expected: Láv̱rio
242
+ - source: Λέρος
243
+ expected: Léros
244
+ - source: Λέσβος
245
+ expected: Lésvos
246
+ - source: Λευκάδα
247
+ expected: Lef̱káda
248
+ - source: Λήμνος
249
+ expected: Lí̱mnos
250
+ - source: Λιβαδειά
251
+ expected: Livadeiá
252
+ - source: Μακεδονία
253
+ expected: Makedonía
254
+ - source: Μάνη
255
+ expected: Máni̱
256
+ - source: Μαραθώνας
257
+ expected: Marathó̱nas
258
+ - source: Μαρκόπουλο
259
+ expected: Markópoulo
260
+ - source: Μαρούσι
261
+ expected: Maroúsi
262
+ - source: Μέγαρα
263
+ expected: Mégara
264
+ - source: Μεσολόγγι
265
+ expected: Mesolóṉgi
266
+ - source: Μεταξουργείο
267
+ expected: Metaxourgeío
268
+ - source: Μέτσοβο
269
+ expected: Métsovo
270
+ - source: Μήλος
271
+ expected: Mí̱los
272
+ - source: Μύκονος
273
+ expected: Mýkonos
274
+ - source: Μυστράς
275
+ expected: Mystrás
276
+ - source: Μυτιλήνη
277
+ expected: Mytilí̱ni̱
278
+ - source: Νάξος
279
+ expected: Náxos
280
+ - source: Νάουσα
281
+ expected: Náousa
282
+ - source: Ναύπακτος
283
+ expected: Náf̱paktos
284
+ - source: Ναύπλιο
285
+ expected: Náf̱plio
286
+ - source: Νέα Σμύρνη
287
+ expected: Néa Smýrni̱
288
+ - source: Νίσυρος
289
+ expected: Nísyros
290
+ - source: Ξάνθη
291
+ expected: Xánthi̱
292
+ - source: Όλυμπος
293
+ expected: Ólympos
294
+ - source: Παγκράτι
295
+ expected: Pagkráti
296
+ - source: Παπάγου
297
+ expected: Papágou
298
+ - source: Πάρος
299
+ expected: Páros
300
+ - source: Πασαλιμάνι
301
+ expected: Pasalimáni
302
+ - source: Πατήσια
303
+ expected: Patí̱sia
304
+ - source: Πάτμος
305
+ expected: Pátmos
306
+ - source: Πάτρα
307
+ expected: Pátra
308
+ - source: Πειραιάς
309
+ expected: Peiraiás
310
+ - source: Πελοπόννησος
311
+ expected: Pelopónni̱sos
312
+ - source: Περιστέρι
313
+ expected: Peristéri
314
+ - source: Πεύκη
315
+ expected: Péf̱ki̱
316
+ - source: Πήλιο
317
+ expected: Pí̱lio
318
+ - source: Πολύγυρος
319
+ expected: Polýgyros
320
+ - source: Πόρος
321
+ expected: Póros
322
+ - source: Πρέβεζα
323
+ expected: Préveza
324
+ - source: Πτολεμαΐδα
325
+ expected: Ptolemaḯda
326
+ - source: Πύλος
327
+ expected: Pýlos
328
+ - source: Πύργος
329
+ expected: Pýrgos
330
+ - source: Ρέθυμνο
331
+ expected: Réthymno
332
+ - source: Ρόδος
333
+ expected: Ródos
334
+ - source: Ρούμελη
335
+ expected: Roúmeli̱
336
+ - source: Σαλαμίνα
337
+ expected: Salamína
338
+ - source: Σαμοθράκη
339
+ expected: Samothráki̱
340
+ - source: Σάμος
341
+ expected: Sámos
342
+ - source: Σαντορίνη
343
+ expected: Santoríni̱
344
+ - source: Σέρρες
345
+ expected: Sérres
346
+ - source: Σίκινος
347
+ expected: Síkinos
348
+ - source: Σίφνος
349
+ expected: Sífnos
350
+ - source: Σκιάθος
351
+ expected: Skiáthos
352
+ - source: Σκόπελος
353
+ expected: Skópelos
354
+ - source: Σούλι
355
+ expected: Soúli
356
+ - source: Σπάρτη
357
+ expected: Spárti̱
358
+ - source: Στερεά Ελλάδα
359
+ expected: Stereá Elláda
360
+ - source: Στύρα
361
+ expected: Stýra
362
+ - source: Σύμη
363
+ expected: Sými̱
364
+ - source: Σύρος
365
+ expected: Sýros
366
+ - source: Σφακιά
367
+ expected: Sfakiá
368
+ - source: Τήλος
369
+ expected: Tí̱los
370
+ - source: Τήνος
371
+ expected: Tí̱nos
372
+ - source: Τρίκαλα
373
+ expected: Tríkala
374
+ - source: Τρίπολη
375
+ expected: Trípoli̱
376
+ - source: Τσακωνιά
377
+ expected: Tsako̱niá
378
+ - source: Ύδρα
379
+ expected: Ýdra
380
+ - source: Φάληρο
381
+ expected: Fáli̱ro
382
+ - source: Φλώρινα
383
+ expected: Fló̱rina
384
+ - source: Φολέγανδρος
385
+ expected: Folégandros
386
+ - source: Χάλκη
387
+ expected: Chálki̱
388
+ - source: Χαλκίδα
389
+ expected: Chalkída
390
+ - source: Χαλάνδρι
391
+ expected: Chalándri
392
+ - source: Χαλκιδική
393
+ expected: Chalkidikí̱
394
+ - source: Χανιά
395
+ expected: Chaniá
396
+ - source: Χίος
397
+ expected: Chíos
398
+ - source: Ψαρά
399
+ expected: Psará
400
+ - source: Αβάνα
401
+ expected: Avána
402
+ - source: Αγγλία
403
+ expected: Aṉglía
404
+ - source: Αϊβαλί
405
+ expected: Aïvalí
406
+ - source: Αλεξάνδρεια
407
+ expected: Alexándreia
408
+ - source: Άμστερνταμ
409
+ expected: Ámsterntam
410
+ - source: Βαυαρία
411
+ expected: Vav̱aría
412
+ - source: Βενετία
413
+ expected: Venetía
414
+ - source: Βερολίνο
415
+ expected: Verolíno
416
+ - source: Βερόνα
417
+ expected: Veróna
418
+ - source: Βιέννη
419
+ expected: Viénni̱
420
+ - source: Γένοβα
421
+ expected: Génova
422
+ - source: Δουβλίνο
423
+ expected: Douvlíno
424
+ - source: Καλαβρία
425
+ expected: Kalavría
426
+ - source: Καλιφόρνια
427
+ expected: Kalifórnia
428
+ - source: Καύκασος
429
+ expected: Káf̱kasos
430
+ - source: Κονγκό
431
+ expected: Kongkó
432
+ - source: Κορσική
433
+ expected: Korsikí̱
434
+ - source: Κουρδιστάν
435
+ expected: Kourdistán
436
+ - source: Κωνσταντινούπολη
437
+ expected: Ko̱nstantinoúpoli̱
438
+ - source: Κατεχόμενη Κύπρος
439
+ expected: Katechómeni̱ Kýpros
440
+ - source: Λαπωνία
441
+ expected: Lapo̱nía
442
+ - source: Λευκωσία
443
+ expected: Lef̱ko̱sía
444
+ - source: Λιβόρνο
445
+ expected: Livórno
446
+ - source: Λονδίνο
447
+ expected: Londíno
448
+ - source: Λυών
449
+ expected: Lyó̱n
450
+ - source: Μάλαγα
451
+ expected: Málaga
452
+ - source: Μασσαλία
453
+ expected: Massalía
454
+ - source: Μικρονησία
455
+ expected: Mikroni̱sía
456
+ - source: Μιλάνο
457
+ expected: Miláno
458
+ - source: Μόσχα
459
+ expected: Móscha
460
+ - source: Μπολόνια
461
+ expected: Bolónia
462
+ - source: Νάπολη
463
+ expected: Nápoli̱
464
+ - source: Νταγκεστάν
465
+ expected: Ntagkestán
466
+ - source: Νέα Υόρκη
467
+ expected: Néa Yórki̱
468
+ - source: Οξφόρδη
469
+ expected: Oxfórdi̱
470
+ - source: Ουαλία
471
+ expected: Oualía
472
+ - source: Παρίσι
473
+ expected: Parísi
474
+ - source: Πάφος
475
+ expected: Páfos
476
+ - source: Πολυνησία
477
+ expected: Polyni̱sía
478
+ - source: Ρώμη
479
+ expected: Ró̱mi̱
480
+ - source: Σαμάρεια
481
+ expected: Samáreia
482
+ - source: Σικελία
483
+ expected: Sikelía
484
+ - source: Σκανδιναβία
485
+ expected: Skandinavía
486
+ - source: Σκόπια
487
+ expected: Skópia
488
+ - source: Σκωτία
489
+ expected: Sko̱tía
490
+ - source: Σμύρνη
491
+ expected: Smýrni̱
492
+ - source: Ταϊτή
493
+ expected: Taïtí̱
494
+ - source: Ταταρστάν
495
+ expected: Tatarstán
496
+ - source: Τζαμάικα
497
+ expected: Tzamáika
498
+ - source: Τηλλυρία
499
+ expected: Ti̱llyría
500
+ - source: Τιρόλο
501
+ expected: Tirólo
502
+ - source: Τορίνο
503
+ expected: Toríno
504
+ - source: Φανάρι
505
+ expected: Fanári
506
+ - source: Φλωρεντία
507
+ expected: Flo̱rentía
508
+ - source: Χαβάη
509
+ expected: Chavái̱
510
+ - source: Χονγκ Κονγκ
511
+ expected: Chongk Kongk
512
+
513
+ map:
514
+ # https://en.wikipedia.org/wiki/Romanization_of_Greek
515
+ rules:
516
+ - pattern: (?<=[ΑαΕεΗη])\u03A5(?=[θΘκΚξΞπΠσΣςτΤφΦχΧψΨ]) # Υ (after Α, Ε, Η)
517
+ result: F̱
518
+ - pattern: (?<=[ΑαΕεΗη])\u03A5(?=\b) # Υ (after Α, Ε, Η)
519
+ result: F̱
520
+ - pattern: (?<=[ΑαΕεΗη])\u03C5(?=[θΘκΚξΞπΠσΣςτΤφΦχΧψΨ]) # υ (after Α, Ε, Η)
521
+ result: f̱
522
+ - pattern: (?<=[ΑαΕεΗη])\u03C5(?=\b) # υ (after Α, Ε, Η)
523
+ result: f̱
524
+ - pattern: (?<=[ΑαΕεΗη])\u03A5(?![θΘκΚξΞπΠσΣςτΤφΦχΧψΨ]|\b) # Υ (after Α, Ε, Η)
525
+ result: V̱
526
+ - pattern: (?<=[ΑαΕεΗη])\u03C5(?![θΘκΚξΞπΠσΣςτΤφΦχΧψΨ]|\b) # υ (after Α, Ε, Η)
527
+ result: v̱
528
+ - pattern: \u0391\u03CD(?=[θΘκΚξΞπΠσΣςτΤφΦχΧψΨ]) # Αύ
529
+ result: Áf̱
530
+ - pattern: \u0391\u03CD(?=\b) # Αύ
531
+ result: Áf̱
532
+ - pattern: \u0391\u03CD(?![θΘκΚξΞπΠσΣςτΤφΦχΧψΨ]|\b) # Αύ
533
+ result: Áv̱
534
+ - pattern: \u03B1\u03CD(?=[θΘκΚξΞπΠσΣςτΤφΦχΧψΨ]) # αύ
535
+ result: áf̱
536
+ - pattern: \u03B1\u03CD(?=\b) # αύ
537
+ result: áf̱
538
+ - pattern: \u03B1\u03CD(?![θΘκΚξΞπΠσΣςτΤφΦχΧψΨ]|\b) # αύ
539
+ result: áv̱
540
+ - pattern: \u0395\u03CD(?=[θΘκΚξΞπΠσΣςτΤφΦχΧψΨ]) # Εύ
541
+ result: Éf̱
542
+ - pattern: \u0395\u03CD(?=\b) # Εύ
543
+ result: Éf̱
544
+ - pattern: \u0395\u03CD(?![θΘκΚξΞπΠσΣςτΤφΦχΧψΨ]|\b) # Εύ
545
+ result: Év̱
546
+ - pattern: \u03B5\u03CD(?=[θΘκΚξΞπΠσΣςτΤφΦχΧψΨ]) # εύ
547
+ result: éf̱
548
+ - pattern: \u03B5\u03CD(?=\b) # εύ
549
+ result: éf̱
550
+ - pattern: \u03B5\u03CD(?![θΘκΚξΞπΠσΣςτΤφΦχΧψΨ]|\b) # εύ
551
+ result: év̱
552
+ - pattern: \u0397\u03CD(?=[θΘκΚξΞπΠσΣςτΤφΦχΧψΨ]) # Ηύ
553
+ result: Í̱f̱
554
+ - pattern: \u0397\u03CD(?=\b) # Ηύ
555
+ result: Í̱f̱
556
+ - pattern: \u0397\u03CD(?![θΘκΚξΞπΠσΣςτΤφΦχΧψΨ]|\b) # Ηύ
557
+ result: Í̱v̱
558
+ - pattern: \u03B7\u03CD(?=[θΘκΚξΞπΠσΣςτΤφΦχΧψΨ]) # ηύ
559
+ result: í̱f̱
560
+ - pattern: \u03B7\u03CD(?=\b) # ηύ
561
+ result: í̱f̱
562
+ - pattern: \u03B7\u03CD(?![θΘκΚξΞπΠσΣςτΤφΦχΧψΨ]|\b) # ηύ
563
+ result: í̱v̱
564
+ - pattern: (?<=[Οο])\u03A5 # Υ (after Ο)
565
+ result: U
566
+ - pattern: (?<=[Οο])\u03C5 # υ (after Ο)
567
+ result: u
568
+ - pattern: (?<=[Οο])\u03CD # ύ (after Ο)
569
+ result: ú
570
+ - pattern: (?<=[ΆάΈέΉήΌό])\u03A5 # Άυ, Έυ, Ήυ, Όυ
571
+ result: Y
572
+ - pattern: (?<=[ΆάΈέΉήΌό])\u03C5 # Άυ, Έυ, Ήυ, Όυ
573
+ result: y
574
+ - pattern: \u0393(?=[ξΞχΧ]) # Γ (before Ξ, Χ)
575
+ result: Ṉ
576
+ - pattern: \u03B3(?=[ξΞχΧ]) # γ (before Ξ, Χ)
577
+ result: ṉ
578
+ - pattern: \u0393[Γγ] # Γ (before Γ)
579
+ result: Ṉg
580
+ - pattern: \u03B3\u03B3 # γ (before Γ)
581
+ result: ṉg
582
+ - pattern: \u0393[Κκ] # Γ (before Κ)
583
+ result: Gk
584
+ - pattern: \u03B3[Κκ] # γ (before Κ)
585
+ result: gk
586
+ - pattern: (?<=\b)\u039C[πΠ] # ΜΠ (initially)
587
+ result: B
588
+ - pattern: (?<=\b)\u03BC[πΠ] # μπ (initially)
589
+ result: b
590
+ - pattern: \u039C[πΠ](?=\b) # ΜΠ (finally)
591
+ result: B
592
+ - pattern: \u03BC[πΠ](?=\b) # μπ (finally)
593
+ result: b
594
+ - pattern: (?<!\b)\u039C[πΠ] # ΜΠ (medially)
595
+ result: Mp
596
+ - pattern: (?<!\b)\u03BC[πΠ] # μπ (medially)
597
+ result: mp
598
+ - pattern: \u037E # ;
599
+ result: "?"
600
+ - pattern: \u003B # ;
601
+ result: "?"
602
+
603
+ characters:
604
+ "\u0027": ""
605
+ "\u0386": "Á" # Ά
606
+ "\u0391": "A" # Α
607
+ "\u0392": "V" # Β
608
+ "\u0393": "G" # Γ
609
+ "\u0394": "D" # Δ
610
+ "\u0395": "E" # Ε
611
+ "\u0395\u03AA": "Εï" # ΕΪ
612
+ "\u0395\u03CA": "Εï" # Εϊ
613
+ "\u0388\u03CA": "Éï" # Έϊ
614
+ "\u0388\u03B9": "Éï" # Έι
615
+ "\u0396": "Z" # Ζ
616
+ "\u0397": "I̱" # Η
617
+ "\u0398": "Th" # Θ
618
+ "\u0399": "I" # Ι
619
+ "\u039A": "K" # Κ
620
+ "\u039B": "L" # Λ
621
+ "\u039C": "M" # Μ
622
+ "\u039D": "N" # Ν
623
+ "\u039E": "X" # Ξ
624
+ "\u039F": "O" # Ο
625
+ "\u03A0": "P" # Π
626
+ "\u03A1": "R" # Ρ
627
+ "\u03A3": "S" # Σ
628
+ "\u03A4": "T" # Τ
629
+ "\u03A5": "Y" # Υ
630
+ "\u03A6": "F" # Φ
631
+ "\u03A7": "Ch" # Χ
632
+ "\u03A8": "Ps" # Ψ
633
+ "\u03A9": "O̱" # Ω
634
+ "\u0388": "É" # Έ
635
+ "\u0389": "Í̱" # Ή
636
+ "\u038A": "Í" # Ί
637
+ "\u038C": "Ó" # Ό
638
+ "\u038E": "Ý" # Ύ
639
+ "\u038F": "Ó̱" # Ώ
640
+ "\u03AA": "Ï" # Ϊ
641
+ "\u03AB": "Ÿ" # Ϋ
642
+
643
+ "\u03AC": "á" # ά
644
+ "\u03B1": "a" # α
645
+ "\u03B2": "v" # β
646
+ "\u03B3": "g" # γ
647
+ "\u03B4": "d" # δ
648
+ "\u03B5": "e" # ε
649
+ "\u03B5\u03CA": "eï" # εϊ
650
+ "\u03AD\u03CA": "éï" # έϊ
651
+ "\u03AD\u03B9": "éï" # έι
652
+ "\u03B6": "z" # ζ
653
+ "\u03B7": "i̱" # η
654
+ "\u03B8": "th" # θ
655
+ "\u03B9": "i" # ι
656
+ "\u03BA": "k" # κ
657
+ "\u03BB": "l" # λ
658
+ "\u03BC": "m" # μ
659
+ "\u03BD": "n" # ν
660
+ "\u03BE": "x" # ξ
661
+ "\u03BF": "o" # ο
662
+ "\u03C0": "p" # π
663
+ "\u03C1": "r" # ρ
664
+ "\u03C3": "s" # σ
665
+ "\u03C2": "s" # ς
666
+ "\u03C4": "t" # τ
667
+ "\u03C5": "y" # υ
668
+ "\u03C6": "f" # φ
669
+ "\u03C7": "ch" # χ
670
+ "\u03C8": "ps" # ψ
671
+ "\u03C9": "o̱" # ω
672
+ "\u03AD": "é" # έ
673
+ "\u03AE": "í̱" # ή
674
+ "\u03AF": "í" # ί
675
+ "\u03CC": "ó" # ό
676
+ "\u03CD": "ý" # ύ
677
+ "\u03CE": "ó̱" # ώ
678
+ "\u03CA": "ï" # ϊ
679
+ "\u03CB": "ÿ" # ϋ
680
+ "\u0390": "ḯ" # ΐ
681
+ "\u03B0": "ÿ́" # ΰ
682
+
683
+ "\u0387": ";" # ·
684
+ "\u00B7": ";" # ·
685
+