interscript 0.1.1 → 0.1.6
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/README.adoc +250 -17
- data/bin/interscript +38 -17
- data/bin/setup +8 -0
- data/lib/__pycache__/g2pwrapper.cpython-38.pyc +0 -0
- data/lib/g2pwrapper.py +34 -0
- data/lib/interscript-opal.rb +2 -0
- data/lib/interscript.rb +138 -20
- data/lib/interscript/command.rb +28 -0
- data/lib/interscript/fs.rb +71 -0
- data/lib/interscript/mapping.rb +142 -0
- data/lib/interscript/opal.rb +27 -0
- data/lib/interscript/opal/maps.js.erb +10 -0
- data/lib/interscript/opal_map_translate.rb +12 -0
- data/lib/interscript/version.rb +1 -1
- data/lib/model-7 +0 -0
- data/lib/tha-pt-b-7 +0 -0
- data/maps/acadsin-zho-Hani-Latn-2002.yaml +38912 -0
- data/maps/alalc-amh-Ethi-Latn-1997.yaml +509 -0
- data/maps/alalc-amh-Ethi-Latn-2011.yaml +138 -0
- data/maps/alalc-ara-Arab-Latn-1997.yaml +1283 -0
- data/maps/alalc-asm-Deva-Latn-1997.yaml +159 -0
- data/maps/alalc-aze-Cyrl-Latn-1997.yaml +141 -0
- data/maps/alalc-bel-Cyrl-Latn-1997.yaml +125 -0
- data/maps/alalc-ben-Beng-Latn-2017.yaml +130 -0
- data/maps/alalc-bul-Cyrl-Latn-1997.yaml +94 -0
- data/maps/alalc-ell-Grek-Latn-1997.yaml +624 -0
- data/maps/alalc-ell-Grek-Latn-2010.yaml +627 -0
- data/maps/alalc-hin-Deva-Latn-2020.yaml +159 -0
- data/maps/alalc-kat-Geok-Latn-1997.yaml +111 -0
- data/maps/alalc-kat-Geor-Latn-1997.yaml +146 -0
- data/maps/alalc-kor-Hang-Latn-1997.yaml +94 -0
- data/maps/alalc-mar-Deva-Latn-1997.yaml +170 -0
- data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +114 -0
- data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +103 -0
- data/maps/alalc-pan-Deva-Latn-1997.yaml +237 -0
- data/maps/alalc-rus-Cyrl-Latn-1997.yaml +221 -0
- data/maps/alalc-rus-Cyrl-Latn-2012.yaml +162 -0
- data/maps/alalc-srp-Cyrl-Latn-1997.yaml +114 -0
- data/maps/alalc-srp-Cyrl-Latn-2013.yaml +135 -0
- data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +141 -0
- data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +16 -0
- data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +283 -0
- data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +174 -0
- data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +169 -0
- data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +292 -0
- data/maps/bgn-kor-Hang-Latn-1943.yaml +31 -0
- data/maps/bgn-kor-Kore-Latn-1943.yaml +31 -0
- data/maps/bgna-bul-Cyrl-Latn-2006.yaml +208 -0
- data/maps/bgna-bul-Cyrl-Latn-2009.yaml +208 -0
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +528 -0
- data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +592 -0
- data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +108 -0
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +104 -0
- data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +184 -0
- data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +285 -0
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +115 -0
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +38 -0
- data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +701 -0
- data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +19 -0
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +257 -0
- data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +127 -0
- data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +42 -0
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +253 -0
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +48 -0
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +48 -0
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +159 -0
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +190 -0
- data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +200 -0
- data/maps/bgnpcgn-per-Arab-Latn-1956.yaml +92 -0
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +314 -0
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +166 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +162 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +208 -0
- data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +7456 -0
- data/maps/bis-asm-Beng-Latn-13194-1991.yaml +159 -0
- data/maps/bis-ben-Beng-Latn-13194-1991.yaml +156 -0
- data/maps/bis-dev-Deva-Latn-13194-1991.yaml +184 -0
- data/maps/bis-gjr-Gujr-Latn-13194-1991.yaml +166 -0
- data/maps/bis-knd-Knda-Latn-13194-1991.yaml +173 -0
- data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +176 -0
- data/maps/bis-ori-Orya-Latn-13194-1991.yaml +160 -0
- data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +175 -0
- data/maps/bis-tel-Telu-Latn-13194-1991.yaml +170 -0
- data/maps/bis-tml-Taml-Latn-13194-1991.yaml +155 -0
- data/maps/by-bel-Cyrl-Latn-1998.yaml +168 -0
- data/maps/by-bel-Cyrl-Latn-2007.yaml +115 -0
- data/maps/dos-nep-Deva-Latn-1997.yaml +33 -0
- data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +684 -0
- data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +680 -0
- data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +19 -0
- data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +31 -0
- data/maps/ggg-kat-Geor-Latn-2002.yaml +88 -0
- data/maps/gki-bel-Cyrl-Latn-1992.yaml +33 -0
- data/maps/gki-bel-Cyrl-Latn-2000.yaml +201 -0
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +186 -0
- data/maps/hk-yue-Hani-Latn-1888.yaml +38497 -0
- data/maps/icao-bel-Cyrl-Latn-9303.yaml +136 -0
- data/maps/icao-bul-Cyrl-Latn-9303.yaml +118 -0
- data/maps/icao-heb-Hebr-Latn-9303.yaml +151 -0
- data/maps/icao-mkd-Cyrl-Latn-9303.yaml +117 -0
- data/maps/icao-per-Arab-Latn-9303.yaml +103 -0
- data/maps/icao-rus-Cyrl-Latn-9303.yaml +117 -0
- data/maps/icao-srp-Cyrl-Latn-9303.yaml +117 -0
- data/maps/icao-ukr-Cyrl-Latn-9303.yaml +119 -0
- data/maps/iso-ara-Arab-Latn-233-1984.yaml +323 -0
- data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +609 -0
- data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +40 -0
- data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +62 -0
- data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +271 -0
- data/maps/iso-tha-Thai-Latn-11940-1998.yaml +109 -0
- data/maps/kp-kor-Hang-Latn-2002.yaml +901 -0
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +44820 -0
- data/maps/mext-jpn-Hrkt-Latn-1954.yaml +411 -0
- data/maps/moct-kor-Hang-Latn-2000.yaml +803 -0
- data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +541 -0
- data/maps/mvd-bel-Cyrl-Latn-2008.yaml +225 -0
- data/maps/mvd-bel-Cyrl-Latn-2010.yaml +63 -0
- data/maps/mvd-rus-Cyrl-Latn-2008.yaml +109 -0
- data/maps/mvd-rus-Cyrl-Latn-2010.yaml +37 -0
- data/maps/nil-kor-Hang-Hang-jamo.yaml +11193 -0
- data/maps/odni-aze-Cyrl-Latn-2015.yaml +144 -0
- data/maps/odni-bel-Cyrl-Latn-2015.yaml +148 -0
- data/maps/odni-bul-Cyrl-Latn-2015.yaml +96 -0
- data/maps/odni-hin-Deva-Latn-2015.yaml +258 -0
- data/maps/odni-kat-Geor-Latn-2015.yaml +87 -0
- data/maps/odni-kaz-Cyrl-Latn-2015.yaml +148 -0
- data/maps/odni-kir-Cyrl-Latn-2015.yaml +136 -0
- data/maps/odni-mkd-Cyrl-Latn-2015.yaml +122 -0
- data/maps/odni-rus-Cyrl-Latn-2015.yaml +77 -0
- data/maps/odni-srp-Cyrl-Latn-2015.yaml +129 -0
- data/maps/odni-tat-Cyrl-Latn-2015.yaml +142 -0
- data/maps/odni-tgk-Cyrl-Latn-2015.yaml +148 -0
- data/maps/odni-uig-Cyrl-Latn-2015.yaml +138 -0
- data/maps/odni-ukr-Cyrl-Latn-2015.yaml +157 -0
- data/maps/odni-urd-Arab-Latn-2015.yaml +221 -0
- data/maps/odni-uzb-Cyrl-Latn-2015.yaml +166 -0
- data/maps/royin-tha-Thai-Latn-1939-generic.yaml +90 -0
- data/maps/royin-tha-Thai-Latn-1968.yaml +179 -0
- data/maps/royin-tha-Thai-Latn-1999-chained.yaml +180 -0
- data/maps/royin-tha-Thai-Latn-1999.yaml +76 -0
- data/maps/sac-zho-Hans-Latn-1979.yaml +24759 -0
- data/maps/ses-ara-Arab-Latn-1930.yaml +279 -0
- data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +222 -0
- data/maps/ua-ukr-Cyrl-Latn-1996.yaml +193 -0
- data/maps/un-ara-Arab-Latn-1971.yaml +139 -0
- data/maps/un-ara-Arab-Latn-1972.yaml +159 -0
- data/maps/un-ara-Arab-Latn-2017.yaml +420 -0
- data/maps/un-bel-Cyrl-Latn-2007.yaml +114 -0
- data/maps/un-ben-Beng-Latn-2016.yaml +534 -0
- data/maps/un-ell-Grek-Latn-1987-tl.yaml +31 -0
- data/maps/un-ell-Grek-Latn-1987-ts.yaml +19 -0
- data/maps/un-ell-Grek-Latn-phonetic-1987.yaml +780 -0
- data/maps/un-mon-Mong-Latn-2013.yaml +99 -0
- data/maps/un-nep-Deva-Latn-1972.yaml +163 -0
- data/maps/un-rus-Cyrl-Latn-1987.yaml +166 -0
- data/maps/un-ukr-Cyrl-Latn-1998.yaml +30 -0
- data/maps/ungegn-amh-Ethi-Latn-2016.yaml +575 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +406 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +386 -0
- data/maps/var-kor-Hang-Latn-mr-1939.yaml +1054 -0
- data/maps/var-kor-Kore-Hang-2013.yaml +59754 -0
- data/maps/var-kor-Kore-Latn-mr-1939.yaml +36 -0
- data/maps/var-tha-Thai-Thai-phonemic.yaml +59 -0
- data/maps/var-tha-Thai-Zsym-ipa.yaml +301 -0
- data/maps/var-zho-Hani-Latn-1979.yaml +38908 -0
- data/spec/interscript/mapping_spec.rb +42 -0
- data/spec/interscript_spec.rb +26 -0
- data/spec/spec_helper.rb +3 -0
- metadata +298 -18
@@ -0,0 +1,323 @@
|
|
1
|
+
---
|
2
|
+
authority_id: iso
|
3
|
+
id: 233-1984
|
4
|
+
language: ara
|
5
|
+
source_script: Arab
|
6
|
+
destination_script: Latn
|
7
|
+
name: ISO 233:1984 Documentation — Transliteration of Arabic characters into Latin characters
|
8
|
+
url:
|
9
|
+
- https://www.iso.org/standard/4117.html
|
10
|
+
- http://transliteration.eki.ee/pdf/Arabic_2.2.pdf
|
11
|
+
- http://www.eki.ee/wgrs/rom1_ar.pdf
|
12
|
+
creation_date: 1984
|
13
|
+
confirmation date: 2018-06
|
14
|
+
description: |
|
15
|
+
Is one of a series of International Standards dealing with
|
16
|
+
the conversion of systems of writing, following the
|
17
|
+
principles of stringent conversion in order to permit
|
18
|
+
international information exchange. Its aim is to provide a
|
19
|
+
means for international communication of written messages
|
20
|
+
in a form which permits the automatic transmission and
|
21
|
+
reconstitution of these by men or machines. Cancels and
|
22
|
+
replaces ISO Recommendation R 233-1961
|
23
|
+
notes:
|
24
|
+
- |
|
25
|
+
Compared with ara-arab-latn-2017, the ISO 233:1984 transliteration gives every character and diacritical mark a unique
|
26
|
+
equivalent and e.g. long vowels in Arabic ā, ī and ū are consequently written a’, iy and uw
|
27
|
+
respectively in the ISO transliteration. Other main correspondences:
|
28
|
+
ث is ṯ instead of th
|
29
|
+
ج is ǧ instead of j
|
30
|
+
ح is ḥ instead of ẖ
|
31
|
+
خ is ẖ instead of kh
|
32
|
+
ذ is ḏ instead of dh
|
33
|
+
ش is š instead of sh
|
34
|
+
ص is ṣ instead of s̱
|
35
|
+
ض is ḍ instead of ḏ
|
36
|
+
ط is ṭ instead of ṯ
|
37
|
+
ظ is ẓ instead of d͟h
|
38
|
+
غ is ġ instead of gh
|
39
|
+
ة is ẗ instead of h/t
|
40
|
+
ى is ỳ
|
41
|
+
ـِي is iy instead of ī
|
42
|
+
ـُو is uw instead of ū
|
43
|
+
ـَا is a’ instead of ā
|
44
|
+
ـَى is aỳ instead of á
|
45
|
+
|
46
|
+
tests:
|
47
|
+
|
48
|
+
- source: مِصر
|
49
|
+
expected: Miṣr
|
50
|
+
|
51
|
+
- source: قَطَر
|
52
|
+
expected: Qaṭar
|
53
|
+
|
54
|
+
- source: الجُمهُورِيَّة العِرَاقِيَّة
|
55
|
+
expected: Al Ǧumhuwriyaẗ al ‘Ira’qiyaẗ
|
56
|
+
|
57
|
+
- source: جُمهُورِيَّة مِصر العَرَبِيَّة
|
58
|
+
expected: Ǧumhuwriyaẗ Miṣr al ‘Arabiyaẗ
|
59
|
+
|
60
|
+
- source: الرِيَاض
|
61
|
+
expected: Ar Riya’ḍ
|
62
|
+
|
63
|
+
- source: الشارِقة
|
64
|
+
expected: Aš Šâriqaẗ
|
65
|
+
|
66
|
+
map:
|
67
|
+
postrules:
|
68
|
+
- pattern: (?<=\b)(?<!\b[‘|’|'])[\u0061-\uFFFF]
|
69
|
+
result: "upcase"
|
70
|
+
# don't capitalize the definite article in the middle of a sentence
|
71
|
+
- pattern : ' At T' # الت
|
72
|
+
result: ' at T'
|
73
|
+
- pattern : ' Aṯ Ṯ' # الث
|
74
|
+
result: ' aṯ Ṯ'
|
75
|
+
- pattern : ' Ad D' # الد
|
76
|
+
result: ' ad D'
|
77
|
+
- pattern : ' Aḏ Ḏ' # الذ
|
78
|
+
result: ' aḏ Ḏ'
|
79
|
+
- pattern : ' Ar R' # الر
|
80
|
+
result: ' ar R'
|
81
|
+
- pattern : ' Az Z' # الز
|
82
|
+
result: ' az Z'
|
83
|
+
- pattern : ' As S' # الس
|
84
|
+
result: ' as S'
|
85
|
+
- pattern : ' Aš Š' # الش
|
86
|
+
result: ' aš Š'
|
87
|
+
- pattern : ' Aṣ Ṣ' # الص
|
88
|
+
result: ' aṣ Ṣ'
|
89
|
+
- pattern : ' Aḍ Ḍ' # الض
|
90
|
+
result: ' aḍ Ḍ'
|
91
|
+
- pattern : ' Aṭ Ṭ' # الط
|
92
|
+
result: ' aṭ Ṭ'
|
93
|
+
- pattern : ' Aẓ Ẓ' # الظ
|
94
|
+
result: ' aẓ Ẓ'
|
95
|
+
- pattern : ' Al L' # الل
|
96
|
+
result: ' al L'
|
97
|
+
- pattern : ' An N' # الن
|
98
|
+
result: ' an N'
|
99
|
+
- pattern: " Al " # ال
|
100
|
+
result: " al "
|
101
|
+
|
102
|
+
characters:
|
103
|
+
|
104
|
+
# pointing
|
105
|
+
'\u064e' : 'a' # َ fatha
|
106
|
+
'\u064e(?=\u0629)' : '' # َ fatha followed by ta' marboota
|
107
|
+
'\u0650' : 'i' # ِ kasra
|
108
|
+
'\u064f' : 'u' # ُ damma
|
109
|
+
'\u0652' : '' # ْ sokoon, see note A below
|
110
|
+
|
111
|
+
# special pointed letters
|
112
|
+
# special pointed letters
|
113
|
+
'\u0639\u064e' : '‘a' # عَ
|
114
|
+
'\u0639\u0650' : '‘i' # عِ
|
115
|
+
'\u0639\u064f' : '‘ū' # عُ
|
116
|
+
# handle MacOS regex difference
|
117
|
+
'\u0639\u064f\u0648' : '‘ū' # عُو damma followed by و
|
118
|
+
|
119
|
+
'\u0650\u064a' : 'iy' # ـِي kasra followed by ي
|
120
|
+
'\u0650\u064a\u0651\u064e' : 'iy' # ـِيَّ
|
121
|
+
'\u0650\u064a(?=\u064e|\u064f)' : 'iy' # ـِي kasra followed by ي
|
122
|
+
'\u064e\u0627' : 'a’' # ـَا fatha followed by ا
|
123
|
+
'\u064e\u0649' : 'aỳ' # ـَى fatha followed by ى which is ا not ي
|
124
|
+
'\u064f\u0648' : 'uw' # ـُو damma followed by و
|
125
|
+
'\u064e\u0648\u0652' : 'aw' # ـَوْ
|
126
|
+
'\u064e\u064a\u0652' : 'ay' # ـَيْ
|
127
|
+
|
128
|
+
# Sun letters
|
129
|
+
|
130
|
+
'\b\u0627\u0644\u062a' : 'at t' # الت
|
131
|
+
'\b\u0627\u0644\u062b' : 'aṯ ṯ' # الث
|
132
|
+
'\b\u0627\u0644\u062f' : 'ad d' # الد
|
133
|
+
'\b\u0627\u0644\u0630' : 'aḏ ḏ' # الذ
|
134
|
+
'\b\u0627\u0644\u0631' : 'ar r' # الر
|
135
|
+
'\b\u0627\u0644\u0632' : 'az z' # الز
|
136
|
+
'\b\u0627\u0644\u0633' : 'as s' # الس
|
137
|
+
'\b\u0627\u0644\u0634' : 'aš š' # الش
|
138
|
+
'\b\u0627\u0644\u0635' : 'aṣ ṣ' # الص
|
139
|
+
'\b\u0627\u0644\u0636' : 'aḍ ḍ' # الض
|
140
|
+
'\b\u0627\u0644\u0637' : 'aṭ ṭ' # الط
|
141
|
+
'\b\u0627\u0644\u0638' : 'aẓ ẓ' # الظ
|
142
|
+
'\b\u0627\u0644\u0644' : 'al l' # الل
|
143
|
+
'\b\u0627\u0644\u0646' : 'an n' # الن
|
144
|
+
|
145
|
+
# ta' marboota is always transliterated as `aẗ` in ISO 233:1984
|
146
|
+
'\u0629' : 'aẗ' # ة in the middle of the sentence
|
147
|
+
|
148
|
+
# Shadda
|
149
|
+
|
150
|
+
|
151
|
+
'\u0628\u0651' : 'bb' # ب
|
152
|
+
'\u062a\u0651' : 'tt' # ت
|
153
|
+
'\u062b\u0651' : 'ṯṯ' # ث
|
154
|
+
'\u062c\u0651' : 'ǧǧ' # ج
|
155
|
+
'\u062d\u0651' : 'ḥḥ' # ح
|
156
|
+
'\u062e\u0651' : 'ẖẖ' # خ
|
157
|
+
'\u062f\u0651' : 'dd' # د
|
158
|
+
'\u0630\u0651' : 'ḏḏ' # ذ
|
159
|
+
'\u0631\u0651' : 'rr' # ر
|
160
|
+
'\u0632\u0651' : 'zz' # ز
|
161
|
+
'\u0633\u0651' : 'ss' # س
|
162
|
+
'\u0634\u0651' : 'šš' # ش
|
163
|
+
'\u0635\u0651' : 'ṣṣ' # ص
|
164
|
+
'\u0636\u0651' : 'ḍḍ' # ض
|
165
|
+
'\u0637\u0651' : 'ṭṭ' # ط
|
166
|
+
'\u0638\u0651' : 'ẓẓ' # ظ
|
167
|
+
'\u063a\u0651' : 'ġġ' # غ
|
168
|
+
'\u0641\u0651' : 'ff' # ف
|
169
|
+
'\u0642\u0651' : 'qq' # ق
|
170
|
+
'\u0643\u0651' : 'kk' # ك
|
171
|
+
'\u0644\u0651' : 'll' # ل
|
172
|
+
'\u0645\u0651' : 'mm' # م
|
173
|
+
'\u0646\u0651' : 'nn' # ن
|
174
|
+
'\u0647\u0651' : 'hh' # ه
|
175
|
+
'\u0648\u0651' : 'ww' # و
|
176
|
+
'\u064a\u0651' : 'yy' # ي
|
177
|
+
|
178
|
+
|
179
|
+
'\u0622' : '’â' # آ
|
180
|
+
|
181
|
+
'\u0627' : 'â' # ا
|
182
|
+
|
183
|
+
'\u0649' : 'ỳ' # ى
|
184
|
+
|
185
|
+
'\u0626' : "'" # ئ
|
186
|
+
|
187
|
+
|
188
|
+
'\u0621' : # ء
|
189
|
+
- '’'
|
190
|
+
- '' # see note A
|
191
|
+
|
192
|
+
'\u0623' : 'a' # أ
|
193
|
+
|
194
|
+
# See note B
|
195
|
+
'\b\u0627\u0644' : 'al ' # ال
|
196
|
+
# '\uFE8E' : '' # ﺎ
|
197
|
+
|
198
|
+
'\u0628' : 'b' # ب
|
199
|
+
'\uFE91' : 'b' # ﺑ
|
200
|
+
'\uFE92' : 'b' # ﺒ
|
201
|
+
'\uFE90' : 'b' # ﺐ
|
202
|
+
|
203
|
+
# See note C
|
204
|
+
'\u062a' : 't' # ت
|
205
|
+
'\ufe97' : 't' # ﺗ
|
206
|
+
'\ufe98' : 't' # ﺘ
|
207
|
+
'\ufe96' : 't' # ﺖ
|
208
|
+
|
209
|
+
'\u062b' : 'ṯ' # ث
|
210
|
+
'\ufe9b' : 'ṯ' # ﺛ
|
211
|
+
'\ufe9c' : 'ṯ' # ﺜ
|
212
|
+
'\ufe9a' : 'ṯ' # ﺚ
|
213
|
+
|
214
|
+
'\u062c' : 'ǧ' # ج
|
215
|
+
'\ufe9f' : 'ǧ' # ﺟ
|
216
|
+
'\ufea0' : 'ǧ' # ﺠ
|
217
|
+
'\ufe9e' : 'ǧ' # ﺞ
|
218
|
+
|
219
|
+
'\u062d' : 'ḥ' # ح
|
220
|
+
'\ufea3' : 'ḥ' # ﺣ
|
221
|
+
'\ufea4' : 'ḥ' # ﺤ
|
222
|
+
'\ufea2' : 'ḥ' # ﺢ
|
223
|
+
|
224
|
+
'\u062e' : 'ẖ' # خ
|
225
|
+
'\ufea7' : 'ẖ' # ﺧ
|
226
|
+
'\ufea8' : 'ẖ' # ﺨ
|
227
|
+
'\ufea6' : 'ẖ' # ﺦ
|
228
|
+
|
229
|
+
'\u062f' : 'd' # د
|
230
|
+
'\ufeaa' : 'd' # ﺪ
|
231
|
+
|
232
|
+
'\u0630' : 'ḏ' # ذ
|
233
|
+
'\ufeac' : 'ḏ' # ﺬ
|
234
|
+
|
235
|
+
'\u0631' : 'r' # ر
|
236
|
+
'\ufeae' : 'r' # ﺮ
|
237
|
+
|
238
|
+
'\u0632' : 'z' # ز
|
239
|
+
'\ufeb0' : 'z' # ﺰ
|
240
|
+
|
241
|
+
'\u0633' : 's' # س
|
242
|
+
'\ufeb3' : 's' # ﺳ
|
243
|
+
'\ufeb4' : 's' # ﺴ
|
244
|
+
'\ufeb2' : 's' # ﺲ
|
245
|
+
|
246
|
+
'\u0634' : 'š' # ش
|
247
|
+
'\ufeb7' : 'š' # ﺷ
|
248
|
+
'\ufeb8' : 'š' # ﺸ
|
249
|
+
'\ufeb6' : 'š' # ﺶ
|
250
|
+
|
251
|
+
'\u0635' : 'ṣ' # ص
|
252
|
+
'\ufebb' : 'ṣ' # ﺻ
|
253
|
+
'\ufebc' : 'ṣ' # ﺼ
|
254
|
+
'\ufeba' : 'ṣ' # ﺺ
|
255
|
+
|
256
|
+
'\u0636' : 'ḍ' # ض
|
257
|
+
'\ufebf' : 'ḍ' # ﺿ
|
258
|
+
'\ufec0' : 'ḍ' # ﻀ
|
259
|
+
'\ufebe' : 'ḍ' # ﺾ
|
260
|
+
|
261
|
+
'\u0637' : 'ṭ' # ط
|
262
|
+
'\ufec3' : 'ṭ' # ﻃ
|
263
|
+
'\ufec4' : 'ṭ' # ﻄ
|
264
|
+
'\ufec2' : 'ṭ' # ﻂ
|
265
|
+
|
266
|
+
'\u0638' : 'ẓ' # ظ
|
267
|
+
'\ufec7' : 'ẓ' # ﻇ
|
268
|
+
'\ufec8' : 'ẓ' # ﻈ
|
269
|
+
'\ufec6' : 'ẓ' # ﻆ
|
270
|
+
|
271
|
+
'\u0639' : '‘' # ع
|
272
|
+
'\ufecb' : '‘' # ﻋ
|
273
|
+
'\ufecc' : '‘' # ﻌ
|
274
|
+
'\ufeca' : '‘' # ﻊ
|
275
|
+
|
276
|
+
'\u063a' : 'ġ' # غ
|
277
|
+
'\ufecf' : 'ġ' # ﻏ
|
278
|
+
'\ufed0' : 'ġ' # ﻐ
|
279
|
+
'\ufece' : 'ġ' # ﻎ
|
280
|
+
|
281
|
+
'\u0641' : 'f' # ف
|
282
|
+
'\ufed3' : 'f' # ﻓ
|
283
|
+
'\ufed4' : 'f' # ﻔ
|
284
|
+
'\ufed2' : 'f' # ﻒ
|
285
|
+
|
286
|
+
'\u0642' : 'q' # ق
|
287
|
+
'\ufed7' : 'q' # ﻗ
|
288
|
+
'\ufed8' : 'q' # ﻘ
|
289
|
+
'\ufed6' : 'q' # ﻖ
|
290
|
+
|
291
|
+
'\u0643' : 'k' # ك
|
292
|
+
'\ufedb' : 'k' # ﻛ
|
293
|
+
'\ufedc' : 'k' # ﻜ
|
294
|
+
'\ufeda' : 'k' # ﻚ
|
295
|
+
|
296
|
+
'\u0644' : 'l' # ل
|
297
|
+
'\ufedf' : 'l' # ﻟ
|
298
|
+
'\ufee0' : 'l' # ﻠ
|
299
|
+
'\ufede' : 'l' # ﻞ
|
300
|
+
|
301
|
+
'\u0645' : 'm' # م
|
302
|
+
'\ufee3' : 'm' # ﻣ
|
303
|
+
'\ufee4' : 'm' # ﻤ
|
304
|
+
'\ufee2' : 'm' # ﻢ
|
305
|
+
|
306
|
+
'\u0646' : 'n' # ن
|
307
|
+
'\ufee7' : 'n' # ﻧ
|
308
|
+
'\ufee8' : 'n' # ﻨ
|
309
|
+
'\ufee6' : 'n' # ﻦ
|
310
|
+
|
311
|
+
# See note C
|
312
|
+
'\u0647' : 'h' # ه
|
313
|
+
'\ufeeb' : 'h' # ﻫ
|
314
|
+
'\ufeec' : 'h' # ﻬ
|
315
|
+
'\ufeea' : 'h' # ﻪ
|
316
|
+
|
317
|
+
'\u0648' : 'w' # و
|
318
|
+
'\ufeee' : 'w' # ﻮ
|
319
|
+
|
320
|
+
'\u064a' : 'y' # ي
|
321
|
+
'\ufef3' : 'y' # ﻳ
|
322
|
+
'\ufef4' : 'y' # ﻴ
|
323
|
+
'\ufef1' : 'y' # ﻱ
|
@@ -0,0 +1,609 @@
|
|
1
|
+
---
|
2
|
+
authority_id: iso
|
3
|
+
id: 1997
|
4
|
+
language: ell
|
5
|
+
source_script: Grek
|
6
|
+
destination_script: Latn
|
7
|
+
name: ISO 843:1997
|
8
|
+
url:
|
9
|
+
creation_date: 1997
|
10
|
+
description: |
|
11
|
+
ISO Transliteration table for Greek
|
12
|
+
|
13
|
+
note:
|
14
|
+
- Transliteration of Greek into Latin: Type 1, Clause 3 Table 1
|
15
|
+
- Equivalent to elot-ell-Grek-Latn-743-2001-ts, the transliteration table of ELOT 743:2001
|
16
|
+
- Assuming that ou, au, eu transliterations are only intended for historical diphthongs /u, av, ev/, and that όυ, άυ, έυ are not to be transliterated as ou, au, eu
|
17
|
+
- Introduced casing to digamma and lunate sigma. (Casing was a late introduction to character sets for those characters)
|
18
|
+
|
19
|
+
tests:
|
20
|
+
|
21
|
+
- source: |
|
22
|
+
Ένα πράμα μόνον με παρακίνησε κι εμένα να γράψω ότι τούτην την πατρίδα την έχομεν όλοι μαζί, και σοφοί κι αμαθείς και πλούσιοι και φτωχοί και πολιτικοί και στρατιωτικοί και οι πλέον μικρότεροι άνθρωποι· όσοι αγωνιστήκαμεν, αναλόγως ο καθείς, έχομεν να ζήσομεν εδώ. Το λοιπόν δουλέψαμεν όλοι μαζί, να την φυλάμεν κι όλοι μαζί και να μην λέγει ούτε ο δυνατός «εγώ» ούτε ο αδύνατος. Ξέρετε πότε να λέγει ο καθείς «εγώ»; Όταν αγωνιστεί μόνος του και φκιάσει ή χαλάσει, να λέγει «εγώ»· όταν όμως αγωνίζονται πολλοί και φκιάνουν, τότε να λένε «εμείς». Είμαστε εις το «εμείς» κι όχι εις το «εγώ». Και εις το εξής να μάθομεν γνώση, αν θέλομεν να φκιάσομεν χωριόν, να ζήσομεν όλοι μαζί.
|
23
|
+
|
24
|
+
Γιάννης Μακρυγιάννης.
|
25
|
+
|
26
|
+
expected: |
|
27
|
+
Éna práma mónon me parakínīse ki eména na grápsō óti toútīn tīn patrída tīn échomen óloi mazí, kai sofoí ki amatheís kai ploúsioi kai ftōchoí kai politikoí kai stratiōtikoí kai oi pléon mikróteroi ánthrōpoi; ósoi agōnistī́kamen, analógōs o katheís, échomen na zī́somen edṓ. To loipón doulépsamen óloi mazí, na tīn fylámen ki óloi mazí kai na mīn légei oúte o dynatós «egṓ» oúte o adýnatos. Xérete póte na légei o katheís «egṓ»? Ótan agōnisteí mónos tou kai fkiásei ī́ chalásei, na légei «egṓ»; ótan ómōs agōnízontai polloí kai fkiánoun, tóte na léne «emeís». Eímaste eis to «emeís» ki óchi eis to «egṓ». Kai eis to exī́s na máthomen gnṓsī, an thélomen na fkiásomen chōrión, na zī́somen óloi mazí.
|
28
|
+
|
29
|
+
Giánnīs Makrygiánnīs.
|
30
|
+
|
31
|
+
|
32
|
+
- source: ΑΘΗΝΑ
|
33
|
+
expected: ATHĪNA
|
34
|
+
- source: μπαμπάκι
|
35
|
+
expected: mpampáki
|
36
|
+
- source: νταντά
|
37
|
+
expected: ntantá
|
38
|
+
- source: γκέγκε
|
39
|
+
expected: gkégke
|
40
|
+
- source: Γκαμπόν
|
41
|
+
expected: Gkampón
|
42
|
+
- source: Μάγχη
|
43
|
+
expected: Mágchī
|
44
|
+
- source: κογξ
|
45
|
+
expected: kogx
|
46
|
+
- source: υιός
|
47
|
+
expected: yiós
|
48
|
+
- source: Υιός
|
49
|
+
expected: Yiós
|
50
|
+
- source: νεράντζι
|
51
|
+
expected: nerántzi
|
52
|
+
- source: Γοίθιος
|
53
|
+
expected: Goíthios
|
54
|
+
- source: μπέικον
|
55
|
+
expected: mpéikon
|
56
|
+
- source: μπέϊκον
|
57
|
+
expected: mpéïkon
|
58
|
+
- source: βόλεϊ
|
59
|
+
expected: vóleï
|
60
|
+
- source: αθεΐα
|
61
|
+
expected: atheḯa
|
62
|
+
- source: Εϊγιαφιάτλαγιοκουτλ
|
63
|
+
expected: Eïgiafiátlagiokoutl
|
64
|
+
- source: Εΐτζι
|
65
|
+
expected: Eḯtzi
|
66
|
+
- source: Μυρτώο
|
67
|
+
expected: Myrtṓo
|
68
|
+
- source: αέρας
|
69
|
+
expected: aéras
|
70
|
+
- source: γαυ γαυ
|
71
|
+
expected: gau gau
|
72
|
+
- source: Ταΰγετος
|
73
|
+
expected: Taÿ́getos
|
74
|
+
- source: σπρέυ
|
75
|
+
expected: spréy
|
76
|
+
|
77
|
+
- source: Αθήνα
|
78
|
+
expected: Athī́na
|
79
|
+
- source: Άγιον Όρος
|
80
|
+
expected: Ágion Óros
|
81
|
+
- source: Άγραφα
|
82
|
+
expected: Ágrafa
|
83
|
+
- source: Αγρίνιο
|
84
|
+
expected: Agrínio
|
85
|
+
- source: Αίγινα
|
86
|
+
expected: Aígina
|
87
|
+
- source: Αίγιο
|
88
|
+
expected: Aígio
|
89
|
+
- source: Αλεξανδρούπολη
|
90
|
+
expected: Alexandroúpolī
|
91
|
+
- source: Αλεποχώρι
|
92
|
+
expected: Alepochṓri
|
93
|
+
- source: Αμοργός
|
94
|
+
expected: Amorgós
|
95
|
+
- source: Άμφισσα
|
96
|
+
expected: Ámfissa
|
97
|
+
- source: Αράχωβα
|
98
|
+
expected: Aráchōva
|
99
|
+
- source: Άργος
|
100
|
+
expected: Árgos
|
101
|
+
- source: Αρκαδία
|
102
|
+
expected: Arkadía
|
103
|
+
- source: Άρτα
|
104
|
+
expected: Árta
|
105
|
+
- source: Βελούχι
|
106
|
+
expected: Veloúchi
|
107
|
+
- source: Βέροια
|
108
|
+
expected: Véroia
|
109
|
+
- source: Βοιωτία
|
110
|
+
expected: Voiōtía
|
111
|
+
- source: Βόλος
|
112
|
+
expected: Vólos
|
113
|
+
- source: Βόνιτσα
|
114
|
+
expected: Vónitsa
|
115
|
+
- source: Γαλαξίδι
|
116
|
+
expected: Galaxídi
|
117
|
+
- source: Γαλάτσι
|
118
|
+
expected: Galátsi
|
119
|
+
- source: Γιαννιτσά
|
120
|
+
expected: Giannitsá
|
121
|
+
- source: Γλυφάδα
|
122
|
+
expected: Glyfáda
|
123
|
+
- source: Γρανίτσα
|
124
|
+
expected: Granítsa
|
125
|
+
- source: Γρεβενά
|
126
|
+
expected: Grevená
|
127
|
+
- source: Γύθειο
|
128
|
+
expected: Gýtheio
|
129
|
+
- source: Διόνυσος
|
130
|
+
expected: Diónysos
|
131
|
+
- source: Δίστομο
|
132
|
+
expected: Dístomo
|
133
|
+
- source: Δολιανά
|
134
|
+
expected: Dolianá
|
135
|
+
- source: Δράμα
|
136
|
+
expected: Dráma
|
137
|
+
- source: Δωδεκάνησα
|
138
|
+
expected: Dōdekánīsa
|
139
|
+
- source: Έδεσσα
|
140
|
+
expected: Édessa
|
141
|
+
- source: Ελευσίνα
|
142
|
+
expected: Eleusína
|
143
|
+
- source: Επίδαυρος
|
144
|
+
expected: Epídauros
|
145
|
+
- source: Επτάνησα
|
146
|
+
expected: Eptánīsa
|
147
|
+
- source: Ερμούπολη
|
148
|
+
expected: Ermoúpolī
|
149
|
+
- source: Εύβοια
|
150
|
+
expected: Eúvoia
|
151
|
+
- source: Ζάκυνθος
|
152
|
+
expected: Zákynthos
|
153
|
+
- source: Ήπειρος
|
154
|
+
expected: Ī́peiros
|
155
|
+
- source: Ηράκλειο
|
156
|
+
expected: Īrákleio
|
157
|
+
- source: Θάσος
|
158
|
+
expected: Thásos
|
159
|
+
- source: Θεσσαλονίκη
|
160
|
+
expected: Thessaloníkī
|
161
|
+
- source: Θεσσαλία
|
162
|
+
expected: Thessalía
|
163
|
+
- source: Θεσπρωτία
|
164
|
+
expected: Thesprōtía
|
165
|
+
- source: Θήβα
|
166
|
+
expected: Thī́va
|
167
|
+
- source: Θράκη
|
168
|
+
expected: Thrákī
|
169
|
+
- source: Ιθάκη
|
170
|
+
expected: Ithákī
|
171
|
+
- source: Ίος
|
172
|
+
expected: Íos
|
173
|
+
- source: Ιωάννινα
|
174
|
+
expected: Iōánnina
|
175
|
+
- source: Καβάλα
|
176
|
+
expected: Kavála
|
177
|
+
- source: Καλάβρυτα
|
178
|
+
expected: Kalávryta
|
179
|
+
- source: Καλαμάτα
|
180
|
+
expected: Kalamáta
|
181
|
+
- source: Καλαμπάκα
|
182
|
+
expected: Kalampáka
|
183
|
+
- source: Καλύβια
|
184
|
+
expected: Kalývia
|
185
|
+
- source: Κάλυμνος
|
186
|
+
expected: Kálymnos
|
187
|
+
- source: Καρδίτσα
|
188
|
+
expected: Kardítsa
|
189
|
+
- source: Καρπενήσι
|
190
|
+
expected: Karpenī́si
|
191
|
+
- source: Κάρυστος
|
192
|
+
expected: Kárystos
|
193
|
+
- source: Καστελλόριζο
|
194
|
+
expected: Kastellórizo
|
195
|
+
- source: Καστοριά
|
196
|
+
expected: Kastoriá
|
197
|
+
- source: Κατερίνη
|
198
|
+
expected: Katerínī
|
199
|
+
- source: Κάτω Αχαΐα
|
200
|
+
expected: Kátō Achaḯa
|
201
|
+
- source: Κερατέα
|
202
|
+
expected: Keratéa
|
203
|
+
- source: Κέρκυρα
|
204
|
+
expected: Kérkyra
|
205
|
+
- source: Κεφαλλονιά
|
206
|
+
expected: Kefalloniá
|
207
|
+
- source: Κηφισιά
|
208
|
+
expected: Kīfisiá
|
209
|
+
- source: Κιλκίς
|
210
|
+
expected: Kilkís
|
211
|
+
- source: Κοζάνη
|
212
|
+
expected: Kozánī
|
213
|
+
- source: Κολωνός
|
214
|
+
expected: Kolōnós
|
215
|
+
- source: Κομοτηνή
|
216
|
+
expected: Komotīnī́
|
217
|
+
- source: Κόρινθος
|
218
|
+
expected: Kórinthos
|
219
|
+
- source: Κορώνη
|
220
|
+
expected: Korṓnī
|
221
|
+
- source: Κρανίδι
|
222
|
+
expected: Kranídi
|
223
|
+
- source: Κρέστενα
|
224
|
+
expected: Kréstena
|
225
|
+
- source: Κρήτη
|
226
|
+
expected: Krī́tī
|
227
|
+
- source: Κύθηρα
|
228
|
+
expected: Kýthīra
|
229
|
+
- source: Κυκλάδες
|
230
|
+
expected: Kykládes
|
231
|
+
- source: Κύμη
|
232
|
+
expected: Kýmī
|
233
|
+
- source: Κυψέλη
|
234
|
+
expected: Kypsélī
|
235
|
+
- source: Κως
|
236
|
+
expected: Kōs
|
237
|
+
- source: Λαγκαδάς
|
238
|
+
expected: Lagkadás
|
239
|
+
- source: Λαμία
|
240
|
+
expected: Lamía
|
241
|
+
- source: Λάρισα
|
242
|
+
expected: Lárisa
|
243
|
+
- source: Λαύριο
|
244
|
+
expected: Laúrio
|
245
|
+
- source: Λέρος
|
246
|
+
expected: Léros
|
247
|
+
- source: Λέσβος
|
248
|
+
expected: Lésvos
|
249
|
+
- source: Λευκάδα
|
250
|
+
expected: Leukáda
|
251
|
+
- source: Λήμνος
|
252
|
+
expected: Lī́mnos
|
253
|
+
- source: Λιβαδειά
|
254
|
+
expected: Livadeiá
|
255
|
+
- source: Μακεδονία
|
256
|
+
expected: Makedonía
|
257
|
+
- source: Μάνη
|
258
|
+
expected: Mánī
|
259
|
+
- source: Μαραθώνας
|
260
|
+
expected: Marathṓnas
|
261
|
+
- source: Μαρκόπουλο
|
262
|
+
expected: Markópoulo
|
263
|
+
- source: Μαρούσι
|
264
|
+
expected: Maroúsi
|
265
|
+
- source: Μέγαρα
|
266
|
+
expected: Mégara
|
267
|
+
- source: Μεσολόγγι
|
268
|
+
expected: Mesológgi
|
269
|
+
- source: Μεταξουργείο
|
270
|
+
expected: Metaxourgeío
|
271
|
+
- source: Μέτσοβο
|
272
|
+
expected: Métsovo
|
273
|
+
- source: Μήλος
|
274
|
+
expected: Mī́los
|
275
|
+
- source: Μύκονος
|
276
|
+
expected: Mýkonos
|
277
|
+
- source: Μυστράς
|
278
|
+
expected: Mystrás
|
279
|
+
- source: Μυτιλήνη
|
280
|
+
expected: Mytilī́nī
|
281
|
+
- source: Νάξος
|
282
|
+
expected: Náxos
|
283
|
+
- source: Νάουσα
|
284
|
+
expected: Náousa
|
285
|
+
- source: Ναύπακτος
|
286
|
+
expected: Naúpaktos
|
287
|
+
- source: Ναύπλιο
|
288
|
+
expected: Naúplio
|
289
|
+
- source: Νέα Σμύρνη
|
290
|
+
expected: Néa Smýrnī
|
291
|
+
- source: Νίσυρος
|
292
|
+
expected: Nísyros
|
293
|
+
- source: Ξάνθη
|
294
|
+
expected: Xánthī
|
295
|
+
- source: Όλυμπος
|
296
|
+
expected: Ólympos
|
297
|
+
- source: Παγκράτι
|
298
|
+
expected: Pagkráti
|
299
|
+
- source: Παπάγου
|
300
|
+
expected: Papágou
|
301
|
+
- source: Πάρος
|
302
|
+
expected: Páros
|
303
|
+
- source: Πασαλιμάνι
|
304
|
+
expected: Pasalimáni
|
305
|
+
- source: Πατήσια
|
306
|
+
expected: Patī́sia
|
307
|
+
- source: Πάτμος
|
308
|
+
expected: Pátmos
|
309
|
+
- source: Πάτρα
|
310
|
+
expected: Pátra
|
311
|
+
- source: Πειραιάς
|
312
|
+
expected: Peiraiás
|
313
|
+
- source: Πελοπόννησος
|
314
|
+
expected: Pelopónnīsos
|
315
|
+
- source: Περιστέρι
|
316
|
+
expected: Peristéri
|
317
|
+
- source: Πεύκη
|
318
|
+
expected: Peúkī
|
319
|
+
- source: Πήλιο
|
320
|
+
expected: Pī́lio
|
321
|
+
- source: Πολύγυρος
|
322
|
+
expected: Polýgyros
|
323
|
+
- source: Πόρος
|
324
|
+
expected: Póros
|
325
|
+
- source: Πρέβεζα
|
326
|
+
expected: Préveza
|
327
|
+
- source: Πτολεμαΐδα
|
328
|
+
expected: Ptolemaḯda
|
329
|
+
- source: Πύλος
|
330
|
+
expected: Pýlos
|
331
|
+
- source: Πύργος
|
332
|
+
expected: Pýrgos
|
333
|
+
- source: Ρέθυμνο
|
334
|
+
expected: Réthymno
|
335
|
+
- source: Ρόδος
|
336
|
+
expected: Ródos
|
337
|
+
- source: Ρούμελη
|
338
|
+
expected: Roúmelī
|
339
|
+
- source: Σαλαμίνα
|
340
|
+
expected: Salamína
|
341
|
+
- source: Σαμοθράκη
|
342
|
+
expected: Samothrákī
|
343
|
+
- source: Σάμος
|
344
|
+
expected: Sámos
|
345
|
+
- source: Σαντορίνη
|
346
|
+
expected: Santorínī
|
347
|
+
- source: Σέρρες
|
348
|
+
expected: Sérres
|
349
|
+
- source: Σίκινος
|
350
|
+
expected: Síkinos
|
351
|
+
- source: Σίφνος
|
352
|
+
expected: Sífnos
|
353
|
+
- source: Σκιάθος
|
354
|
+
expected: Skiáthos
|
355
|
+
- source: Σκόπελος
|
356
|
+
expected: Skópelos
|
357
|
+
- source: Σούλι
|
358
|
+
expected: Soúli
|
359
|
+
- source: Σπάρτη
|
360
|
+
expected: Spártī
|
361
|
+
- source: Στερεά Ελλάδα
|
362
|
+
expected: Stereá Elláda
|
363
|
+
- source: Στύρα
|
364
|
+
expected: Stýra
|
365
|
+
- source: Σύμη
|
366
|
+
expected: Sýmī
|
367
|
+
- source: Σύρος
|
368
|
+
expected: Sýros
|
369
|
+
- source: Σφακιά
|
370
|
+
expected: Sfakiá
|
371
|
+
- source: Τήλος
|
372
|
+
expected: Tī́los
|
373
|
+
- source: Τήνος
|
374
|
+
expected: Tī́nos
|
375
|
+
- source: Τρίκαλα
|
376
|
+
expected: Tríkala
|
377
|
+
- source: Τρίπολη
|
378
|
+
expected: Trípolī
|
379
|
+
- source: Τσακωνιά
|
380
|
+
expected: Tsakōniá
|
381
|
+
- source: Ύδρα
|
382
|
+
expected: Ýdra
|
383
|
+
- source: Φάληρο
|
384
|
+
expected: Fálīro
|
385
|
+
- source: Φλώρινα
|
386
|
+
expected: Flṓrina
|
387
|
+
- source: Φολέγανδρος
|
388
|
+
expected: Folégandros
|
389
|
+
- source: Χάλκη
|
390
|
+
expected: Chálkī
|
391
|
+
- source: Χαλκίδα
|
392
|
+
expected: Chalkída
|
393
|
+
- source: Χαλάνδρι
|
394
|
+
expected: Chalándri
|
395
|
+
- source: Χαλκιδική
|
396
|
+
expected: Chalkidikī́
|
397
|
+
- source: Χανιά
|
398
|
+
expected: Chaniá
|
399
|
+
- source: Χίος
|
400
|
+
expected: Chíos
|
401
|
+
- source: Ψαρά
|
402
|
+
expected: Psará
|
403
|
+
- source: Αβάνα
|
404
|
+
expected: Avána
|
405
|
+
- source: Αγγλία
|
406
|
+
expected: Agglía
|
407
|
+
- source: Αϊβαλί
|
408
|
+
expected: Aïvalí
|
409
|
+
- source: Αλεξάνδρεια
|
410
|
+
expected: Alexándreia
|
411
|
+
- source: Άμστερνταμ
|
412
|
+
expected: Ámsterntam
|
413
|
+
- source: Βαυαρία
|
414
|
+
expected: Vauaría
|
415
|
+
- source: Βενετία
|
416
|
+
expected: Venetía
|
417
|
+
- source: Βερολίνο
|
418
|
+
expected: Verolíno
|
419
|
+
- source: Βερόνα
|
420
|
+
expected: Veróna
|
421
|
+
- source: Βιέννη
|
422
|
+
expected: Viénnī
|
423
|
+
- source: Γένοβα
|
424
|
+
expected: Génova
|
425
|
+
- source: Δουβλίνο
|
426
|
+
expected: Douvlíno
|
427
|
+
- source: Καλαβρία
|
428
|
+
expected: Kalavría
|
429
|
+
- source: Καλιφόρνια
|
430
|
+
expected: Kalifórnia
|
431
|
+
- source: Καύκασος
|
432
|
+
expected: Kaúkasos
|
433
|
+
- source: Κονγκό
|
434
|
+
expected: Kongkó
|
435
|
+
- source: Κορσική
|
436
|
+
expected: Korsikī́
|
437
|
+
- source: Κουρδιστάν
|
438
|
+
expected: Kourdistán
|
439
|
+
- source: Κωνσταντινούπολη
|
440
|
+
expected: Kōnstantinoúpolī
|
441
|
+
- source: Κατεχόμενη Κύπρος
|
442
|
+
expected: Katechómenī Kýpros
|
443
|
+
- source: Λαπωνία
|
444
|
+
expected: Lapōnía
|
445
|
+
- source: Λευκωσία
|
446
|
+
expected: Leukōsía
|
447
|
+
- source: Λιβόρνο
|
448
|
+
expected: Livórno
|
449
|
+
- source: Λονδίνο
|
450
|
+
expected: Londíno
|
451
|
+
- source: Λυών
|
452
|
+
expected: Lyṓn
|
453
|
+
- source: Μάλαγα
|
454
|
+
expected: Málaga
|
455
|
+
- source: Μασσαλία
|
456
|
+
expected: Massalía
|
457
|
+
- source: Μικρονησία
|
458
|
+
expected: Mikronīsía
|
459
|
+
- source: Μιλάνο
|
460
|
+
expected: Miláno
|
461
|
+
- source: Μόσχα
|
462
|
+
expected: Móscha
|
463
|
+
- source: Μπολόνια
|
464
|
+
expected: Mpolónia
|
465
|
+
- source: Νάπολη
|
466
|
+
expected: Nápolī
|
467
|
+
- source: Νταγκεστάν
|
468
|
+
expected: Ntagkestán
|
469
|
+
- source: Νέα Υόρκη
|
470
|
+
expected: Néa Yórkī
|
471
|
+
- source: Οξφόρδη
|
472
|
+
expected: Oxfórdī
|
473
|
+
- source: Ουαλία
|
474
|
+
expected: Oualía
|
475
|
+
- source: Παρίσι
|
476
|
+
expected: Parísi
|
477
|
+
- source: Πάφος
|
478
|
+
expected: Páfos
|
479
|
+
- source: Πολυνησία
|
480
|
+
expected: Polynīsía
|
481
|
+
- source: Ρώμη
|
482
|
+
expected: Rṓmī
|
483
|
+
- source: Σαμάρεια
|
484
|
+
expected: Samáreia
|
485
|
+
- source: Σικελία
|
486
|
+
expected: Sikelía
|
487
|
+
- source: Σκανδιναβία
|
488
|
+
expected: Skandinavía
|
489
|
+
- source: Σκόπια
|
490
|
+
expected: Skópia
|
491
|
+
- source: Σκωτία
|
492
|
+
expected: Skōtía
|
493
|
+
- source: Σμύρνη
|
494
|
+
expected: Smýrnī
|
495
|
+
- source: Ταϊτή
|
496
|
+
expected: Taïtī́
|
497
|
+
- source: Ταταρστάν
|
498
|
+
expected: Tatarstán
|
499
|
+
- source: Τζαμάικα
|
500
|
+
expected: Tzamáika
|
501
|
+
- source: Τηλλυρία
|
502
|
+
expected: Tīllyría
|
503
|
+
- source: Τιρόλο
|
504
|
+
expected: Tirólo
|
505
|
+
- source: Τορίνο
|
506
|
+
expected: Toríno
|
507
|
+
- source: Φανάρι
|
508
|
+
expected: Fanári
|
509
|
+
- source: Φλωρεντία
|
510
|
+
expected: Flōrentía
|
511
|
+
- source: Χαβάη
|
512
|
+
expected: Chaváī
|
513
|
+
- source: Χονγκ Κονγκ
|
514
|
+
expected: Chongk Kongk
|
515
|
+
|
516
|
+
map:
|
517
|
+
# https://en.wikipedia.org/wiki/Romanization_of_Greek
|
518
|
+
rules:
|
519
|
+
- pattern: (?<=[ΑαΕεΟο])\u03A5 # Υ (after Α, Ε, Ο — either case)
|
520
|
+
result: U
|
521
|
+
- pattern: (?<=[ΑαΕεΟο])\u03C5 # υ (after Α, Ε, Ο — either case)
|
522
|
+
result: u
|
523
|
+
- pattern: (?<=[ΑαΕεΟο])\u03CD # ύ (after Α, Ε, Ο — either case)
|
524
|
+
result: ú
|
525
|
+
- pattern: \u037E # ; (U+037E GREEK QUESTION MARK)
|
526
|
+
result: "?"
|
527
|
+
- pattern: \u003B # ; (U+003B ASCII semicolon, used as the Greek question mark)
|
528
|
+
result: "?"
|
529
|
+
|
530
|
+
characters:
|
531
|
+
"\u0027": ""
|
532
|
+
"\u0386": "Á" # Ά
|
533
|
+
"\u0391": "A" # Α
|
534
|
+
"\u0392": "V" # Β
|
535
|
+
"\u0393": "G" # Γ
|
536
|
+
"\u0394": "D" # Δ
|
537
|
+
"\u0395": "E" # Ε
|
538
|
+
"\u0396": "Z" # Ζ
|
539
|
+
"\u0397": "Ī" # Η
|
540
|
+
"\u0398": "Th" # Θ
|
541
|
+
"\u0399": "I" # Ι
|
542
|
+
"\u039A": "K" # Κ
|
543
|
+
"\u039B": "L" # Λ
|
544
|
+
"\u039C": "M" # Μ
|
545
|
+
"\u039D": "N" # Ν
|
546
|
+
"\u039E": "X" # Ξ
|
547
|
+
"\u039F": "O" # Ο
|
548
|
+
"\u03A0": "P" # Π
|
549
|
+
"\u03A1": "R" # Ρ
|
550
|
+
"\u03A3": "S" # Σ
|
551
|
+
"\u03A4": "T" # Τ
|
552
|
+
"\u03A5": "Y" # Υ
|
553
|
+
"\u03A6": "F" # Φ
|
554
|
+
"\u03A7": "Ch" # Χ
|
555
|
+
"\u03A8": "Ps" # Ψ
|
556
|
+
"\u03A9": "Ō" # Ω
|
557
|
+
"\u0388": "É" # Έ
|
558
|
+
"\u0389": "Ī́" # Ή
|
559
|
+
"\u038A": "Í" # Ί
|
560
|
+
"\u038C": "Ó" # Ό
|
561
|
+
"\u038E": "Ý" # Ύ
|
562
|
+
"\u038F": "Ṓ" # Ώ
|
563
|
+
"\u03AA": "Ï" # Ϊ
|
564
|
+
"\u03AB": "Ÿ" # Ϋ
|
565
|
+
|
566
|
+
"\u03AC": "á" # ά
|
567
|
+
"\u03B1": "a" # α
|
568
|
+
"\u03B2": "v" # β
|
569
|
+
"\u03B3": "g" # γ
|
570
|
+
"\u03B4": "d" # δ
|
571
|
+
"\u03B5": "e" # ε
|
572
|
+
"\u03B6": "z" # ζ
|
573
|
+
"\u03B7": "ī" # η
|
574
|
+
"\u03B8": "th" # θ
|
575
|
+
"\u03B9": "i" # ι
|
576
|
+
"\u03BA": "k" # κ
|
577
|
+
"\u03BB": "l" # λ
|
578
|
+
"\u03BC": "m" # μ
|
579
|
+
"\u03BD": "n" # ν
|
580
|
+
"\u03BE": "x" # ξ
|
581
|
+
"\u03BF": "o" # ο
|
582
|
+
"\u03C0": "p" # π
|
583
|
+
"\u03C1": "r" # ρ
|
584
|
+
"\u03C3": "s" # σ
|
585
|
+
"\u03C2": "s" # ς
|
586
|
+
"\u03C4": "t" # τ
|
587
|
+
"\u03C5": "y" # υ
|
588
|
+
"\u03C6": "f" # φ
|
589
|
+
"\u03C7": "ch" # χ
|
590
|
+
"\u03C8": "ps" # ψ
|
591
|
+
"\u03C9": "ō" # ω
|
592
|
+
"\u03AD": "é" # έ
|
593
|
+
"\u03AE": "ī́" # ή
|
594
|
+
"\u03AF": "í" # ί
|
595
|
+
"\u03CC": "ó" # ό
|
596
|
+
"\u03CD": "ý" # ύ
|
597
|
+
"\u03CE": "ṓ" # ώ
|
598
|
+
"\u03CA": "ï" # ϊ
|
599
|
+
"\u03CB": "ÿ" # ϋ
|
600
|
+
"\u0390": "ḯ" # ΐ
|
601
|
+
"\u03B0": "ÿ́" # ΰ
|
602
|
+
|
603
|
+
"\u03DC": "W" # Ϝ
|
604
|
+
"\u03DD": "w" # ϝ
|
605
|
+
"\u03F2": "s" # ϲ
|
606
|
+
"\u03F9": "S" # Ϲ
|
607
|
+
|
608
|
+
"\u0387": ";" # ·
|
609
|
+
"\u00B7": ";" # ·
|