interscript 0.1.2 → 0.1.3
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/README.adoc +246 -14
- data/bin/interscript +38 -17
- data/bin/setup +8 -0
- data/lib/g2pwrapper.py +34 -0
- data/lib/interscript.rb +140 -16
- data/lib/interscript/command.rb +27 -0
- data/lib/interscript/mapping.rb +125 -0
- data/lib/interscript/version.rb +1 -1
- data/lib/model-7 +0 -0
- data/lib/tha-pt-b-7 +0 -0
- data/maps/acadsin-zho-Hani-Latn-2002.yaml +38912 -0
- data/maps/alalc-bel-cyrl-latn-1997.yaml +125 -0
- data/maps/alalc-ben-Beng-Latn-2017.yaml +130 -0
- data/maps/alalc-bul-Cyrl-Latn-1997.yaml +94 -0
- data/maps/alalc-ell-Grek-Latn-1997.yaml +625 -0
- data/maps/alalc-ell-Grek-Latn-2010.yaml +628 -0
- data/maps/alalc-kat-Geok-Latn-1997.yaml +112 -0
- data/maps/alalc-kat-Geor-Latn-1997.yaml +146 -0
- data/maps/alalc-kor-Hang-Latn-1997.yaml +94 -0
- data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +103 -0
- data/maps/alalc-mkd-cyrl-latn-1997.yaml +114 -0
- data/maps/alalc-srp-Cyrl-Latn-1997.yaml +114 -0
- data/maps/alalc-srp-cyrl-latn-2013.yaml +135 -0
- data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +141 -0
- data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +16 -0
- data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +283 -0
- data/maps/{bas-rus-Cyrl-Latn-bss.yaml → bas-rus-Cyrl-Latn-2017-bss.yaml} +57 -31
- data/maps/{bas-rus-Cyrl-Latn-oss.yaml → bas-rus-Cyrl-Latn-2017-oss.yaml} +54 -34
- data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +294 -0
- data/maps/bgn-kor-Hang-Latn-1943.yaml +31 -0
- data/maps/bgn-kor-Kore-Latn-1943.yaml +31 -0
- data/maps/bgna-bul-Cyrl-Latn-2006.yaml +208 -0
- data/maps/bgna-bul-Cyrl-Latn-2009.yaml +208 -0
- data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +1 -2
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +104 -0
- data/maps/bgnpcgn-bel-cyrl-latn-1979.yaml +285 -0
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +115 -0
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +10 -64
- data/maps/bgnpcgn-chn-Hans-Latn-1979.yaml +7456 -0
- data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +702 -0
- data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +20 -0
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +257 -0
- data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +127 -0
- data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +43 -0
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +253 -0
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +48 -0
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +48 -0
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +159 -0
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +190 -0
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +145 -64
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +166 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +75 -2
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +208 -0
- data/maps/by-bel-Cyrl-Latn-1998.yaml +168 -0
- data/maps/by-bel-Cyrl-Latn-2007.yaml +115 -0
- data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +685 -0
- data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +681 -0
- data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +20 -0
- data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +32 -0
- data/maps/ggg-kat-Geor-Latn-2002.yaml +89 -0
- data/maps/gki-bel-cyrl-latn-1992.yaml +33 -0
- data/maps/gki-bel-cyrl-latn-2000.yaml +201 -0
- data/maps/gost-rus-cyrl-latn-16876-71-1983.yaml +186 -0
- data/maps/hk-yue-Hani-Latn-1888.yaml +38497 -0
- data/maps/icao-bel-Cyrl-Latn-9303.yaml +108 -92
- data/maps/icao-bul-Cyrl-Latn-9303.yaml +1 -2
- data/maps/icao-heb-Hebr-Latn-9303.yaml +118 -124
- data/maps/icao-mkd-Cyrl-Latn-9303.yaml +1 -2
- data/maps/icao-per-Arab-Latn-9303.yaml +5 -6
- data/maps/icao-rus-Cyrl-Latn-9303.yaml +1 -2
- data/maps/icao-srp-Cyrl-Latn-9303.yaml +1 -2
- data/maps/icao-ukr-Cyrl-Latn-9303.yaml +1 -2
- data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +610 -0
- data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +41 -0
- data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +62 -0
- data/maps/{iso-rus-Cyrl-Latn-iso9.yaml → iso-rus-Cyrl-Latn-9-1995.yaml} +2 -3
- data/maps/iso-tha-Thai-Latn-11940-1998.yaml +109 -0
- data/maps/kp-kor-Hang-Latn-2002.yaml +901 -0
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +44820 -0
- data/maps/mext-jpn-Hrkt-Latn-1954.yaml +411 -0
- data/maps/moct-kor-Hang-Latn-2000.yaml +803 -0
- data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +541 -0
- data/maps/nil-kor-Hang-Hang-jamo.yaml +11193 -0
- data/maps/odni-kat-Geor-Latn-2015.yaml +88 -0
- data/maps/odni-ukr-Cyrl-Latn-2015.yaml +157 -0
- data/maps/royin-tha-Thai-Latn-1939-generic.yaml +90 -0
- data/maps/royin-tha-Thai-Latn-1968.yaml +179 -0
- data/maps/royin-tha-Thai-Latn-1999-chained.yaml +180 -0
- data/maps/royin-tha-Thai-Latn-1999.yaml +76 -0
- data/maps/{cn-chn-Hans-Latn-pinyin.yaml → sac-zho-Hans-Latn-1979.yaml} +6 -7
- data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +222 -0
- data/maps/ua-ukr-Cyrl-Latn-1996.yaml +193 -0
- data/maps/un-bel-Cyrl-Latn-2007.yaml +114 -0
- data/maps/un-ben-Beng-Latn-2016.yaml +534 -0
- data/maps/un-ell-Grek-Latn-1987-tl.yaml +32 -0
- data/maps/un-ell-Grek-Latn-1987-ts.yaml +20 -0
- data/maps/un-ell-Grek-Latn-phonetic-1987.yaml +780 -0
- data/maps/un-mon-Mong-Latn-2013.yaml +19 -6
- data/maps/un-rus-Cyrl-Latn-1987.yaml +166 -0
- data/maps/un-ukr-cyrl-latn-1998.yaml +30 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +406 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +386 -0
- data/maps/var-kor-Hang-Latn-mr-1939.yaml +1054 -0
- data/maps/var-kor-Kore-Hang-2013.yaml +59754 -0
- data/maps/var-kor-Kore-Latn-mr-1939.yaml +37 -0
- data/maps/var-tha-Thai-Thai-phonemic.yaml +59 -0
- data/maps/var-tha-Thai-Zsym-ipa.yaml +301 -0
- data/maps/var-zho-Hani-Latn-1979.yaml +38908 -0
- data/spec/interscript/mapping_spec.rb +42 -0
- data/spec/interscript_spec.rb +20 -5
- data/spec/spec_helper.rb +3 -1
- metadata +149 -24
- data/maps/bgnpcgn-chn-Hans-Latn-pinyin.yaml +0 -7503
- data/maps/historic-jpn-Hrkt-Latn-hepburn.yaml +0 -336
- data/maps/icao-gre-Grek-Latn-9303.yaml +0 -101
- data/maps/mext-jpn-Hrkt-Latn-hepburn.yaml +0 -330
- data/maps/mext-jpn-Hrkt-Latn-kunrei.yaml +0 -308
- data/maps/un-jpn-Hrkt-Latn-hepburn.yaml +0 -313
- data/maps/un-jpn-Hrkt-Latn-kunrei.yaml +0 -354
|
@@ -0,0 +1,20 @@
|
|
|
1
|
+
---
|
|
2
|
+
authority_id: bgnpcgn
|
|
3
|
+
id: 1996
|
|
4
|
+
language: ell
|
|
5
|
+
source_script: Grek
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: BGN/PCGN 1996 System
|
|
8
|
+
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/693694/ROMANIZATION_OF_GREEK.pdf
|
|
9
|
+
creation_date: 1996
|
|
10
|
+
description: |
|
|
11
|
+
BGN/PCGN Romanization table for Greek
|
|
12
|
+
|
|
13
|
+
notes:
|
|
14
|
+
- Identical to ELOT 743:1982, which is also adopted as ISO 843:1997 and by UNGEGN
|
|
15
|
+
|
|
16
|
+
map:
|
|
17
|
+
character_separator: ""
|
|
18
|
+
word_separator: " "
|
|
19
|
+
inherit: "elot-ell-Grek-Latn-743-1982-ts"
|
|
20
|
+
|
|
@@ -0,0 +1,257 @@
|
|
|
1
|
+
---
|
|
2
|
+
authority_id: bgnpcgn
|
|
3
|
+
id: 1930
|
|
4
|
+
language: jpn
|
|
5
|
+
source_script: Hrkt
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: Japanese Kana Modified Hepburn 1930 System
|
|
8
|
+
url:
|
|
9
|
+
creation_date:
|
|
10
|
+
adoption_date:
|
|
11
|
+
description:
|
|
12
|
+
|
|
13
|
+
notes:
|
|
14
|
+
- Segmentation needs to be done before using this map
|
|
15
|
+
- Note 5 in the specification states that when identical repeating vowels
|
|
16
|
+
belong to different kanji characters, they shall be romanized
|
|
17
|
+
individually and an apostrophe (’) shall be placed between the vowels.
|
|
18
|
+
However since this is a map from Kana to Hepburn, there is no way to
|
|
19
|
+
implement this feature.
|
|
20
|
+
- The documentation did not specify how the hyphen should be used.
|
|
21
|
+
|
|
22
|
+
tests:
|
|
23
|
+
|
|
24
|
+
- source: てがた-からみでん
|
|
25
|
+
expected: "Tegata-karamiden"
|
|
26
|
+
- source: てがた-すみよしちょう
|
|
27
|
+
expected: "Tegata-sumiyoshichō"
|
|
28
|
+
- source: さいのはま
|
|
29
|
+
expected: "Sainohama"
|
|
30
|
+
- source: てがた-たなか
|
|
31
|
+
expected: "Tegata-tanaka"
|
|
32
|
+
- source: ほりおでん
|
|
33
|
+
expected: "Horioden"
|
|
34
|
+
- source: そえがわ
|
|
35
|
+
expected: "Soegawa"
|
|
36
|
+
- source: ふねがさわ
|
|
37
|
+
expected: "Funegasawa"
|
|
38
|
+
- source: とくまんだて
|
|
39
|
+
expected: "Tokumandate"
|
|
40
|
+
- source: たてない
|
|
41
|
+
expected: "Tatenai"
|
|
42
|
+
- source: つるがさき
|
|
43
|
+
expected: "Tsurugasaki"
|
|
44
|
+
- source: しもやつせ
|
|
45
|
+
expected: "Shimoyatsuse"
|
|
46
|
+
- source: かみやつせ
|
|
47
|
+
expected: "Kamiyatsuse"
|
|
48
|
+
- source: しんとうだ
|
|
49
|
+
expected: "Shintōda"
|
|
50
|
+
- source: かじのめ
|
|
51
|
+
expected: "Kajinome"
|
|
52
|
+
- source: まえぎ
|
|
53
|
+
expected: "Maegi"
|
|
54
|
+
- source: くろさわ やま
|
|
55
|
+
expected: "Kurosawa Yama"
|
|
56
|
+
- source: いちのさわ がわ
|
|
57
|
+
expected: "Ichinosawa Gawa"
|
|
58
|
+
- source: はちやまえ
|
|
59
|
+
expected: "Hachiyamae"
|
|
60
|
+
- source: やち
|
|
61
|
+
expected: "Yachi"
|
|
62
|
+
- source: たてぬま
|
|
63
|
+
expected: "Tatenuma"
|
|
64
|
+
- source: しらはま
|
|
65
|
+
expected: "Shirahama"
|
|
66
|
+
- source: けせんまち
|
|
67
|
+
expected: "Kesenmachi"
|
|
68
|
+
- source: けいだい-かわら
|
|
69
|
+
expected: "Keidai-kawara"
|
|
70
|
+
- source: いしやました
|
|
71
|
+
expected: "Ishiyamashita"
|
|
72
|
+
- source: なえひら-やち
|
|
73
|
+
expected: "Naehira-yachi"
|
|
74
|
+
- source: とみの
|
|
75
|
+
expected: "Tomino"
|
|
76
|
+
- source: あらや-たかみまち
|
|
77
|
+
expected: "Araya-takamimachi"
|
|
78
|
+
- source: ながた
|
|
79
|
+
expected: "Nagata"
|
|
80
|
+
- source: とどろき おんせん
|
|
81
|
+
expected: "Todoroki Onsen"
|
|
82
|
+
- source: かしわぎはら
|
|
83
|
+
expected: "Kashiwagihara"
|
|
84
|
+
- source: とやけもり やま
|
|
85
|
+
expected: "Toyakemori Yama"
|
|
86
|
+
- source: なかさい
|
|
87
|
+
expected: "Nakasai"
|
|
88
|
+
- source: たけした
|
|
89
|
+
expected: "Takeshita"
|
|
90
|
+
- source: みと
|
|
91
|
+
expected: "Mito"
|
|
92
|
+
- source: みなみなかさと
|
|
93
|
+
expected: "Minaminakasato"
|
|
94
|
+
- source: みずおし
|
|
95
|
+
expected: "Mizuoshi"
|
|
96
|
+
- source: なかさと
|
|
97
|
+
expected: "Nakasato"
|
|
98
|
+
- source: しんかりば
|
|
99
|
+
expected: "Shinkariba"
|
|
100
|
+
- source: しんかみぬま
|
|
101
|
+
expected: "Shinkaminuma"
|
|
102
|
+
- source: しんばし
|
|
103
|
+
expected: "Shinbashi"
|
|
104
|
+
- source: りくぜんやました えき
|
|
105
|
+
expected: "Rikuzen’yamashita Eki"
|
|
106
|
+
- source: うしじまにし
|
|
107
|
+
expected: "Ushijimanishi"
|
|
108
|
+
- source: はまえば
|
|
109
|
+
expected: "Hamaeba"
|
|
110
|
+
- source: ぬまむかい
|
|
111
|
+
expected: "Numamukai"
|
|
112
|
+
- source: さんげんやち
|
|
113
|
+
expected: "Sangen’yachi"
|
|
114
|
+
- source: にけんやち
|
|
115
|
+
expected: "Niken’yachi"
|
|
116
|
+
- source: やちなか
|
|
117
|
+
expected: "Yachinaka"
|
|
118
|
+
- source: なす がわ
|
|
119
|
+
expected: "Nasu Gawa"
|
|
120
|
+
- source: おおはらはま
|
|
121
|
+
expected: "Ōharahama"
|
|
122
|
+
- source: うるご がわ
|
|
123
|
+
expected: "Urugo Gawa"
|
|
124
|
+
- source: なかばせ
|
|
125
|
+
expected: "Nakabase"
|
|
126
|
+
- source: うと えき
|
|
127
|
+
expected: "Uto Eki"
|
|
128
|
+
- source: みずまち
|
|
129
|
+
expected: "Mizumachi"
|
|
130
|
+
- source: ごんげんどう
|
|
131
|
+
expected: "Gongendō"
|
|
132
|
+
- source: いとひさ
|
|
133
|
+
expected: "Itohisa"
|
|
134
|
+
- source: あらおい
|
|
135
|
+
expected: "Araoi"
|
|
136
|
+
- source: わんめ
|
|
137
|
+
expected: "Wanme"
|
|
138
|
+
- source: かじろ
|
|
139
|
+
expected: "Kajiro"
|
|
140
|
+
- source: みやばら
|
|
141
|
+
expected: "Miyabara"
|
|
142
|
+
- source: いまどみ
|
|
143
|
+
expected: "Imadomi"
|
|
144
|
+
- source: かいほ
|
|
145
|
+
expected: "Kaiho"
|
|
146
|
+
- source: かいほ ぼえん
|
|
147
|
+
expected: "Kaiho Boen"
|
|
148
|
+
- source: ひきだ
|
|
149
|
+
expected: "Hikida"
|
|
150
|
+
- source: あさい-こむかい
|
|
151
|
+
expected: "Asai-komukai"
|
|
152
|
+
- source: こうざか
|
|
153
|
+
expected: "Kōzaka"
|
|
154
|
+
- source: こうふうだい
|
|
155
|
+
expected: "Kōfūdai"
|
|
156
|
+
- source: たての
|
|
157
|
+
expected: "Tateno"
|
|
158
|
+
- source: センター
|
|
159
|
+
expected: "Sentā"
|
|
160
|
+
- source: フィリピン
|
|
161
|
+
expected: "Firipin"
|
|
162
|
+
- source: ヴィオリン
|
|
163
|
+
expected: "Viorin"
|
|
164
|
+
- source: クォーター
|
|
165
|
+
expected: "Kwōtā"
|
|
166
|
+
- source: パッチリ
|
|
167
|
+
expected: "Patchiri"
|
|
168
|
+
- source: ぽっぽっや
|
|
169
|
+
expected: "Poppoyya"
|
|
170
|
+
|
|
171
|
+
map:
|
|
172
|
+
character_separator: ""
|
|
173
|
+
word_separator: " "
|
|
174
|
+
title_case: True
|
|
175
|
+
inherit: var-jpn-Hrkt-Latn-hepburn-1954
|
|
176
|
+
|
|
177
|
+
characters:
|
|
178
|
+
# Rare sounds, Table 2 & 4
|
|
179
|
+
|
|
180
|
+
"くぁ": "kwa"
|
|
181
|
+
"クァ": "kwa"
|
|
182
|
+
"ぐぁ": "gwa"
|
|
183
|
+
"グァ": "gwa"
|
|
184
|
+
"くぃ": "kwi"
|
|
185
|
+
"クィ": "kwi"
|
|
186
|
+
"ぐぃ": "gwi"
|
|
187
|
+
"グィ": "gwi"
|
|
188
|
+
"きぇ": "kye"
|
|
189
|
+
"キェ": "kye"
|
|
190
|
+
"ぎぇ": "gye"
|
|
191
|
+
"ギェ": "gye"
|
|
192
|
+
"くぇ": "kwe"
|
|
193
|
+
"クェ": "kwe"
|
|
194
|
+
"ぐぇ": "gwe"
|
|
195
|
+
"グェ": "gwe"
|
|
196
|
+
"くぉ": "kwo"
|
|
197
|
+
"クォ": "kwo"
|
|
198
|
+
"ぐぉ": "gwo"
|
|
199
|
+
"グォ": "gwo"
|
|
200
|
+
"しぇ": "she"
|
|
201
|
+
"シェ": "she"
|
|
202
|
+
"じぇ": "je"
|
|
203
|
+
"ジェ": "je"
|
|
204
|
+
"つぁ": "tsa"
|
|
205
|
+
"ツァ": "tsa"
|
|
206
|
+
"てぃ": "ti"
|
|
207
|
+
"ティ": "ti"
|
|
208
|
+
"でぃ": "di"
|
|
209
|
+
"ディ": "di"
|
|
210
|
+
"てゅ": "tyu"
|
|
211
|
+
"テュ": "tyu"
|
|
212
|
+
"でゅ": "dyu"
|
|
213
|
+
"デュ": "dyu"
|
|
214
|
+
"とゅ": "tu"
|
|
215
|
+
"トュ": "tu"
|
|
216
|
+
"どゅ": "du"
|
|
217
|
+
"ドュ": "du"
|
|
218
|
+
"ちぇ": "che"
|
|
219
|
+
"チェ": "che"
|
|
220
|
+
"ぢぇ": "je"
|
|
221
|
+
"ヂェ": "je"
|
|
222
|
+
"つぇ": "tse"
|
|
223
|
+
"ツェ": "tse"
|
|
224
|
+
"つぉ": "tso"
|
|
225
|
+
"ツォ": "tso"
|
|
226
|
+
"にぇ": "nye"
|
|
227
|
+
"ニェ": "nye"
|
|
228
|
+
"ふぁ": "fa"
|
|
229
|
+
"ファ": "fa"
|
|
230
|
+
"ふぃ": "fi"
|
|
231
|
+
"フィ": "fi"
|
|
232
|
+
"ふぇ": "fe"
|
|
233
|
+
"フェ": "fe"
|
|
234
|
+
"ふぉ": "fo"
|
|
235
|
+
"フォ": "fo"
|
|
236
|
+
"みぇ": "mye"
|
|
237
|
+
"ミェ": "mye"
|
|
238
|
+
"ぃぇ": "ye"
|
|
239
|
+
"ィェ": "ye"
|
|
240
|
+
"りぇ": "rye"
|
|
241
|
+
"リェ": "rye"
|
|
242
|
+
"ゔぁ": "va"
|
|
243
|
+
"ヴァ": "va"
|
|
244
|
+
"うぃ": "wi"
|
|
245
|
+
"ウィ": "wi"
|
|
246
|
+
"ゔぃ": "vi"
|
|
247
|
+
"ヴィ": "vi"
|
|
248
|
+
"うぇ": "we"
|
|
249
|
+
"ウェ": "we"
|
|
250
|
+
"ゔぇ": "ve"
|
|
251
|
+
"ヴェ": "ve"
|
|
252
|
+
"うぉ": "wo"
|
|
253
|
+
"ウォ": "wo"
|
|
254
|
+
"ゔぉ": "vo"
|
|
255
|
+
"ヴォ": "vo"
|
|
256
|
+
"ゔ": "vu"
|
|
257
|
+
"ヴ": "vu"
|
|
@@ -0,0 +1,127 @@
|
|
|
1
|
+
---
|
|
2
|
+
authority_id: bgnpcgn
|
|
3
|
+
id: 1981
|
|
4
|
+
language: kat
|
|
5
|
+
source_script: Geor
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: ROMANIZATION OF GEORGIAN; BGN/PCGN 1981 System
|
|
8
|
+
url: https://transliteration.eki.ee/pdf/Georgian.pdf
|
|
9
|
+
creation_date: 1981
|
|
10
|
+
confirmation_date: 1981
|
|
11
|
+
description: |
|
|
12
|
+
BGN/PCGN system of 1981.
|
|
13
|
+
|
|
14
|
+
notes:
|
|
15
|
+
|
|
16
|
+
tests:
|
|
17
|
+
- source: ჰებუდი
|
|
18
|
+
expected: hebudi
|
|
19
|
+
|
|
20
|
+
- source: ჯვრის წყალსაცავი
|
|
21
|
+
expected: jvris tsqalsats’avi
|
|
22
|
+
|
|
23
|
+
- source: ჯვავიაკვარა
|
|
24
|
+
expected: jvaviak’vara
|
|
25
|
+
|
|
26
|
+
- source: ჯობრია
|
|
27
|
+
expected: jobria
|
|
28
|
+
|
|
29
|
+
- source: ძულუხირა
|
|
30
|
+
expected: dzulukhira
|
|
31
|
+
|
|
32
|
+
- source: ლეკუხონა
|
|
33
|
+
expected: lek’ukhona
|
|
34
|
+
|
|
35
|
+
- source: აბაშა
|
|
36
|
+
expected: abasha
|
|
37
|
+
|
|
38
|
+
- source: ააცი
|
|
39
|
+
expected: aats’i
|
|
40
|
+
|
|
41
|
+
# TODO: Which system does this example belong to?
|
|
42
|
+
# - source: აბააჟახვუ
|
|
43
|
+
# expected: abaazhvakhu
|
|
44
|
+
|
|
45
|
+
# TODO: These examples from GNDB are clearly using the BGNPCGN 2009 system
|
|
46
|
+
#
|
|
47
|
+
# - source: ხობის მუნიციპალიტეტი
|
|
48
|
+
# expected: khobis munitsip’alit’et’i
|
|
49
|
+
#
|
|
50
|
+
# - source: მყინვარი ჩრდილოეთი ლეადაშატი
|
|
51
|
+
# expected: mq’invari chrdiloeti leadashat’i
|
|
52
|
+
#
|
|
53
|
+
# - source: ხეწკვარა
|
|
54
|
+
# expected: khets’k’vara
|
|
55
|
+
#
|
|
56
|
+
# - source: ჯამპალი
|
|
57
|
+
# expected: jamp’ali
|
|
58
|
+
#
|
|
59
|
+
# - source: ჯავის მუნიციპალიტეტი
|
|
60
|
+
# expected: javis munitsip’alit’et’i
|
|
61
|
+
#
|
|
62
|
+
# - source: ხოიჯგეთა
|
|
63
|
+
# expected: khoijgeta
|
|
64
|
+
#
|
|
65
|
+
# - source: ხობის მუნიციპალიტეტი
|
|
66
|
+
# expected: khobis munitsip’alit’et’i
|
|
67
|
+
#
|
|
68
|
+
# - source: წვიშარხუ
|
|
69
|
+
# expected: ts’visharkhu
|
|
70
|
+
# - source: აღმოსავლეთი გუმისთა
|
|
71
|
+
# expected: aghmosavleti gumista
|
|
72
|
+
#
|
|
73
|
+
# - source: ქვემო ბირცხა
|
|
74
|
+
# expected: kvemo birtskha
|
|
75
|
+
#
|
|
76
|
+
# - source: ზემო ბირცხა
|
|
77
|
+
# expected: zemo birtskha
|
|
78
|
+
#
|
|
79
|
+
# - source: აბჟაყვა
|
|
80
|
+
# expected: abzhaq’va
|
|
81
|
+
|
|
82
|
+
|
|
83
|
+
|
|
84
|
+
map:
|
|
85
|
+
characters:
|
|
86
|
+
'\u10d0' : 'a' # ა
|
|
87
|
+
'\u10d1' : 'b' # ბ
|
|
88
|
+
'\u10d2' : 'g' # გ
|
|
89
|
+
'\u10d3' : 'd' # დ
|
|
90
|
+
'\u10d4' : 'e' # ე
|
|
91
|
+
'\u10d5' : 'v' # ვ
|
|
92
|
+
'\u10d6' : 'z' # ზ
|
|
93
|
+
|
|
94
|
+
'\u10f1' : 'ey' # ჱ
|
|
95
|
+
|
|
96
|
+
'\u10d7' : 't’' # თ
|
|
97
|
+
'\u10d8' : 'i' # ი
|
|
98
|
+
'\u10d9' : 'k’' # კ
|
|
99
|
+
'\u10da' : 'l' # ლ
|
|
100
|
+
'\u10db' : 'm' # მ
|
|
101
|
+
'\u10dc' : 'n' # ნ
|
|
102
|
+
|
|
103
|
+
'\u10f2' : 'j' # ჲ
|
|
104
|
+
|
|
105
|
+
'\u10dd' : 'o' # ო
|
|
106
|
+
'\u10de' : 'p' # პ
|
|
107
|
+
'\u10df' : 'zh' # ჟ
|
|
108
|
+
'\u10e0' : 'r' # რ
|
|
109
|
+
'\u10e1' : 's' # ს
|
|
110
|
+
'\u10e2' : 't' # ტ
|
|
111
|
+
'\u10e3' : 'u' # უ
|
|
112
|
+
'\u10e4' : 'p’' # ფ
|
|
113
|
+
'\u10e5' : 'k’' # ქ
|
|
114
|
+
'\u10e6' : 'gh' # ღ
|
|
115
|
+
'\u10e7' : 'q' # ყ
|
|
116
|
+
'\u10e8' : 'sh' # შ
|
|
117
|
+
'\u10e9' : 'ch’' # ჩ
|
|
118
|
+
'\u10ea' : 'ts’' # ც
|
|
119
|
+
'\u10eb' : 'dz' # ძ
|
|
120
|
+
'\u10ec' : 'ts' # წ
|
|
121
|
+
'\u10ed' : 'ch' # ჭ
|
|
122
|
+
'\u10ee' : 'kh' # ხ
|
|
123
|
+
|
|
124
|
+
'\u10f4' : 'q’' # ჴ
|
|
125
|
+
|
|
126
|
+
'\u10ef' : 'j' # ჯ
|
|
127
|
+
'\u10f0' : 'h' # ჰ
|
|
@@ -0,0 +1,43 @@
|
|
|
1
|
+
---
|
|
2
|
+
authority_id: bgnpcgn
|
|
3
|
+
id: 2009
|
|
4
|
+
language: kat
|
|
5
|
+
source_script: Geor
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: ROMANIZATION OF GEORGIAN; Georgia 2011 national system; BGN/PCGN 2009 Agreement
|
|
8
|
+
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/810202/ROMANIZATION_OF_GEORGIAN.pdf
|
|
9
|
+
creation_date: 2009
|
|
10
|
+
confirmation_date: 2011
|
|
11
|
+
description: |
|
|
12
|
+
This romanization system corresponds to that devised in 2002 by the
|
|
13
|
+
State Department of Geodesy and Cartography of Georgia and the
|
|
14
|
+
Institute of Linguistics of the Georgian Academy of Sciences, and
|
|
15
|
+
approved by Presidential Decree 109 of 24 February 2011. It represents
|
|
16
|
+
the Mkhedruli alphabet, as presently used in Georgia. This system was
|
|
17
|
+
adopted by BGN and PCGN in 2009, superseding the BGN/PCGN system of
|
|
18
|
+
1981.
|
|
19
|
+
|
|
20
|
+
notes:
|
|
21
|
+
- This system denotes ejective (glottalised) consonants by means of
|
|
22
|
+
an apostrophe. The BGN/PCGN 1981 system instead used the apostrophe to
|
|
23
|
+
denote aspirated consonants (letters 8, 21, 22, 26 & 27).
|
|
24
|
+
- The Romanization columns show only lowercase forms but, when
|
|
25
|
+
romanizing, uppercase and lowercase Roman letters as appropriate should
|
|
26
|
+
be used.
|
|
27
|
+
|
|
28
|
+
tests:
|
|
29
|
+
- source: თბილისი
|
|
30
|
+
expected: tbilisi
|
|
31
|
+
|
|
32
|
+
- source: მეღვინეთუხუცესი
|
|
33
|
+
expected: meghvinetukhutsesi
|
|
34
|
+
|
|
35
|
+
- source: ჭიანჭველა
|
|
36
|
+
expected: ch’ianch’vela
|
|
37
|
+
|
|
38
|
+
- source: ბაყაყი
|
|
39
|
+
expected: baq’aq’i
|
|
40
|
+
|
|
41
|
+
map:
|
|
42
|
+
inherit: "ggg-kat-Geor-Latn-2002"
|
|
43
|
+
|