interscript 0.1.2 → 0.1.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (120) hide show
  1. checksums.yaml +4 -4
  2. data/README.adoc +246 -14
  3. data/bin/interscript +38 -17
  4. data/bin/setup +8 -0
  5. data/lib/g2pwrapper.py +34 -0
  6. data/lib/interscript.rb +140 -16
  7. data/lib/interscript/command.rb +27 -0
  8. data/lib/interscript/mapping.rb +125 -0
  9. data/lib/interscript/version.rb +1 -1
  10. data/lib/model-7 +0 -0
  11. data/lib/tha-pt-b-7 +0 -0
  12. data/maps/acadsin-zho-Hani-Latn-2002.yaml +38912 -0
  13. data/maps/alalc-bel-cyrl-latn-1997.yaml +125 -0
  14. data/maps/alalc-ben-Beng-Latn-2017.yaml +130 -0
  15. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +94 -0
  16. data/maps/alalc-ell-Grek-Latn-1997.yaml +625 -0
  17. data/maps/alalc-ell-Grek-Latn-2010.yaml +628 -0
  18. data/maps/alalc-kat-Geok-Latn-1997.yaml +112 -0
  19. data/maps/alalc-kat-Geor-Latn-1997.yaml +146 -0
  20. data/maps/alalc-kor-Hang-Latn-1997.yaml +94 -0
  21. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +103 -0
  22. data/maps/alalc-mkd-cyrl-latn-1997.yaml +114 -0
  23. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +114 -0
  24. data/maps/alalc-srp-cyrl-latn-2013.yaml +135 -0
  25. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +141 -0
  26. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +16 -0
  27. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +283 -0
  28. data/maps/{bas-rus-Cyrl-Latn-bss.yaml → bas-rus-Cyrl-Latn-2017-bss.yaml} +57 -31
  29. data/maps/{bas-rus-Cyrl-Latn-oss.yaml → bas-rus-Cyrl-Latn-2017-oss.yaml} +54 -34
  30. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +294 -0
  31. data/maps/bgn-kor-Hang-Latn-1943.yaml +31 -0
  32. data/maps/bgn-kor-Kore-Latn-1943.yaml +31 -0
  33. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +208 -0
  34. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +208 -0
  35. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +1 -2
  36. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +104 -0
  37. data/maps/bgnpcgn-bel-cyrl-latn-1979.yaml +285 -0
  38. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +115 -0
  39. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +10 -64
  40. data/maps/bgnpcgn-chn-Hans-Latn-1979.yaml +7456 -0
  41. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +702 -0
  42. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +20 -0
  43. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +257 -0
  44. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +127 -0
  45. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +43 -0
  46. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +253 -0
  47. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +48 -0
  48. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +48 -0
  49. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +159 -0
  50. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +190 -0
  51. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +145 -64
  52. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +166 -0
  53. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +75 -2
  54. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +208 -0
  55. data/maps/by-bel-Cyrl-Latn-1998.yaml +168 -0
  56. data/maps/by-bel-Cyrl-Latn-2007.yaml +115 -0
  57. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +685 -0
  58. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +681 -0
  59. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +20 -0
  60. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +32 -0
  61. data/maps/ggg-kat-Geor-Latn-2002.yaml +89 -0
  62. data/maps/gki-bel-cyrl-latn-1992.yaml +33 -0
  63. data/maps/gki-bel-cyrl-latn-2000.yaml +201 -0
  64. data/maps/gost-rus-cyrl-latn-16876-71-1983.yaml +186 -0
  65. data/maps/hk-yue-Hani-Latn-1888.yaml +38497 -0
  66. data/maps/icao-bel-Cyrl-Latn-9303.yaml +108 -92
  67. data/maps/icao-bul-Cyrl-Latn-9303.yaml +1 -2
  68. data/maps/icao-heb-Hebr-Latn-9303.yaml +118 -124
  69. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +1 -2
  70. data/maps/icao-per-Arab-Latn-9303.yaml +5 -6
  71. data/maps/icao-rus-Cyrl-Latn-9303.yaml +1 -2
  72. data/maps/icao-srp-Cyrl-Latn-9303.yaml +1 -2
  73. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +1 -2
  74. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +610 -0
  75. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +41 -0
  76. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +62 -0
  77. data/maps/{iso-rus-Cyrl-Latn-iso9.yaml → iso-rus-Cyrl-Latn-9-1995.yaml} +2 -3
  78. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +109 -0
  79. data/maps/kp-kor-Hang-Latn-2002.yaml +901 -0
  80. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +44820 -0
  81. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +411 -0
  82. data/maps/moct-kor-Hang-Latn-2000.yaml +803 -0
  83. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +541 -0
  84. data/maps/nil-kor-Hang-Hang-jamo.yaml +11193 -0
  85. data/maps/odni-kat-Geor-Latn-2015.yaml +88 -0
  86. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +157 -0
  87. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +90 -0
  88. data/maps/royin-tha-Thai-Latn-1968.yaml +179 -0
  89. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +180 -0
  90. data/maps/royin-tha-Thai-Latn-1999.yaml +76 -0
  91. data/maps/{cn-chn-Hans-Latn-pinyin.yaml → sac-zho-Hans-Latn-1979.yaml} +6 -7
  92. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +222 -0
  93. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +193 -0
  94. data/maps/un-bel-Cyrl-Latn-2007.yaml +114 -0
  95. data/maps/un-ben-Beng-Latn-2016.yaml +534 -0
  96. data/maps/un-ell-Grek-Latn-1987-tl.yaml +32 -0
  97. data/maps/un-ell-Grek-Latn-1987-ts.yaml +20 -0
  98. data/maps/un-ell-Grek-Latn-phonetic-1987.yaml +780 -0
  99. data/maps/un-mon-Mong-Latn-2013.yaml +19 -6
  100. data/maps/un-rus-Cyrl-Latn-1987.yaml +166 -0
  101. data/maps/un-ukr-cyrl-latn-1998.yaml +30 -0
  102. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +406 -0
  103. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +386 -0
  104. data/maps/var-kor-Hang-Latn-mr-1939.yaml +1054 -0
  105. data/maps/var-kor-Kore-Hang-2013.yaml +59754 -0
  106. data/maps/var-kor-Kore-Latn-mr-1939.yaml +37 -0
  107. data/maps/var-tha-Thai-Thai-phonemic.yaml +59 -0
  108. data/maps/var-tha-Thai-Zsym-ipa.yaml +301 -0
  109. data/maps/var-zho-Hani-Latn-1979.yaml +38908 -0
  110. data/spec/interscript/mapping_spec.rb +42 -0
  111. data/spec/interscript_spec.rb +20 -5
  112. data/spec/spec_helper.rb +3 -1
  113. metadata +149 -24
  114. data/maps/bgnpcgn-chn-Hans-Latn-pinyin.yaml +0 -7503
  115. data/maps/historic-jpn-Hrkt-Latn-hepburn.yaml +0 -336
  116. data/maps/icao-gre-Grek-Latn-9303.yaml +0 -101
  117. data/maps/mext-jpn-Hrkt-Latn-hepburn.yaml +0 -330
  118. data/maps/mext-jpn-Hrkt-Latn-kunrei.yaml +0 -308
  119. data/maps/un-jpn-Hrkt-Latn-hepburn.yaml +0 -313
  120. data/maps/un-jpn-Hrkt-Latn-kunrei.yaml +0 -354
@@ -0,0 +1,20 @@
1
+ ---
2
+ authority_id: bgnpcgn
3
+ id: 1996
4
+ language: ell
5
+ source_script: Grek
6
+ destination_script: Latn
7
+ name: BGN/PCGN 1996 System
8
+ url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/693694/ROMANIZATION_OF_GREEK.pdf
9
+ creation_date: 1996
10
+ description: |
11
+ BGN/PCGN Romanization table for Greek
12
+
13
+ notes:
14
+ - Identical to ELOT 743:1982, which is also adopted as ISO 843:1997 and by UNGEGN
15
+
16
+ map:
17
+ character_separator: ""
18
+ word_separator: " "
19
+ inherit: "elot-ell-Grek-Latn-743-1982-ts"
20
+
@@ -0,0 +1,257 @@
1
+ ---
2
+ authority_id: bgnpcgn
3
+ id: 1930
4
+ language: jpn
5
+ source_script: Hrkt
6
+ destination_script: Latn
7
+ name: Japanese Kana Modified Hepburn 1930 System
8
+ url:
9
+ creation_date:
10
+ adoption_date:
11
+ description:
12
+
13
+ notes:
14
+ - Segmentation needs to be done before using this map
15
+ - Note 5 in the specification states that when identical repeating vowels
16
+ belong to different kanji characters, they shall be romanized
17
+ individually and an apostrophe (’) shall be placed between the vowels.
18
+ However since this is a map from Kana to Hepburn, there is no way to
19
+ implement this feature.
20
+ - The documentation did not specify how the hyphen should be used.
21
+
22
+ tests:
23
+
24
+ - source: てがた-からみでん
25
+ expected: "Tegata-karamiden"
26
+ - source: てがた-すみよしちょう
27
+ expected: "Tegata-sumiyoshichō"
28
+ - source: さいのはま
29
+ expected: "Sainohama"
30
+ - source: てがた-たなか
31
+ expected: "Tegata-tanaka"
32
+ - source: ほりおでん
33
+ expected: "Horioden"
34
+ - source: そえがわ
35
+ expected: "Soegawa"
36
+ - source: ふねがさわ
37
+ expected: "Funegasawa"
38
+ - source: とくまんだて
39
+ expected: "Tokumandate"
40
+ - source: たてない
41
+ expected: "Tatenai"
42
+ - source: つるがさき
43
+ expected: "Tsurugasaki"
44
+ - source: しもやつせ
45
+ expected: "Shimoyatsuse"
46
+ - source: かみやつせ
47
+ expected: "Kamiyatsuse"
48
+ - source: しんとうだ
49
+ expected: "Shintōda"
50
+ - source: かじのめ
51
+ expected: "Kajinome"
52
+ - source: まえぎ
53
+ expected: "Maegi"
54
+ - source: くろさわ やま
55
+ expected: "Kurosawa Yama"
56
+ - source: いちのさわ がわ
57
+ expected: "Ichinosawa Gawa"
58
+ - source: はちやまえ
59
+ expected: "Hachiyamae"
60
+ - source: やち
61
+ expected: "Yachi"
62
+ - source: たてぬま
63
+ expected: "Tatenuma"
64
+ - source: しらはま
65
+ expected: "Shirahama"
66
+ - source: けせんまち
67
+ expected: "Kesenmachi"
68
+ - source: けいだい-かわら
69
+ expected: "Keidai-kawara"
70
+ - source: いしやました
71
+ expected: "Ishiyamashita"
72
+ - source: なえひら-やち
73
+ expected: "Naehira-yachi"
74
+ - source: とみの
75
+ expected: "Tomino"
76
+ - source: あらや-たかみまち
77
+ expected: "Araya-takamimachi"
78
+ - source: ながた
79
+ expected: "Nagata"
80
+ - source: とどろき おんせん
81
+ expected: "Todoroki Onsen"
82
+ - source: かしわぎはら
83
+ expected: "Kashiwagihara"
84
+ - source: とやけもり やま
85
+ expected: "Toyakemori Yama"
86
+ - source: なかさい
87
+ expected: "Nakasai"
88
+ - source: たけした
89
+ expected: "Takeshita"
90
+ - source: みと
91
+ expected: "Mito"
92
+ - source: みなみなかさと
93
+ expected: "Minaminakasato"
94
+ - source: みずおし
95
+ expected: "Mizuoshi"
96
+ - source: なかさと
97
+ expected: "Nakasato"
98
+ - source: しんかりば
99
+ expected: "Shinkariba"
100
+ - source: しんかみぬま
101
+ expected: "Shinkaminuma"
102
+ - source: しんばし
103
+ expected: "Shinbashi"
104
+ - source: りくぜんやました えき
105
+ expected: "Rikuzen’yamashita Eki"
106
+ - source: うしじまにし
107
+ expected: "Ushijimanishi"
108
+ - source: はまえば
109
+ expected: "Hamaeba"
110
+ - source: ぬまむかい
111
+ expected: "Numamukai"
112
+ - source: さんげんやち
113
+ expected: "Sangen’yachi"
114
+ - source: にけんやち
115
+ expected: "Niken’yachi"
116
+ - source: やちなか
117
+ expected: "Yachinaka"
118
+ - source: なす がわ
119
+ expected: "Nasu Gawa"
120
+ - source: おおはらはま
121
+ expected: "Ōharahama"
122
+ - source: うるご がわ
123
+ expected: "Urugo Gawa"
124
+ - source: なかばせ
125
+ expected: "Nakabase"
126
+ - source: うと えき
127
+ expected: "Uto Eki"
128
+ - source: みずまち
129
+ expected: "Mizumachi"
130
+ - source: ごんげんどう
131
+ expected: "Gongendō"
132
+ - source: いとひさ
133
+ expected: "Itohisa"
134
+ - source: あらおい
135
+ expected: "Araoi"
136
+ - source: わんめ
137
+ expected: "Wanme"
138
+ - source: かじろ
139
+ expected: "Kajiro"
140
+ - source: みやばら
141
+ expected: "Miyabara"
142
+ - source: いまどみ
143
+ expected: "Imadomi"
144
+ - source: かいほ
145
+ expected: "Kaiho"
146
+ - source: かいほ ぼえん
147
+ expected: "Kaiho Boen"
148
+ - source: ひきだ
149
+ expected: "Hikida"
150
+ - source: あさい-こむかい
151
+ expected: "Asai-komukai"
152
+ - source: こうざか
153
+ expected: "Kōzaka"
154
+ - source: こうふうだい
155
+ expected: "Kōfūdai"
156
+ - source: たての
157
+ expected: "Tateno"
158
+ - source: センター
159
+ expected: "Sentā"
160
+ - source: フィリピン
161
+ expected: "Firipin"
162
+ - source: ヴィオリン
163
+ expected: "Viorin"
164
+ - source: クォーター
165
+ expected: "Kwōtā"
166
+ - source: パッチリ
167
+ expected: "Patchiri"
168
+ - source: ぽっぽっや
169
+ expected: "Poppoyya"
170
+
171
+ map:
172
+ character_separator: ""
173
+ word_separator: " "
174
+ title_case: True
175
+ inherit: var-jpn-Hrkt-Latn-hepburn-1954
176
+
177
+ characters:
178
+ # Rare sounds, Table 2 & 4
179
+
180
+ "くぁ": "kwa"
181
+ "クァ": "kwa"
182
+ "ぐぁ": "gwa"
183
+ "グァ": "gwa"
184
+ "くぃ": "kwi"
185
+ "クィ": "kwi"
186
+ "ぐぃ": "gwi"
186
+ "グィ": "gwi"
188
+ "きぇ": "kye"
189
+ "キェ": "kye"
190
+ "ぎぇ": "gye"
191
+ "ギェ": "gye"
192
+ "くぇ": "kwe"
193
+ "クェ": "kwe"
194
+ "ぐぇ": "gwe"
195
+ "グェ": "gwe"
196
+ "くぉ": "kwo"
197
+ "クォ": "kwo"
198
+ "ぐぉ": "gwo"
199
+ "グォ": "gwo"
200
+ "しぇ": "she"
201
+ "シェ": "she"
202
+ "じぇ": "je"
203
+ "ジェ": "je"
204
+ "つぁ": "tsa"
205
+ "ツァ": "tsa"
206
+ "てぃ": "ti"
207
+ "ティ": "ti"
208
+ "でぃ": "di"
209
+ "ディ": "di"
210
+ "てゅ": "tyu"
211
+ "テュ": "tyu"
212
+ "でゅ": "dyu"
213
+ "デュ": "dyu"
214
+ "とぅ": "tu"
214
+ "トゥ": "tu"
215
+ "どぅ": "du"
216
+ "ドゥ": "du"
218
+ "ちぇ": "che"
219
+ "チェ": "che"
220
+ "ぢぇ": "je"
221
+ "ヂェ": "je"
222
+ "つぇ": "tse"
223
+ "ツェ": "tse"
224
+ "つぉ": "tso"
225
+ "ツォ": "tso"
226
+ "にぇ": "nye"
227
+ "ニェ": "nye"
228
+ "ふぁ": "fa"
229
+ "ファ": "fa"
230
+ "ふぃ": "fi"
231
+ "フィ": "fi"
232
+ "ふぇ": "fe"
233
+ "フェ": "fe"
234
+ "ふぉ": "fo"
235
+ "フォ": "fo"
236
+ "みぇ": "mye"
237
+ "ミェ": "mye"
238
+ "いぇ": "ye"
238
+ "イェ": "ye"
240
+ "りぇ": "rye"
241
+ "リェ": "rye"
242
+ "ゔぁ": "va"
243
+ "ヴァ": "va"
244
+ "うぃ": "wi"
245
+ "ウィ": "wi"
246
+ "ゔぃ": "vi"
247
+ "ヴィ": "vi"
248
+ "うぇ": "we"
249
+ "ウェ": "we"
250
+ "ゔぇ": "ve"
251
+ "ヴェ": "ve"
252
+ "うぉ": "wo"
253
+ "ウォ": "wo"
254
+ "ゔぉ": "vo"
255
+ "ヴォ": "vo"
256
+ "ゔ": "vu"
257
+ "ヴ": "vu"
@@ -0,0 +1,127 @@
1
+ ---
2
+ authority_id: bgnpcgn
3
+ id: 1981
4
+ language: kat
5
+ source_script: Geor
6
+ destination_script: Latn
7
+ name: ROMANIZATION OF GEORGIAN; BGN/PCGN 1981 System
8
+ url: https://transliteration.eki.ee/pdf/Georgian.pdf
9
+ creation_date: 1981
10
+ confirmation_date: 1981
11
+ description: |
12
+ BGN/PCGN system of 1981.
13
+
14
+ notes:
15
+
16
+ tests:
17
+ - source: ჰებუდი
18
+ expected: hebudi
19
+
20
+ - source: ჯვრის წყალსაცავი
21
+ expected: jvris tsqalsats’avi
22
+
23
+ - source: ჯვავიაკვარა
24
+ expected: jvaviak’vara
25
+
26
+ - source: ჯობრია
27
+ expected: jobria
28
+
29
+ - source: ძულუხირა
30
+ expected: dzulukhira
31
+
32
+ - source: ლეკუხონა
33
+ expected: lek’ukhona
34
+
35
+ - source: აბაშა
36
+ expected: abasha
37
+
38
+ - source: ააცი
39
+ expected: aats’i
40
+
41
+ # TODO: Determine which romanization system this example belongs to.
42
+ # - source: აბააჟახვუ
43
+ # expected: abaazhvakhu
44
+
45
+ # TODO: These examples from GNDB are clearly using the BGNPCGN 2009 system
46
+ #
47
+ # - source: ხობის მუნიციპალიტეტი
48
+ # expected: khobis munitsip’alit’et’i
49
+ #
50
+ # - source: მყინვარი ჩრდილოეთი ლეადაშატი
51
+ # expected: mq’invari chrdiloeti leadashat’i
52
+ #
53
+ # - source: ხეწკვარა
54
+ # expected: khets’k’vara
55
+ #
56
+ # - source: ჯამპალი
57
+ # expected: jamp’ali
58
+ #
59
+ # - source: ჯავის მუნიციპალიტეტი
60
+ # expected: javis munitsip’alit’et’i
61
+ #
62
+ # - source: ხოიჯგეთა
63
+ # expected: khoijgeta
64
+ #
65
+ # - source: ხობის მუნიციპალიტეტი
66
+ # expected: khobis munitsip’alit’et’i
67
+ #
68
+ # - source: წვიშარხუ
69
+ # expected: ts’visharkhu
70
+ # - source: აღმოსავლეთი გუმისთა
71
+ # expected: aghmosavleti gumista
72
+ #
73
+ # - source: ქვემო ბირცხა
74
+ # expected: kvemo birtskha
75
+ #
76
+ # - source: ზემო ბირცხა
77
+ # expected: zemo birtskha
78
+ #
79
+ # - source: აბჟაყვა
80
+ # expected: abzhaq’va
81
+
82
+
83
+
84
+ map:
85
+ characters:
86
+ '\u10d0' : 'a' # ა
87
+ '\u10d1' : 'b' # ბ
88
+ '\u10d2' : 'g' # გ
89
+ '\u10d3' : 'd' # დ
90
+ '\u10d4' : 'e' # ე
91
+ '\u10d5' : 'v' # ვ
92
+ '\u10d6' : 'z' # ზ
93
+
94
+ '\u10f1' : 'ey' # ჱ
95
+
96
+ '\u10d7' : 't’' # თ
97
+ '\u10d8' : 'i' # ი
98
+ '\u10d9' : 'k’' # კ
99
+ '\u10da' : 'l' # ლ
100
+ '\u10db' : 'm' # მ
101
+ '\u10dc' : 'n' # ნ
102
+
103
+ '\u10f2' : 'j' # ჲ
104
+
105
+ '\u10dd' : 'o' # ო
106
+ '\u10de' : 'p' # პ
107
+ '\u10df' : 'zh' # ჟ
108
+ '\u10e0' : 'r' # რ
109
+ '\u10e1' : 's' # ს
110
+ '\u10e2' : 't' # ტ
111
+ '\u10e3' : 'u' # უ
112
+ '\u10e4' : 'p’' # ფ
113
+ '\u10e5' : 'k’' # ქ
114
+ '\u10e6' : 'gh' # ღ
115
+ '\u10e7' : 'q' # ყ
116
+ '\u10e8' : 'sh' # შ
117
+ '\u10e9' : 'ch’' # ჩ
118
+ '\u10ea' : 'ts’' # ც
119
+ '\u10eb' : 'dz' # ძ
120
+ '\u10ec' : 'ts' # წ
121
+ '\u10ed' : 'ch' # ჭ
122
+ '\u10ee' : 'kh' # ხ
123
+
124
+ '\u10f4' : 'q’' # ჴ
125
+
126
+ '\u10ef' : 'j' # ჯ
127
+ '\u10f0' : 'h' # ჰ
@@ -0,0 +1,43 @@
1
+ ---
2
+ authority_id: bgnpcgn
3
+ id: 2009
4
+ language: kat
5
+ source_script: Geor
6
+ destination_script: Latn
7
+ name: ROMANIZATION OF GEORGIAN; Georgia 2011 national system; BGN/PCGN 2009 Agreement
8
+ url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/810202/ROMANIZATION_OF_GEORGIAN.pdf
9
+ creation_date: 2009
10
+ confirmation_date: 2011
11
+ description: |
12
+ This romanization system corresponds to that devised in 2002 by the
13
+ State Department of Geodesy and Cartography of Georgia and the
14
+ Institute of Linguistics of the Georgian Academy of Sciences, and
15
+ approved by Presidential Decree 109 of 24 February 2011. It represents
16
+ the Mkhedruli alphabet, as presently used in Georgia. This system was
17
+ adopted by BGN and PCGN in 2009, superseding the BGN/PCGN system of
18
+ 1981.
19
+
20
+ notes:
21
+ - This system denotes ejective (glottalised) consonants by means of
22
+ an apostrophe. The BGN/PCGN 1981 system instead used the apostrophe to
23
+ denote aspirated consonants (letters 8, 21, 22, 26 & 27).
24
+ - The Romanization columns show only lowercase forms but, when
25
+ romanizing, uppercase and lowercase Roman letters as appropriate should
26
+ be used.
27
+
28
+ tests:
29
+ - source: თბილისი
30
+ expected: tbilisi
31
+
32
+ - source: მეღვინეთუხუცესი
33
+ expected: meghvinetukhutsesi
34
+
35
+ - source: ჭიანჭველა
36
+ expected: ch’ianch’vela
37
+
38
+ - source: ბაყაყი
39
+ expected: baq’aq’i
40
+
41
+ map:
42
+ inherit: "ggg-kat-Geor-Latn-2002"
43
+