interscript 0.1.2 → 0.1.3

Sign up to get free protection for your applications and to get access to all the features.
Files changed (120) hide show
  1. checksums.yaml +4 -4
  2. data/README.adoc +246 -14
  3. data/bin/interscript +38 -17
  4. data/bin/setup +8 -0
  5. data/lib/g2pwrapper.py +34 -0
  6. data/lib/interscript.rb +140 -16
  7. data/lib/interscript/command.rb +27 -0
  8. data/lib/interscript/mapping.rb +125 -0
  9. data/lib/interscript/version.rb +1 -1
  10. data/lib/model-7 +0 -0
  11. data/lib/tha-pt-b-7 +0 -0
  12. data/maps/acadsin-zho-Hani-Latn-2002.yaml +38912 -0
  13. data/maps/alalc-bel-cyrl-latn-1997.yaml +125 -0
  14. data/maps/alalc-ben-Beng-Latn-2017.yaml +130 -0
  15. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +94 -0
  16. data/maps/alalc-ell-Grek-Latn-1997.yaml +625 -0
  17. data/maps/alalc-ell-Grek-Latn-2010.yaml +628 -0
  18. data/maps/alalc-kat-Geok-Latn-1997.yaml +112 -0
  19. data/maps/alalc-kat-Geor-Latn-1997.yaml +146 -0
  20. data/maps/alalc-kor-Hang-Latn-1997.yaml +94 -0
  21. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +103 -0
  22. data/maps/alalc-mkd-cyrl-latn-1997.yaml +114 -0
  23. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +114 -0
  24. data/maps/alalc-srp-cyrl-latn-2013.yaml +135 -0
  25. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +141 -0
  26. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +16 -0
  27. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +283 -0
  28. data/maps/{bas-rus-Cyrl-Latn-bss.yaml → bas-rus-Cyrl-Latn-2017-bss.yaml} +57 -31
  29. data/maps/{bas-rus-Cyrl-Latn-oss.yaml → bas-rus-Cyrl-Latn-2017-oss.yaml} +54 -34
  30. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +294 -0
  31. data/maps/bgn-kor-Hang-Latn-1943.yaml +31 -0
  32. data/maps/bgn-kor-Kore-Latn-1943.yaml +31 -0
  33. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +208 -0
  34. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +208 -0
  35. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +1 -2
  36. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +104 -0
  37. data/maps/bgnpcgn-bel-cyrl-latn-1979.yaml +285 -0
  38. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +115 -0
  39. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +10 -64
  40. data/maps/bgnpcgn-chn-Hans-Latn-1979.yaml +7456 -0
  41. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +702 -0
  42. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +20 -0
  43. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +257 -0
  44. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +127 -0
  45. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +43 -0
  46. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +253 -0
  47. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +48 -0
  48. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +48 -0
  49. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +159 -0
  50. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +190 -0
  51. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +145 -64
  52. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +166 -0
  53. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +75 -2
  54. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +208 -0
  55. data/maps/by-bel-Cyrl-Latn-1998.yaml +168 -0
  56. data/maps/by-bel-Cyrl-Latn-2007.yaml +115 -0
  57. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +685 -0
  58. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +681 -0
  59. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +20 -0
  60. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +32 -0
  61. data/maps/ggg-kat-Geor-Latn-2002.yaml +89 -0
  62. data/maps/gki-bel-cyrl-latn-1992.yaml +33 -0
  63. data/maps/gki-bel-cyrl-latn-2000.yaml +201 -0
  64. data/maps/gost-rus-cyrl-latn-16876-71-1983.yaml +186 -0
  65. data/maps/hk-yue-Hani-Latn-1888.yaml +38497 -0
  66. data/maps/icao-bel-Cyrl-Latn-9303.yaml +108 -92
  67. data/maps/icao-bul-Cyrl-Latn-9303.yaml +1 -2
  68. data/maps/icao-heb-Hebr-Latn-9303.yaml +118 -124
  69. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +1 -2
  70. data/maps/icao-per-Arab-Latn-9303.yaml +5 -6
  71. data/maps/icao-rus-Cyrl-Latn-9303.yaml +1 -2
  72. data/maps/icao-srp-Cyrl-Latn-9303.yaml +1 -2
  73. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +1 -2
  74. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +610 -0
  75. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +41 -0
  76. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +62 -0
  77. data/maps/{iso-rus-Cyrl-Latn-iso9.yaml → iso-rus-Cyrl-Latn-9-1995.yaml} +2 -3
  78. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +109 -0
  79. data/maps/kp-kor-Hang-Latn-2002.yaml +901 -0
  80. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +44820 -0
  81. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +411 -0
  82. data/maps/moct-kor-Hang-Latn-2000.yaml +803 -0
  83. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +541 -0
  84. data/maps/nil-kor-Hang-Hang-jamo.yaml +11193 -0
  85. data/maps/odni-kat-Geor-Latn-2015.yaml +88 -0
  86. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +157 -0
  87. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +90 -0
  88. data/maps/royin-tha-Thai-Latn-1968.yaml +179 -0
  89. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +180 -0
  90. data/maps/royin-tha-Thai-Latn-1999.yaml +76 -0
  91. data/maps/{cn-chn-Hans-Latn-pinyin.yaml → sac-zho-Hans-Latn-1979.yaml} +6 -7
  92. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +222 -0
  93. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +193 -0
  94. data/maps/un-bel-Cyrl-Latn-2007.yaml +114 -0
  95. data/maps/un-ben-Beng-Latn-2016.yaml +534 -0
  96. data/maps/un-ell-Grek-Latn-1987-tl.yaml +32 -0
  97. data/maps/un-ell-Grek-Latn-1987-ts.yaml +20 -0
  98. data/maps/un-ell-Grek-Latn-phonetic-1987.yaml +780 -0
  99. data/maps/un-mon-Mong-Latn-2013.yaml +19 -6
  100. data/maps/un-rus-Cyrl-Latn-1987.yaml +166 -0
  101. data/maps/un-ukr-cyrl-latn-1998.yaml +30 -0
  102. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +406 -0
  103. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +386 -0
  104. data/maps/var-kor-Hang-Latn-mr-1939.yaml +1054 -0
  105. data/maps/var-kor-Kore-Hang-2013.yaml +59754 -0
  106. data/maps/var-kor-Kore-Latn-mr-1939.yaml +37 -0
  107. data/maps/var-tha-Thai-Thai-phonemic.yaml +59 -0
  108. data/maps/var-tha-Thai-Zsym-ipa.yaml +301 -0
  109. data/maps/var-zho-Hani-Latn-1979.yaml +38908 -0
  110. data/spec/interscript/mapping_spec.rb +42 -0
  111. data/spec/interscript_spec.rb +20 -5
  112. data/spec/spec_helper.rb +3 -1
  113. metadata +149 -24
  114. data/maps/bgnpcgn-chn-Hans-Latn-pinyin.yaml +0 -7503
  115. data/maps/historic-jpn-Hrkt-Latn-hepburn.yaml +0 -336
  116. data/maps/icao-gre-Grek-Latn-9303.yaml +0 -101
  117. data/maps/mext-jpn-Hrkt-Latn-hepburn.yaml +0 -330
  118. data/maps/mext-jpn-Hrkt-Latn-kunrei.yaml +0 -308
  119. data/maps/un-jpn-Hrkt-Latn-hepburn.yaml +0 -313
  120. data/maps/un-jpn-Hrkt-Latn-kunrei.yaml +0 -354
@@ -1,354 +0,0 @@
1
- ---
2
- authority_id: un
3
- id: kunrei
4
- language: jpn
5
- source_script: Hrkt
6
- destination_script: Latn
7
- name: Romanization of Japanese, Kunrei-siki
8
- url: https://unstats.un.org/unsd/geoinfo/UNGEGN/docs/9th-uncsgn-docs/econf/9th_UNCSGN_e-conf-98-47-add1.pdf
9
- creation_date: 2007
10
- adoption_date: 2007-06-29
11
- description: |
12
- The official romanization system for Japanese is the Kunrei-siki.
13
- It was officially adopted on 9 December 1954 (Cabinet Notification No. 1, table 1).
14
-
15
- notes:
16
- - A small-script tu/tsu form (ッ / っ) is inserted between kana symbols to indicate a double consonant (kk, ss, tt, pp in Kunrei-siki).
17
- - ン / ん is always romanized as n in Kunrei-siki; when it is necessary to separate the sound n from a following vowel or y, an apostrophe is added after the n.
18
- - Long vowels are expressed in Kunrei-siki by placing a circumflex (^) over a vowel.
19
- - The combination in parentheses is used to denote the word meaning ‘big, great’.
20
-
21
- tests:
22
- - source: かんおう
23
- expected: kanô #kan'ô
24
- - source: かのう
25
- expected: kanô
26
- - source: きんゆう
27
- expected: kinyû # kin'yû
28
- - source: きにゅう
29
- expected: kinyû
30
- - source: とうきょう
31
- expected: tôkyô
32
-
33
- map:
34
- characters:
35
- "あ": "a"
36
- "い": "i"
37
- "う": "u"
38
- "え": "e"
39
- "お": "o"
40
-
41
- "か": "ka"
42
- "き": "ki"
43
- "く": "ku"
44
- "け": "ke"
45
- "こ": "ko"
46
-
47
- "さ": "sa"
48
- "し": "si"
49
- "す": "su"
50
- "せ": "se"
51
- "そ": "so"
52
-
53
- "た": "ta"
54
- "ち": "ti"
55
- "つ": "tu" # See note 1
56
- "て": "te"
57
- "と": "to"
58
-
59
- "な": "na"
60
- "に": "ni"
61
- "ぬ": "nu"
62
- "ね": "ne"
63
- "の": "no"
64
-
65
- "は": "ha"
66
- "ひ": "hi"
67
- "ふ": "hu"
68
- "へ": "he"
69
- "ほ": "ho"
70
-
71
- "ま": "ma"
72
- "み": "mi"
73
- "む": "mu"
74
- "め": "me"
75
- "も": "mo"
76
-
77
- "ら": "ra"
78
- "り": "ri"
79
- "る": "ru"
80
- "れ": "re"
81
- "ろ": "ro"
82
-
83
- "わ": "wa"
84
- "を": "o"
85
-
86
- "ん": "n" # See note 2
87
-
88
- "が": "ga"
89
- "ぎ": "gi"
90
- "ぐ": "gu"
91
- "げ": "ge"
92
- "ご": "go"
93
-
94
- "ざ": "za"
95
- "じ": "zi"
96
- "ず": "zu"
97
- "ぜ": "ze"
98
- "ぞ": "zo"
99
-
100
- "だ": "da"
101
- "ぢ": "di"
102
- "づ": "du"
103
- "で": "de"
104
- "ど": "do"
105
-
106
- "ば": "ba"
107
- "び": "bi"
108
- "ぶ": "bu"
109
- "べ": "be"
110
- "ぼ": "bo"
111
-
112
- "ぱ": "pa"
113
- "ぴ": "pi"
114
- "ぷ": "pu"
115
- "ぺ": "pe"
116
- "ぽ": "po"
117
-
118
- "おぅ": "ô"
119
- "おお": "ô" # See note 4
120
-
121
- # Officially only kya kyu kyo??
122
- "きゃ": "kya"
123
- "きゅ": "kyu"
124
- "きゅぅ": "kyû"
125
- "きょ": "kyo"
126
- "きょぅ": "kyô"
127
-
128
- # Does not officially exist?
129
- "こぅ": "kô"
130
-
131
- # Officially only sya syu syo??
132
- "しゃ": "sya"
133
- "しゅ": "syu"
134
- "しゅぅ": "syû"
135
- "しょ": "syo"
136
- "しょぅ": "syô"
137
-
138
- # Supplementary
139
- "ゃ": "ya"
140
- "ゅ": "yu"
141
- "ょ": "yo"
142
- "ぅ": "u"
143
- "ょぅ": "yô"
144
- "ゅぅ": "yû"
145
-
146
- # Does not officially exist?
147
- "そぅ": "sô"
148
-
149
- # Officially only tya tyu tyo??
150
- "ちゃ": "tya"
151
- "ちゅ": "tyu"
152
- "ちゅぅ": "tyû"
153
- "ちょ": "tyo"
154
- "ちょぅ": "tyô"
155
-
156
- # Does not officially exist?
157
- "とぅ": "tô"
158
-
159
- # Officially only nya nyu nyo??
160
- "にゃ": "nya"
161
- "にゅ": "nyu"
162
- "にゅぅ": "nyû"
163
- "にょ": "nyo"
164
- "にょぅ": "nyô"
165
-
166
- # Does not officially exist?
167
- "のぅ": "nô"
168
-
169
- "ひゃ": "hya"
170
- "ひゅ": "hyu"
171
- "ひゅぅ": "hyû"
172
- "ひょ": "hyo"
173
- "ひょぅ": "hyô"
174
- "ほぅ": "hô"
175
- "みゃ": "mya"
176
- "みゅ": "myu"
177
- "みゅぅ": "myû"
178
- "みょ": "myo"
179
- "みょぅ": "myô"
180
- "もぅ": "mô"
181
- "よぅ": "yô"
182
- "りゃ": "rya"
183
- "りゅ": "ryu"
184
- "りゅぅ": "ryû"
185
- "りょ": "ryo"
186
- "りょぅ": "ryô"
187
- "ろぅ": "rô"
188
- "ぎゃ": "gya"
189
- "ぎゅ": "gyu"
190
- "ぎゅぅ": "gyû"
191
- "ぎょ": "gyo"
192
- "ぎょぅ": "gyô"
193
- "ごぅ": "gô"
194
- "じゃ": "zya"
195
- "じゅ": "zyu"
196
- "じゅぅ": "zyû"
197
- "じょ": "zyo"
198
- "じょぅ": "zyô"
199
- "ぞぅ": "zô"
200
- "どぅ": "dô"
201
- "びゃ": "bya"
202
- "びゅ": "byu"
203
- "びゅぅ": "byû"
204
- "びょ": "byo"
205
- "びょぅ": "byô"
206
- "ぼぅ": "bô"
207
- "ぴゃ": "pya"
208
- "ぴゅ": "pyu"
209
- "ぴゅぅ": "pyû"
210
- "ぴょ": "pyo"
211
- "ぴょぅ": "pyô"
212
- "ぽぅ": "pô"
213
-
214
-
215
- "ア": "a"
216
- "イ": "i"
217
- "ウ": "u"
218
- "エ": "e"
219
- "オ": "o"
220
- "カ": "ka"
221
- "キ": "ki"
222
- "ク": "ku"
223
- "ケ": "ke"
224
- "コ": "ko"
225
- "サ": "sa"
226
- "シ": "si"
227
- "ス": "su"
228
- "セ": "se"
229
- "ソ": "so"
230
- "タ": "ta"
231
- "チ": "ti"
232
- "ツ": "tu" # See note 1
233
- "テ": "te"
234
- "ト": "to"
235
- "ナ": "na"
236
- "ニ": "ni"
237
- "ヌ": "nu"
238
- "ネ": "ne"
239
- "ノ": "no"
240
- "ハ": "ha"
241
- "ヒ": "hi"
242
- "フ": "hu"
243
- "ヘ": "he"
244
- "ホ": "ho"
245
- "マ": "ma"
246
- "ミ": "mi"
247
- "ム": "mu"
248
- "メ": "me"
249
- "モ": "mo"
250
- "ヤ": "ya"
251
- "ユ": "yu"
252
- "ヨ": "yo"
253
- "ラ": "ra"
254
- "リ": "ri"
255
- "ル": "ru"
256
- "レ": "re"
257
- "ロ": "ro"
258
- "ワ": "wa"
259
- "ン": "n" # See note 2
260
- "ガ": "ga"
261
- "ギ": "gi"
262
- "グ": "gu"
263
- "ゲ": "ge"
264
- "ゴ": "go"
265
- "ザ": "za"
266
- "ジ": "zi"
267
- "ズ": "zu"
268
- "ゼ": "ze"
269
- "ゾ": "zo"
270
- "ダ": "da"
271
- "ヂ": "di"
272
- "ヅ": "du"
273
- "デ": "de"
274
- "ド": "do"
275
- "バ": "ba"
276
- "ビ": "bi"
277
- "ブ": "bu"
278
- "ベ": "be"
279
- "ボ": "bo"
280
- "パ": "pa"
281
- "ピ": "pi"
282
- "プ": "pu"
283
- "ペ": "pe"
284
- "ポ": "po"
285
- "オゥ": "ô"
286
- "オオ": "ô" # See note 4
287
- "キャ": "kya"
288
- "キュ": "kyu"
289
- "キュゥ": "kyû"
290
- "キョ": "kyo"
291
- "キョゥ": "kyô"
292
- "コゥ": "kô"
293
- "シャ": "sya"
294
- "シュ": "syu"
295
- "シュゥ": "syû"
296
- "ショ": "syo"
297
- "ショゥ": "syô"
298
- "ソゥ": "sô"
299
- "チャ": "tya"
300
- "チュ": "tyu"
301
- "チュゥ": "tyû"
302
- "チョ": "tyo"
303
- "チョゥ": "tyô"
304
- "トゥ": "tô"
305
- "ニャ": "nya"
306
- "ニュ": "nyu"
307
- "ニュゥ": "nyû"
308
- "ニョ": "nyo"
309
- "ニョゥ": "nyô"
310
- "ノゥ": "nô"
311
- "ヒャ": "hya"
312
- "ヒュ": "hyu"
313
- "ヒュゥ": "hyû"
314
- "ヒョ": "hyo"
315
- "ヒョゥ": "hyô"
316
- "ホゥ": "hô"
317
- "ミャ": "mya"
318
- "ミュ": "myu"
319
- "ミュゥ": "myû"
320
- "ミョ": "myo"
321
- "ミョゥ": "myô"
322
- "モゥ": "mô"
323
- "ヨゥ": "yô"
324
- "リャ": "rya"
325
- "リュ": "ryu"
326
- "リュゥ": "ryû"
327
- "リョ": "ryo"
328
- "リョゥ": "ryô"
329
- "ロゥ": "rô"
330
- "ギャ": "gya"
331
- "ギュ": "gyu"
332
- "ギュゥ": "gyû"
333
- "ギョ": "gyo"
334
- "ギョゥ": "gyô"
335
- "ゴゥ": "gô"
336
- "ジャ": "zya"
337
- "ジュ": "zyu"
338
- "ジュゥ": "zyû"
339
- "ジョ": "zyo"
340
- "ジョゥ": "zyô"
341
- "ゾゥ": "zô"
342
- "ドゥ": "dô"
343
- "ビャ": "bya"
344
- "ビュ": "byu"
345
- "ビュゥ": "byû"
346
- "ビョ": "byo"
347
- "ビョゥ": "byô"
348
- "ボゥ": "bô"
349
- "ピャ": "pya"
350
- "ピュ": "pyu"
351
- "ピュゥ": "pyû"
352
- "ピョ": "pyo"
353
- "ピョゥ": "pyô"
354
- "ポゥ": "pô"