interscript 0.1.2 → 0.1.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (120) hide show
  1. checksums.yaml +4 -4
  2. data/README.adoc +246 -14
  3. data/bin/interscript +38 -17
  4. data/bin/setup +8 -0
  5. data/lib/g2pwrapper.py +34 -0
  6. data/lib/interscript.rb +140 -16
  7. data/lib/interscript/command.rb +27 -0
  8. data/lib/interscript/mapping.rb +125 -0
  9. data/lib/interscript/version.rb +1 -1
  10. data/lib/model-7 +0 -0
  11. data/lib/tha-pt-b-7 +0 -0
  12. data/maps/acadsin-zho-Hani-Latn-2002.yaml +38912 -0
  13. data/maps/alalc-bel-cyrl-latn-1997.yaml +125 -0
  14. data/maps/alalc-ben-Beng-Latn-2017.yaml +130 -0
  15. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +94 -0
  16. data/maps/alalc-ell-Grek-Latn-1997.yaml +625 -0
  17. data/maps/alalc-ell-Grek-Latn-2010.yaml +628 -0
  18. data/maps/alalc-kat-Geok-Latn-1997.yaml +112 -0
  19. data/maps/alalc-kat-Geor-Latn-1997.yaml +146 -0
  20. data/maps/alalc-kor-Hang-Latn-1997.yaml +94 -0
  21. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +103 -0
  22. data/maps/alalc-mkd-cyrl-latn-1997.yaml +114 -0
  23. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +114 -0
  24. data/maps/alalc-srp-cyrl-latn-2013.yaml +135 -0
  25. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +141 -0
  26. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +16 -0
  27. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +283 -0
  28. data/maps/{bas-rus-Cyrl-Latn-bss.yaml → bas-rus-Cyrl-Latn-2017-bss.yaml} +57 -31
  29. data/maps/{bas-rus-Cyrl-Latn-oss.yaml → bas-rus-Cyrl-Latn-2017-oss.yaml} +54 -34
  30. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +294 -0
  31. data/maps/bgn-kor-Hang-Latn-1943.yaml +31 -0
  32. data/maps/bgn-kor-Kore-Latn-1943.yaml +31 -0
  33. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +208 -0
  34. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +208 -0
  35. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +1 -2
  36. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +104 -0
  37. data/maps/bgnpcgn-bel-cyrl-latn-1979.yaml +285 -0
  38. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +115 -0
  39. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +10 -64
  40. data/maps/bgnpcgn-chn-Hans-Latn-1979.yaml +7456 -0
  41. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +702 -0
  42. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +20 -0
  43. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +257 -0
  44. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +127 -0
  45. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +43 -0
  46. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +253 -0
  47. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +48 -0
  48. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +48 -0
  49. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +159 -0
  50. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +190 -0
  51. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +145 -64
  52. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +166 -0
  53. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +75 -2
  54. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +208 -0
  55. data/maps/by-bel-Cyrl-Latn-1998.yaml +168 -0
  56. data/maps/by-bel-Cyrl-Latn-2007.yaml +115 -0
  57. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +685 -0
  58. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +681 -0
  59. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +20 -0
  60. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +32 -0
  61. data/maps/ggg-kat-Geor-Latn-2002.yaml +89 -0
  62. data/maps/gki-bel-cyrl-latn-1992.yaml +33 -0
  63. data/maps/gki-bel-cyrl-latn-2000.yaml +201 -0
  64. data/maps/gost-rus-cyrl-latn-16876-71-1983.yaml +186 -0
  65. data/maps/hk-yue-Hani-Latn-1888.yaml +38497 -0
  66. data/maps/icao-bel-Cyrl-Latn-9303.yaml +108 -92
  67. data/maps/icao-bul-Cyrl-Latn-9303.yaml +1 -2
  68. data/maps/icao-heb-Hebr-Latn-9303.yaml +118 -124
  69. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +1 -2
  70. data/maps/icao-per-Arab-Latn-9303.yaml +5 -6
  71. data/maps/icao-rus-Cyrl-Latn-9303.yaml +1 -2
  72. data/maps/icao-srp-Cyrl-Latn-9303.yaml +1 -2
  73. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +1 -2
  74. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +610 -0
  75. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +41 -0
  76. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +62 -0
  77. data/maps/{iso-rus-Cyrl-Latn-iso9.yaml → iso-rus-Cyrl-Latn-9-1995.yaml} +2 -3
  78. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +109 -0
  79. data/maps/kp-kor-Hang-Latn-2002.yaml +901 -0
  80. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +44820 -0
  81. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +411 -0
  82. data/maps/moct-kor-Hang-Latn-2000.yaml +803 -0
  83. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +541 -0
  84. data/maps/nil-kor-Hang-Hang-jamo.yaml +11193 -0
  85. data/maps/odni-kat-Geor-Latn-2015.yaml +88 -0
  86. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +157 -0
  87. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +90 -0
  88. data/maps/royin-tha-Thai-Latn-1968.yaml +179 -0
  89. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +180 -0
  90. data/maps/royin-tha-Thai-Latn-1999.yaml +76 -0
  91. data/maps/{cn-chn-Hans-Latn-pinyin.yaml → sac-zho-Hans-Latn-1979.yaml} +6 -7
  92. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +222 -0
  93. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +193 -0
  94. data/maps/un-bel-Cyrl-Latn-2007.yaml +114 -0
  95. data/maps/un-ben-Beng-Latn-2016.yaml +534 -0
  96. data/maps/un-ell-Grek-Latn-1987-tl.yaml +32 -0
  97. data/maps/un-ell-Grek-Latn-1987-ts.yaml +20 -0
  98. data/maps/un-ell-Grek-Latn-phonetic-1987.yaml +780 -0
  99. data/maps/un-mon-Mong-Latn-2013.yaml +19 -6
  100. data/maps/un-rus-Cyrl-Latn-1987.yaml +166 -0
  101. data/maps/un-ukr-cyrl-latn-1998.yaml +30 -0
  102. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +406 -0
  103. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +386 -0
  104. data/maps/var-kor-Hang-Latn-mr-1939.yaml +1054 -0
  105. data/maps/var-kor-Kore-Hang-2013.yaml +59754 -0
  106. data/maps/var-kor-Kore-Latn-mr-1939.yaml +37 -0
  107. data/maps/var-tha-Thai-Thai-phonemic.yaml +59 -0
  108. data/maps/var-tha-Thai-Zsym-ipa.yaml +301 -0
  109. data/maps/var-zho-Hani-Latn-1979.yaml +38908 -0
  110. data/spec/interscript/mapping_spec.rb +42 -0
  111. data/spec/interscript_spec.rb +20 -5
  112. data/spec/spec_helper.rb +3 -1
  113. metadata +149 -24
  114. data/maps/bgnpcgn-chn-Hans-Latn-pinyin.yaml +0 -7503
  115. data/maps/historic-jpn-Hrkt-Latn-hepburn.yaml +0 -336
  116. data/maps/icao-gre-Grek-Latn-9303.yaml +0 -101
  117. data/maps/mext-jpn-Hrkt-Latn-hepburn.yaml +0 -330
  118. data/maps/mext-jpn-Hrkt-Latn-kunrei.yaml +0 -308
  119. data/maps/un-jpn-Hrkt-Latn-hepburn.yaml +0 -313
  120. data/maps/un-jpn-Hrkt-Latn-kunrei.yaml +0 -354
@@ -1,354 +0,0 @@
1
- ---
2
- authority_id: un
3
- id: kunrei
4
- language: jpn
5
- source_script: Hrkt
6
- destination_script: Latn
7
- name: Romanization of Japanese, Kunrei-siki
8
- url: https://unstats.un.org/unsd/geoinfo/UNGEGN/docs/9th-uncsgn-docs/econf/9th_UNCSGN_e-conf-98-47-add1.pdf
9
- creation_date: 2007
10
- adoption_date: 2007-06-29
11
- description: |
12
- The official romanization system for Japanese is the Kunrei-siki.
13
- It was officially adopted on 9 December, 1954 (Cabinet Notification No. 1, table 1).
14
-
15
- notes:
16
- - A small-script tu/tsu form (ッ / っ) is inserted between kana symbols to indicate a double consonant (kk, ss, tt, pp in Kunrei-siki).
17
- - ン / ん is romanized always n in Kunrei-siki; when it is necessary to separate the sound n from the vowel or y to follow, the apostrophe is added after the n.
18
- - Long vowels are expressed in Kunrei-siki by placing a circumflex (^) over a vowel.
19
- - The combination in parentheses is used to denote the word meaning ’big, great’.
20
-
21
- tests:
22
- - source: かんおう
23
- expected: kanô #kan'ô
24
- - source: かのう
25
- expected: kanô
26
- - source: きんゆう
27
- expected: kinyû # kin'yû
28
- - source: きにゅう
29
- expected: kinyû
30
- - source: とうきょう
31
- expected: tôkyô
32
-
33
- map:
34
- characters:
35
- "あ": "a"
36
- "い": "i"
37
- "う": "u"
38
- "え": "e"
39
- "お": "o"
40
-
41
- "か": "ka"
42
- "き": "ki"
43
- "く": "ku"
44
- "け": "ke"
45
- "こ": "ko"
46
-
47
- "さ": "sa"
48
- "し": "si"
49
- "す": "su"
50
- "せ": "se"
51
- "そ": "so"
52
-
53
- "た": "ta"
54
- "ち": "ti"
55
- "つ": "tu" # See note 1
56
- "て": "te"
57
- "と": "to"
58
-
59
- "な": "na"
60
- "に": "ni"
61
- "ぬ": "nu"
62
- "ね": "ne"
63
- "の": "no"
64
-
65
- "は": "ha"
66
- "ひ": "hi"
67
- "ふ": "hu"
68
- "へ": "he"
69
- "ほ": "ho"
70
-
71
- "ま": "ma"
72
- "み": "mi"
73
- "む": "mu"
74
- "め": "me"
75
- "も": "mo"
76
-
77
- "ら": "ra"
78
- "り": "ri"
79
- "る": "ru"
80
- "れ": "re"
81
- "ろ": "ro"
82
-
83
- "わ": "wa"
84
- "を": "o"
85
-
86
- "ん": "n" # See note 2
87
-
88
- "が": "ga"
89
- "ぎ": "gi"
90
- "ぐ": "gu"
91
- "げ": "ge"
92
- "ご": "go"
93
-
94
- "ざ": "za"
95
- "じ": "zi"
96
- "ず": "zu"
97
- "ぜ": "ze"
98
- "ぞ": "zo"
99
-
100
- "だ": "da"
101
- "ぢ": "di"
102
- "づ": "du"
103
- "で": "de"
104
- "ど": "do"
105
-
106
- "ば": "ba"
107
- "び": "bi"
108
- "ぶ": "bu"
109
- "べ": "be"
110
- "ぼ": "bo"
111
-
112
- "ぱ": "pa"
113
- "ぴ": "pi"
114
- "ぷ": "pu"
115
- "ぺ": "pe"
116
- "ぽ": "po"
117
-
118
- "おぅ": "ô"
119
- "おお": "ô" # See note 4
120
-
121
- # Officially only kya kyu kyo??
122
- "きゃ": "kya"
123
- "きゅ": "kyu"
124
- "きゅぅ": "kyû"
125
- "きょ": "kyo"
126
- "きょぅ": "kyô"
127
-
128
- # Officially not exists?
129
- "こぅ": "kô"
130
-
131
- # Officially only sya syu syo??
132
- "しゃ": "sya"
133
- "しゅ": "syu"
134
- "しゅぅ": "syû"
135
- "しょ": "syo"
136
- "しょぅ": "syô"
137
-
138
- # Supplementary
139
- "ゃ": "ya"
140
- "ゅ": "yu"
141
- "ょ": "yo"
142
- "ぅ": "u"
143
- "ょぅ": "yô"
144
- "ゅぅ": "yû"
145
-
146
- # Officially not exists?
147
- "そぅ": "sô"
148
-
149
- # Officially only tya tyu tyo??
150
- "ちゃ": "tya"
151
- "ちゅ": "tyu"
152
- "ちゅぅ": "tyû"
153
- "ちょ": "tyo"
154
- "ちょぅ": "tyô"
155
-
156
- # Officially not exists?
157
- "とぅ": "tô"
158
-
159
- # Officially only nya nyu nyo??
160
- "にゃ": "nya"
161
- "にゅ": "nyu"
162
- "にゅぅ": "nyû"
163
- "にょ": "nyo"
164
- "にょぅ": "nyô"
165
-
166
- # Officially not exists?
167
- "のぅ": "nô"
168
-
169
- "ひゃ": "hya"
170
- "ひゅ": "hyu"
171
- "ひゅぅ": "hyû"
172
- "ひょ": "hyo"
173
- "ひょぅ": "hyô"
174
- "ほぅ": "hô"
175
- "みゃ": "mya"
176
- "みゅ": "myu"
177
- "みゅぅ": "myû"
178
- "みょ": "myo"
179
- "みょぅ": "myô"
180
- "もぅ": "mô"
181
- "よぅ": "yô"
182
- "りゃ": "rya"
183
- "りゅ": "ryu"
184
- "りゅぅ": "ryû"
185
- "りょ": "ryo"
186
- "りょぅ": "ryô"
187
- "ろぅ": "rô"
188
- "ぎゃ": "gya"
189
- "ぎゅ": "gyu"
190
- "ぎゅぅ": "gyû"
191
- "ぎょ": "gyo"
192
- "ぎょぅ": "gyô"
193
- "ごぅ": "gô"
194
- "じゃ": "zya"
195
- "じゅ": "zyu"
196
- "じゅぅ": "zyû"
197
- "じょ": "zyo"
198
- "じょぅ": "zyô"
199
- "ぞぅ": "zô"
200
- "どぅ": "dô"
201
- "びゃ": "bya"
202
- "びゅ": "byu"
203
- "びゅぅ": "byû"
204
- "びょ": "byo"
205
- "びょぅ": "byô"
206
- "ぼぅ": "bô"
207
- "ぴゃ": "pya"
208
- "ぴゅ": "pyu"
209
- "ぴゅぅ": "pyû"
210
- "ぴょ": "pyo"
211
- "ぴょぅ": "pyô"
212
- "ぽぅ": "pô"
213
-
214
-
215
- "ア": "a"
216
- "イ": "i"
217
- "ウ": "u"
218
- "エ": "e"
219
- "オ": "o"
220
- "カ": "ka"
221
- "キ": "ki"
222
- "ク": "ku"
223
- "ケ": "ke"
224
- "コ": "ko"
225
- "サ": "sa"
226
- "シ": "si"
227
- "ス": "su"
228
- "セ": "se"
229
- "ソ": "so"
230
- "タ": "ta"
231
- "チ": "ti"
232
- "ツ": "tu" # See note 1
233
- "テ": "te"
234
- "ト": "to"
235
- "ナ": "na"
236
- "ニ": "ni"
237
- "ヌ": "nu"
238
- "ネ": "ne"
239
- "ノ": "no"
240
- "ハ": "ha"
241
- "ヒ": "hi"
242
- "フ": "hu"
243
- "ヘ": "he"
244
- "ホ": "ho"
245
- "マ": "ma"
246
- "ミ": "mi"
247
- "ム": "mu"
248
- "メ": "me"
249
- "モ": "mo"
250
- "ヤ": "ya"
251
- "ユ": "yu"
252
- "ヨ": "yo"
253
- "ラ": "ra"
254
- "リ": "ri"
255
- "ル": "ru"
256
- "レ": "re"
257
- "ロ": "ro"
258
- "ワ": "wa"
259
- "ン": "n" # See note 2
260
- "ガ": "ga"
261
- "ギ": "gi"
262
- "グ": "gu"
263
- "ゲ": "ge"
264
- "ゴ": "go"
265
- "ザ": "za"
266
- "ジ": "zi"
267
- "ズ": "zu"
268
- "ゼ": "ze"
269
- "ゾ": "zo"
270
- "ダ": "da"
271
- "ヂ": "di"
272
- "ヅ": "du"
273
- "デ": "de"
274
- "ド": "do"
275
- "バ": "ba"
276
- "ビ": "bi"
277
- "ブ": "bu"
278
- "ベ": "be"
279
- "ボ": "bo"
280
- "パ": "pa"
281
- "ピ": "pi"
282
- "プ": "pu"
283
- "ペ": "pe"
284
- "ポ": "po"
285
- "オゥ": "ô"
286
- "オオ": "ô" # See note 4
287
- "キャ": "kya"
288
- "キュ": "kyu"
289
- "キュゥ": "kyû"
290
- "キョ": "kyo"
291
- "キョゥ": "kyô"
292
- "コゥ": "kô"
293
- "シャ": "sya"
294
- "シュ": "syu"
295
- "シュゥ": "syû"
296
- "ショ": "syo"
297
- "ショゥ": "syô"
298
- "ソゥ": "sô"
299
- "チャ": "tya"
300
- "チュ": "tyu"
301
- "チュゥ": "tyû"
302
- "チョ": "tyo"
303
- "チョゥ": "tyô"
304
- "トゥ": "tô"
305
- "ニャ": "nya"
306
- "ニュ": "nyu"
307
- "ニュゥ": "nyû"
308
- "ニョ": "nyo"
309
- "ニョゥ": "nyô"
310
- "ノゥ": "nô"
311
- "ヒャ": "hya"
312
- "ヒュ": "hyu"
313
- "ヒュゥ": "hyû"
314
- "ヒョ": "hyo"
315
- "ヒョゥ": "hyô"
316
- "ホゥ": "hô"
317
- "ミャ": "mya"
318
- "ミュ": "myu"
319
- "ミュゥ": "myû"
320
- "ミョ": "myo"
321
- "ミョゥ": "myô"
322
- "モゥ": "mô"
323
- "ヨゥ": "yô"
324
- "リャ": "rya"
325
- "リュ": "ryu"
326
- "リュゥ": "ryû"
327
- "リョ": "ryo"
328
- "リョゥ": "ryô"
329
- "ロゥ": "rô"
330
- "ギャ": "gya"
331
- "ギュ": "gyu"
332
- "ギュゥ": "gyû"
333
- "ギョ": "gyo"
334
- "ギョゥ": "gyô"
335
- "ゴゥ": "gô"
336
- "ジャ": "zya"
337
- "ジュ": "zyu"
338
- "ジュゥ": "zyû"
339
- "ジョ": "zyo"
340
- "ジョゥ": "zyô"
341
- "ゾゥ": "zô"
342
- "ドゥ": "dô"
343
- "ビャ": "bya"
344
- "ビュ": "byu"
345
- "ビュゥ": "byû"
346
- "ビョ": "byo"
347
- "ビョゥ": "byô"
348
- "ボゥ": "bô"
349
- "ピャ": "pya"
350
- "ピュ": "pyu"
351
- "ピュゥ": "pyû"
352
- "ピョ": "pyo"
353
- "ピョゥ": "pyô"
354
- "ポゥ": "pô"