interscript 0.1.1 → 0.1.2

Sign up to get free protection for your applications and to get access to all the features.
@@ -0,0 +1,308 @@
1
+ ---
2
+ authority_id: mext
3
+ id: kunrei
4
+ language: jpn
5
+ source_script: Hrkt
6
+ destination_script: Latn
7
+ name: Romanization of Japanese, Kunrei-siki
8
+ url: http://www.eki.ee/wgrs/rom2_ja.htm
9
+ creation_date: 1954
10
+ adoption_date: 1954-12-09
11
+ description: |
12
+ The official romanization system for Japanese is the Kunrei-siki.
13
+ It was officially adopted on 9 December, 1954 (Cabinet Notification No. 1, table 1).
14
+
15
+ notes:
16
+ - A small-script tu/tsu form (ッ / っ) is inserted between kana symbols to indicate a double consonant (kk, ss, tt, pp in Kunrei-siki).
17
+ - ン / ん is always romanized as n in Kunrei-siki; when the n must be separated from a following vowel or y, an apostrophe is added after the n.
18
+ - Long vowels are expressed in Kunrei-siki by placing a circumflex (^) over a vowel.
19
+ - The combination おお / オオ (shown in parentheses in the source table) is used to denote the word meaning ‘big, great’.
20
+
21
+ tests:
22
+ - source: かんおう
23
+ expected: kanô #kan'ô
24
+ - source: かのう
25
+ expected: kanô
26
+ - source: きんゆう
27
+ expected: kinyû # kin'yû
28
+ - source: きにゅう
29
+ expected: kinyû
30
+ - source: とうきょう
31
+ expected: tôkyô
32
+
33
+ map:
34
+ characters:
35
+ "あ": "a"
36
+ "い": "i"
37
+ "う": "u"
38
+ "え": "e"
39
+ "お": "o"
40
+ "か": "ka"
41
+ "き": "ki"
42
+ "く": "ku"
43
+ "け": "ke"
44
+ "こ": "ko"
45
+ "さ": "sa"
46
+ "し": "si"
47
+ "す": "su"
48
+ "せ": "se"
49
+ "そ": "so"
50
+ "た": "ta"
51
+ "ち": "ti"
52
+ "つ": "tu" # See note 1
53
+ "て": "te"
54
+ "と": "to"
55
+ "な": "na"
56
+ "に": "ni"
57
+ "ぬ": "nu"
58
+ "ね": "ne"
59
+ "の": "no"
60
+ "は": "ha"
61
+ "ひ": "hi"
62
+ "ふ": "hu"
63
+ "へ": "he"
64
+ "ほ": "ho"
65
+ "ま": "ma"
66
+ "み": "mi"
67
+ "む": "mu"
68
+ "め": "me"
69
+ "も": "mo"
70
+ "ら": "ra"
71
+ "り": "ri"
72
+ "る": "ru"
73
+ "れ": "re"
74
+ "ろ": "ro"
75
+ "わ": "wa"
76
+ "ん": "n" # See note 2
77
+ "が": "ga"
78
+ "ぎ": "gi"
79
+ "ぐ": "gu"
80
+ "げ": "ge"
81
+ "ご": "go"
82
+ "ざ": "za"
83
+ "じ": "zi"
84
+ "ず": "zu"
85
+ "ぜ": "ze"
86
+ "ぞ": "zo"
87
+ "だ": "da"
88
+ "ぢ": "di"
89
+ "づ": "du"
90
+ "で": "de"
91
+ "ど": "do"
92
+ "ば": "ba"
93
+ "び": "bi"
94
+ "ぶ": "bu"
95
+ "べ": "be"
96
+ "ぼ": "bo"
97
+ "ぱ": "pa"
98
+ "ぴ": "pi"
99
+ "ぷ": "pu"
100
+ "ぺ": "pe"
101
+ "ぽ": "po"
102
+ "おぅ": "ô"
103
+ "おお": "ô" # See note 4
104
+ "きゃ": "kya"
105
+ "きゅ": "kyu"
106
+ "きゅぅ": "kyû"
107
+ "きょ": "kyo"
108
+ "きょぅ": "kyô"
109
+ "こぅ": "kô"
110
+ "しゃ": "sya"
111
+ "しゅ": "syu"
112
+ "しゅぅ": "syû"
113
+ "しょ": "syo"
114
+ "しょぅ": "syô"
115
+ "そぅ": "sô"
116
+ "ちゃ": "tya"
117
+ "ちゅ": "tyu"
118
+ "ちゅぅ": "tyû"
119
+ "ちょ": "tyo"
120
+ "ちょぅ": "tyô"
121
+ "とぅ": "tô"
122
+ "にゃ": "nya"
123
+ "にゅ": "nyu"
124
+ "にゅぅ": "nyû"
125
+ "にょ": "nyo"
126
+ "にょぅ": "nyô"
127
+ "のぅ": "nô"
128
+ "ひゃ": "hya"
129
+ "ひゅ": "hyu"
130
+ "ひゅぅ": "hyû"
131
+ "ひょ": "hyo"
132
+ "ひょぅ": "hyô"
133
+ "ほぅ": "hô"
134
+ "みゃ": "mya"
135
+ "みゅ": "myu"
136
+ "みゅぅ": "myû"
137
+ "みょ": "myo"
138
+ "みょぅ": "myô"
139
+ "もぅ": "mô"
140
+ "よぅ": "yô"
141
+ "りゃ": "rya"
142
+ "りゅ": "ryu"
143
+ "りゅぅ": "ryû"
144
+ "りょ": "ryo"
145
+ "りょぅ": "ryô"
146
+ "ろぅ": "rô"
147
+ "ぎゃ": "gya"
148
+ "ぎゅ": "gyu"
149
+ "ぎゅぅ": "gyû"
150
+ "ぎょ": "gyo"
151
+ "ぎょぅ": "gyô"
152
+ "ごぅ": "gô"
153
+ "じゃ": "zya"
154
+ "じゅ": "zyu"
155
+ "じゅぅ": "zyû"
156
+ "じょ": "zyo"
157
+ "じょぅ": "zyô"
158
+ "ぞぅ": "zô"
159
+ "どぅ": "dô"
160
+ "びゃ": "bya"
161
+ "びゅ": "byu"
162
+ "びゅぅ": "byû"
163
+ "びょ": "byo"
164
+ "びょぅ": "byô"
165
+ "ぼぅ": "bô"
166
+ "ぴゃ": "pya"
167
+ "ぴゅ": "pyu"
168
+ "ぴゅぅ": "pyû"
169
+ "ぴょ": "pyo"
170
+ "ぴょぅ": "pyô"
171
+ "ぽぅ": "pô"
172
+ "ア": "a"
173
+ "イ": "i"
174
+ "ウ": "u"
175
+ "エ": "e"
176
+ "オ": "o"
177
+ "カ": "ka"
178
+ "キ": "ki"
179
+ "ク": "ku"
180
+ "ケ": "ke"
181
+ "コ": "ko"
182
+ "サ": "sa"
183
+ "シ": "si"
184
+ "ス": "su"
185
+ "セ": "se"
186
+ "ソ": "so"
187
+ "タ": "ta"
188
+ "チ": "ti"
189
+ "ツ": "tu" # See note 1
190
+ "テ": "te"
191
+ "ト": "to"
192
+ "ナ": "na"
193
+ "ニ": "ni"
194
+ "ヌ": "nu"
195
+ "ネ": "ne"
196
+ "ノ": "no"
197
+ "ハ": "ha"
198
+ "ヒ": "hi"
199
+ "フ": "hu"
200
+ "ヘ": "he"
201
+ "ホ": "ho"
202
+ "マ": "ma"
203
+ "ミ": "mi"
204
+ "ム": "mu"
205
+ "メ": "me"
206
+ "モ": "mo"
207
+ "ラ": "ra"
208
+ "リ": "ri"
209
+ "ル": "ru"
210
+ "レ": "re"
211
+ "ロ": "ro"
212
+ "ワ": "wa"
213
+ "ン": "n" # See note 2
214
+ "ガ": "ga"
215
+ "ギ": "gi"
216
+ "グ": "gu"
217
+ "ゲ": "ge"
218
+ "ゴ": "go"
219
+ "ザ": "za"
220
+ "ジ": "zi"
221
+ "ズ": "zu"
222
+ "ゼ": "ze"
223
+ "ゾ": "zo"
224
+ "ダ": "da"
225
+ "ヂ": "di"
226
+ "ヅ": "du"
227
+ "デ": "de"
228
+ "ド": "do"
229
+ "バ": "ba"
230
+ "ビ": "bi"
231
+ "ブ": "bu"
232
+ "ベ": "be"
233
+ "ボ": "bo"
234
+ "パ": "pa"
235
+ "ピ": "pi"
236
+ "プ": "pu"
237
+ "ペ": "pe"
238
+ "ポ": "po"
239
+ "オゥ": "ô"
240
+ "オオ": "ô" # See note 4
241
+ "キャ": "kya"
242
+ "キュ": "kyu"
243
+ "キュゥ": "kyû"
244
+ "キョ": "kyo"
245
+ "キョゥ": "kyô"
246
+ "コゥ": "kô"
247
+ "シャ": "sya"
248
+ "シュ": "syu"
249
+ "シュゥ": "syû"
250
+ "ショ": "syo"
251
+ "ショゥ": "syô"
252
+ "ソゥ": "sô"
253
+ "チャ": "tya"
254
+ "チュ": "tyu"
255
+ "チュゥ": "tyû"
256
+ "チョ": "tyo"
257
+ "チョゥ": "tyô"
258
+ "トゥ": "tô"
259
+ "ニャ": "nya"
260
+ "ニュ": "nyu"
261
+ "ニュゥ": "nyû"
262
+ "ニョ": "nyo"
263
+ "ニョゥ": "nyô"
264
+ "ノゥ": "nô"
265
+ "ヒャ": "hya"
266
+ "ヒュ": "hyu"
267
+ "ヒュゥ": "hyû"
268
+ "ヒョ": "hyo"
269
+ "ヒョゥ": "hyô"
270
+ "ホゥ": "hô"
271
+ "ミャ": "mya"
272
+ "ミュ": "myu"
273
+ "ミュゥ": "myû"
274
+ "ミョ": "myo"
275
+ "ミョゥ": "myô"
276
+ "モゥ": "mô"
277
+ "ヨゥ": "yô"
278
+ "リャ": "rya"
279
+ "リュ": "ryu"
280
+ "リュゥ": "ryû"
281
+ "リョ": "ryo"
282
+ "リョゥ": "ryô"
283
+ "ロゥ": "rô"
284
+ "ギャ": "gya"
285
+ "ギュ": "gyu"
286
+ "ギュゥ": "gyû"
287
+ "ギョ": "gyo"
288
+ "ギョゥ": "gyô"
289
+ "ゴゥ": "gô"
290
+ "ジャ": "zya"
291
+ "ジュ": "zyu"
292
+ "ジュゥ": "zyû"
293
+ "ジョ": "zyo"
294
+ "ジョゥ": "zyô"
295
+ "ゾゥ": "zô"
296
+ "ドゥ": "dô"
297
+ "ビャ": "bya"
298
+ "ビュ": "byu"
299
+ "ビュゥ": "byû"
300
+ "ビョ": "byo"
301
+ "ビョゥ": "byô"
302
+ "ボゥ": "bô"
303
+ "ピャ": "pya"
304
+ "ピュ": "pyu"
305
+ "ピュゥ": "pyû"
306
+ "ピョ": "pyo"
307
+ "ピョゥ": "pyô"
308
+ "ポゥ": "pô"
@@ -0,0 +1,313 @@
1
+ ---
2
+ authority_id: mext
3
+ id: kunrei
4
+ language: jpn
5
+ source_script: Hrkt
6
+ destination_script: Latn
7
+ name: Romanization of Japanese, Kunrei-siki
8
+ url:
9
+ - http://www.eki.ee/wgrs/rom2_ja.htm
10
+ - https://unstats.un.org/unsd/geoinfo/UNGEGN/docs/9th-uncsgn-docs/econf/9th_UNCSGN_e-conf-98-47-add1.pdf
11
+ creation_date: 2007
12
+ adoption_date: 2007-06-29
13
+ description: |
14
+ The official romanization system for Japanese is the Kunrei-siki.
15
+ It was officially adopted on 9 December, 1954 (Cabinet Notification No. 1, table 1).
16
+
17
+ notes:
18
+ - A small-script tu/tsu form (ッ / っ) is inserted between kana symbols to indicate a double consonant (kk, ss, tt, pp in Kunrei-siki).
19
+ - ン / ん is always romanized as n in Kunrei-siki; when the n must be separated from a following vowel or y, an apostrophe is added after the n.
20
+ - Long vowels are expressed in Kunrei-siki by placing a circumflex (^) over a vowel.
21
+ - The combination おお / オオ (shown in parentheses in the source table) is used to denote the word meaning ‘big, great’.
22
+
23
+ tests:
24
+ - source: かんおう
25
+ expected: kanô #kan'ô
26
+ - source: かのう
27
+ expected: kanô
28
+ - source: きんゆう
29
+ expected: kinyû # kin'yû
30
+ - source: きにゅう
31
+ expected: kinyû
32
+ - source: とうきょう
33
+ expected: tôkyô
34
+
35
+ map:
36
+ characters:
37
+ "あ": "a"
38
+ "い": "i"
39
+ "う": "u"
40
+ "え": "e"
41
+ "お": "o"
42
+ "か": "ka"
43
+ "き": "ki"
44
+ "く": "ku"
45
+ "け": "ke"
46
+ "こ": "ko"
47
+ "さ": "sa"
48
+ "し": "si"
49
+ "す": "su"
50
+ "せ": "se"
51
+ "そ": "so"
52
+ "た": "ta"
53
+ "ち": "ti"
54
+ "つ": "tu" # See note 1
55
+ "て": "te"
56
+ "と": "to"
57
+ "な": "na"
58
+ "に": "ni"
59
+ "ぬ": "nu"
60
+ "ね": "ne"
61
+ "の": "no"
62
+ "は": "ha"
63
+ "ひ": "hi"
64
+ "ふ": "hu"
65
+ "へ": "he"
66
+ "ほ": "ho"
67
+ "ま": "ma"
68
+ "み": "mi"
69
+ "む": "mu"
70
+ "め": "me"
71
+ "も": "mo"
72
+ "や": "ya"
73
+ "ゆ": "yu"
74
+ "よ": "yo"
75
+ "ら": "ra"
76
+ "り": "ri"
77
+ "る": "ru"
78
+ "れ": "re"
79
+ "ろ": "ro"
80
+ "わ": "wa"
81
+ "ん": "n" # See note 2
82
+ "が": "ga"
83
+ "ぎ": "gi"
84
+ "ぐ": "gu"
85
+ "げ": "ge"
86
+ "ご": "go"
87
+ "ざ": "za"
88
+ "じ": "zi"
89
+ "ず": "zu"
90
+ "ぜ": "ze"
91
+ "ぞ": "zo"
92
+ "だ": "da"
93
+ "ぢ": "di"
94
+ "づ": "du"
95
+ "で": "de"
96
+ "ど": "do"
97
+ "ば": "ba"
98
+ "び": "bi"
99
+ "ぶ": "bu"
100
+ "べ": "be"
101
+ "ぼ": "bo"
102
+ "ぱ": "pa"
103
+ "ぴ": "pi"
104
+ "ぷ": "pu"
105
+ "ぺ": "pe"
106
+ "ぽ": "po"
107
+ "おぅ": "ô"
108
+ "おお": "ô" # See note 4
109
+ "きゃ": "kya"
110
+ "きゅ": "kyu"
111
+ "きゅぅ": "kyû"
112
+ "きょ": "kyo"
113
+ "きょぅ": "kyô"
114
+ "こぅ": "kô"
115
+ "しゃ": "sya"
116
+ "しゅ": "syu"
117
+ "しゅぅ": "syû"
118
+ "しょ": "syo"
119
+ "しょぅ": "syô"
120
+ "そぅ": "sô"
121
+ "ちゃ": "tya"
122
+ "ちゅ": "tyu"
123
+ "ちゅぅ": "tyû"
124
+ "ちょ": "tyo"
125
+ "ちょぅ": "tyô"
126
+ "とぅ": "tô"
127
+ "にゃ": "nya"
128
+ "にゅ": "nyu"
129
+ "にゅぅ": "nyû"
130
+ "にょ": "nyo"
131
+ "にょぅ": "nyô"
132
+ "のぅ": "nô"
133
+ "ひゃ": "hya"
134
+ "ひゅ": "hyu"
135
+ "ひゅぅ": "hyû"
136
+ "ひょ": "hyo"
137
+ "ひょぅ": "hyô"
138
+ "ほぅ": "hô"
139
+ "みゃ": "mya"
140
+ "みゅ": "myu"
141
+ "みゅぅ": "myû"
142
+ "みょ": "myo"
143
+ "みょぅ": "myô"
144
+ "もぅ": "mô"
145
+ "よぅ": "yô"
146
+ "りゃ": "rya"
147
+ "りゅ": "ryu"
148
+ "りゅぅ": "ryû"
149
+ "りょ": "ryo"
150
+ "りょぅ": "ryô"
151
+ "ろぅ": "rô"
152
+ "ぎゃ": "gya"
153
+ "ぎゅ": "gyu"
154
+ "ぎゅぅ": "gyû"
155
+ "ぎょ": "gyo"
156
+ "ぎょぅ": "gyô"
157
+ "ごぅ": "gô"
158
+ "じゃ": "zya"
159
+ "じゅ": "zyu"
160
+ "じゅぅ": "zyû"
161
+ "じょ": "zyo"
162
+ "じょぅ": "zyô"
163
+ "ぞぅ": "zô"
164
+ "どぅ": "dô"
165
+ "びゃ": "bya"
166
+ "びゅ": "byu"
167
+ "びゅぅ": "byû"
168
+ "びょ": "byo"
169
+ "びょぅ": "byô"
170
+ "ぼぅ": "bô"
171
+ "ぴゃ": "pya"
172
+ "ぴゅ": "pyu"
173
+ "ぴゅぅ": "pyû"
174
+ "ぴょ": "pyo"
175
+ "ぴょぅ": "pyô"
176
+ "ぽぅ": "pô"
177
+ "ア": "a"
178
+ "イ": "i"
179
+ "ウ": "u"
180
+ "エ": "e"
181
+ "オ": "o"
182
+ "カ": "ka"
183
+ "キ": "ki"
184
+ "ク": "ku"
185
+ "ケ": "ke"
186
+ "コ": "ko"
187
+ "サ": "sa"
188
+ "シ": "si"
189
+ "ス": "su"
190
+ "セ": "se"
191
+ "ソ": "so"
192
+ "タ": "ta"
193
+ "チ": "ti"
194
+ "ツ": "tu" # See note 1
195
+ "テ": "te"
196
+ "ト": "to"
197
+ "ナ": "na"
198
+ "ニ": "ni"
199
+ "ヌ": "nu"
200
+ "ネ": "ne"
201
+ "ノ": "no"
202
+ "ハ": "ha"
203
+ "ヒ": "hi"
204
+ "フ": "hu"
205
+ "ヘ": "he"
206
+ "ホ": "ho"
207
+ "マ": "ma"
208
+ "ミ": "mi"
209
+ "ム": "mu"
210
+ "メ": "me"
211
+ "モ": "mo"
212
+ "ラ": "ra"
213
+ "リ": "ri"
214
+ "ル": "ru"
215
+ "レ": "re"
216
+ "ロ": "ro"
217
+ "ワ": "wa"
218
+ "ン": "n" # See note 2
219
+ "ガ": "ga"
220
+ "ギ": "gi"
221
+ "グ": "gu"
222
+ "ゲ": "ge"
223
+ "ゴ": "go"
224
+ "ザ": "za"
225
+ "ジ": "zi"
226
+ "ズ": "zu"
227
+ "ゼ": "ze"
228
+ "ゾ": "zo"
229
+ "ダ": "da"
230
+ "ヂ": "di"
231
+ "ヅ": "du"
232
+ "デ": "de"
233
+ "ド": "do"
234
+ "バ": "ba"
235
+ "ビ": "bi"
236
+ "ブ": "bu"
237
+ "ベ": "be"
238
+ "ボ": "bo"
239
+ "パ": "pa"
240
+ "ピ": "pi"
241
+ "プ": "pu"
242
+ "ペ": "pe"
243
+ "ポ": "po"
244
+ "オゥ": "ô"
245
+ "オオ": "ô" # See note 4
246
+ "キャ": "kya"
247
+ "キュ": "kyu"
248
+ "キュゥ": "kyû"
249
+ "キョ": "kyo"
250
+ "キョゥ": "kyô"
251
+ "コゥ": "kô"
252
+ "シャ": "sya"
253
+ "シュ": "syu"
254
+ "シュゥ": "syû"
255
+ "ショ": "syo"
256
+ "ショゥ": "syô"
257
+ "ソゥ": "sô"
258
+ "チャ": "tya"
259
+ "チュ": "tyu"
260
+ "チュゥ": "tyû"
261
+ "チョ": "tyo"
262
+ "チョゥ": "tyô"
263
+ "トゥ": "tô"
264
+ "ニャ": "nya"
265
+ "ニュ": "nyu"
266
+ "ニュゥ": "nyû"
267
+ "ニョ": "nyo"
268
+ "ニョゥ": "nyô"
269
+ "ノゥ": "nô"
270
+ "ヒャ": "hya"
271
+ "ヒュ": "hyu"
272
+ "ヒュゥ": "hyû"
273
+ "ヒョ": "hyo"
274
+ "ヒョゥ": "hyô"
275
+ "ホゥ": "hô"
276
+ "ミャ": "mya"
277
+ "ミュ": "myu"
278
+ "ミュゥ": "myû"
279
+ "ミョ": "myo"
280
+ "ミョゥ": "myô"
281
+ "モゥ": "mô"
282
+ "ヨゥ": "yô"
283
+ "リャ": "rya"
284
+ "リュ": "ryu"
285
+ "リュゥ": "ryû"
286
+ "リョ": "ryo"
287
+ "リョゥ": "ryô"
288
+ "ロゥ": "rô"
289
+ "ギャ": "gya"
290
+ "ギュ": "gyu"
291
+ "ギュゥ": "gyû"
292
+ "ギョ": "gyo"
293
+ "ギョゥ": "gyô"
294
+ "ゴゥ": "gô"
295
+ "ジャ": "zya"
296
+ "ジュ": "zyu"
297
+ "ジュゥ": "zyû"
298
+ "ジョ": "zyo"
299
+ "ジョゥ": "zyô"
300
+ "ゾゥ": "zô"
301
+ "ドゥ": "dô"
302
+ "ビャ": "bya"
303
+ "ビュ": "byu"
304
+ "ビュゥ": "byû"
305
+ "ビョ": "byo"
306
+ "ビョゥ": "byô"
307
+ "ボゥ": "bô"
308
+ "ピャ": "pya"
309
+ "ピュ": "pyu"
310
+ "ピュゥ": "pyû"
311
+ "ピョ": "pyo"
312
+ "ピョゥ": "pyô"
313
+ "ポゥ": "pô"