interscript 0.1.1 → 0.1.2

Sign up to get free protection for your applications and to get access to all the features.
@@ -0,0 +1,273 @@
1
+ ---
2
+ authority_id: iso
3
+ id: iso9
4
+ language: rus
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: ISO 9
8
+ url: https://www.iso.org/standard/3589.html
9
+ creation_date: 1995
10
+ description: |
11
+ Establishes a system for the transliteration into Latin characters of
12
+ Cyrillic characters constituting the alphabets of Slavic and non-Slavic
13
+ languages. Table 3 includes in a single sequence, listed in the
14
+ Cyrillic alphabetic order, the 118 single or diacritic-carrying
15
+ characters that appear in one or another of the considered alphabets.
16
+ tests:
17
+ - source:
18
+ expected:
19
+
20
+ map:
21
+ characters:
22
+ "\u0410": "A" # А => A
23
+ "\u04d2": "\u00c4" # Ӓ => Ä (a diaeresis)
24
+ "\u04d2\u0304": "\u1ea0\u0308" # Ӓ̄ => Ạ̈ (a diaeresis and dot below)
25
+ "\u04d0": "\u0102" # Ӑ => Ă (a breve)
26
+ "\u0410\u0304": "\u0100" # А̄ => Ā (a macron)
27
+ "\u04d4": "\u00c6" # Ӕ => Æ (ae ligature)
28
+ "\u0410\u0301": "\u00c1" # А́ => Á (a acute)
29
+ "\u0410\u030a": "\u00c5" # А̊ => Å (a ring)
30
+ "\u0411": "B" # Б => B
31
+ "\u0412": "V" # В => V
32
+ "\u0413": "G" # Г => G
33
+ "\u0403": "\u01f4" # Ѓ => Ǵ (g acute)
34
+ "\u0492": "\u0120" # Ғ => Ġ (g dot)
35
+ "\u0494": "\u011e" # Ҕ => Ğ (g breve)
36
+ "\u04ba": "\u1e24" # Һ => Ḥ (h dot)
37
+ "\u0414": "D" # Д => D
38
+ "\u0402": "\u0110" # Ђ => Đ (d stroke)
39
+ "\u0415": "E" # Е => E
40
+ "\u04d6": "\u0114" # Ӗ => Ĕ (e breve)
41
+ "\u0401": "\u00cb" # Ё => Ë (e diaeresis)
42
+ "\u0404": "\u00ca" # Є => Ê (e circumflex)
43
+ "\u0416": "\u017d" # Ж => Ž (z caron)
44
+ "\u0496": "\u017d\u0327" # Җ => Ž̧ (z caron and cedilla[4])
45
+ "\u04dc": "\u005a\u0304" # Ӝ => Z̄ (z macron)
46
+ "\u04c1": "\u005a\u0306" # Ӂ => Z̆ (z breve)
47
+ "\u0417": "\u005a" # З => Z
48
+ "\u04de": "\u005a\u0308" # Ӟ => Z̈ (z diaeresis)
49
+ "\u04e0": "\u0179" # Ӡ => Ź (z acute)
50
+ "\u0405": "\u1e90" # Ѕ => Ẑ (z circumflex)
51
+ "\u0418": "I" # И => I
52
+ "\u04e2": "\u012a" # Ӣ => Ī (i macron)
53
+ "\u0418\u0301": "\u00cd" # И́ => Í (i acute)
54
+ "\u04e4": "\u00ce" # Ӥ => Î (i circumflex)
55
+ "\u0419": "\u004a" # Й => J
56
+ "\u0406": "\u00cc" # І => Ì (i grave)
57
+ "\u0407": "\u00cf" # Ї => Ï (i diaeresis)
58
+ "\u0406\u0304": "\u01cf" # І̄ => Ǐ (i caron (or breve))
59
+ "\u0408": "\u004a\u030c" # Ј => J̌ (j caron)
60
+ "\u0408\u0335": "\u004a\u0301" # Ј̵ => J́ (j acute)
61
+ "\u041a": "K" # К => K
62
+ "\u040c": "\u1e30" # Ќ => Ḱ (k acute)
63
+ "\u04c3": "\u1e32" # Ӄ => Ḳ (k dot below)
64
+ "\u049c": "\u004b\u0302" # Ҝ => K̂ (k circumflex)
65
+ "\u04a0": "\u01e8" # Ҡ => Ǩ (k caron)
66
+ "\u049e": "\u004b\u0304" # Ҟ => K̄ (k macron)
67
+ "\u049a": "\u0136" # Қ => Ķ (k cedilla[4])
68
+ "\u041a\u0328": "\u004b\u0300" # К̨ => K̀ (k grave)
69
+ "\u051a": "Q" # Ԛ => Q
70
+ "\u041b": "L" # Л => L
71
+ "\u0409": "\u004c\u0302" # Љ => L̂ (l circumflex)
72
+ "\u0520": "\u013b" # Ԡ => Ļ (l cedilla[4])
73
+ "\u041c": "M" # М => M
74
+ "\u041d": "N" # Н => N
75
+ "\u040a": "\u004e\u0302" # Њ => N̂ (n circumflex)
76
+ "\u04a2": "\u0145" # Ң => Ņ (n cedilla[4])
77
+ "\u04c9": "\u1e46" # Ӊ => Ṇ (n dot below)
78
+ "\u04a4": "\u1e44" # Ҥ => Ṅ (n dot)
79
+ "\u050a": "\u01f8" # Ԋ => Ǹ (n grave)
80
+ "\u0522": "\u0143" # Ԣ => Ń (n acute)
81
+ "\u04c7": "\u0147" # Ӈ => Ň (n caron)
82
+ "\u041d\u0304": "\u004e\u0304" # Н̄ => N̄ (n macron)
83
+ "\u041e": "O" # О => O
84
+ "\u04e6": "\u00d6" # Ӧ => Ö (o diaeresis)
85
+ "\u04e8": "\u00d4" # Ө => Ô (o circumflex)
86
+ "\u04ea": "\u0150" # Ӫ => Ő (o double acute)
87
+ "\u04e6\u0304": "\u1ecc\u0308" # Ӧ̄ => Ọ̈ (o diaeresis and dot below)
88
+ "\u04a8": "\u00d2" # Ҩ => Ò (o grave)
89
+ "\u041e\u0301": "\u00d3" # О́ => Ó (o acute)
90
+ "\u041e\u0304": "\u014c" # О̄ => Ō (o macron)
91
+ "\u0152": "\u0152" # Œ => Œ (oe ligature)
92
+ "\u041f": "P" # П => P
93
+ "\u04a6": "\u1e54" # Ҧ => Ṕ (p acute)
94
+ "\u0524": "\u0050\u0300" # Ԥ => P̀ (p grave)
95
+ "\u0420": "R" # Р => R
96
+ "\u0421": "S" # С => S
97
+ "\u04aa": "\u015e" # Ҫ => Ş (s cedilla[4])
98
+ "\u0421\u0300": "\u0053\u0300" # С̀ => S̀ (s grave)
99
+ "\u0422": "T" # Т => T
100
+ "\u040b": "\u0106" # Ћ => Ć (c acute)
101
+ "\u050e": "\u0054\u0300" # Ԏ => T̀ (t grave)
102
+ "\u0422\u030c": "\u0164" # Т̌ => Ť (t caron)
103
+ "\u04ac": "\u0162" # Ҭ => Ţ (t cedilla[4])
104
+ "\u0423": "U" # У => U
105
+ "\u04f0": "\u00dc" # Ӱ => Ü (u diaeresis)
106
+ "\u04ee": "\u016a" # Ӯ => Ū (u macron)
107
+ "\u040e": "\u016c" # Ў => Ŭ (u breve)
108
+ "\u04f2": "\u0170" # Ӳ => Ű (u double acute)
109
+ "\u0423\u0301": "\u00da" # У́ => Ú (u acute)
110
+ "\u04f0\u0304": "\u1ee4\u0308" # Ӱ̄ => Ụ̈ (u diaeresis and dot below)
111
+ "\u04ae": "\u00d9" # Ү => Ù (u grave)
112
+ "\u04b0": "\u0055\u0307" # Ұ => U̇ (u dot)
113
+ "\u051c": "W" # Ԝ => W
114
+ "\u0424": "F" # Ф => F
115
+ "\u0425": "H" # Х => H
116
+ "\u04b2": "\u1e28" # Ҳ => Ḩ (h cedilla[4])
117
+ "\u0426": "C" # Ц => C
118
+ "\u04b4": "\u0043\u0304" # Ҵ => C̄ (c macron)
119
+ "\u040f": "\u0044\u0302" # Џ => D̂ (d circumflex)
120
+ "\u0427": "\u010c" # Ч => Č (c caron)
121
+ "\u04b6": "\u00c7" # Ҷ => Ç (c cedilla[4])
122
+ "\u04cb": "\u0043\u0323" # Ӌ => C̣ (c dot below)
123
+ "\u04f4": "\u0043\u0308" # Ӵ => C̈ (c diaeresis)
124
+ "\u04b8": "\u0108" # Ҹ => Ĉ (c circumflex)
125
+ "\u0427\u0300": "\u0043\u0300" # Ч̀ => C̀ (c grave)
126
+ "\u04bc": "\u0043\u0306" # Ҽ => C̆ (c breve)
127
+ "\u04be": "\u0043\u0328\u0306" # Ҿ => C̨̆ (c ogonek[4] and breve)
128
+ "\u0428": "\u0160" # Ш => Š (s caron)
129
+ "\u0429": "\u015c" # Щ => Ŝ (s circumflex)
130
+ "\u042a": "\u02ba" # Ъ => ʺ (modifier letter double prime[5])
131
+ "\u042b": "Y" # Ы => Y
132
+ "\u04f8": "\u0178" # Ӹ => Ÿ (y diaeresis)
133
+ "\u042b\u0304": "\u0232" # Ы̄ => Ȳ (y macron)
134
+ "\u042c": "\u02b9" # Ь => ʹ (modifier letter prime[5])
135
+ "\u042d": "\u00c8" # Э => È (e grave)
136
+ "\u04d8": "\u0041\u030b" # Ә => A̋ (a double acute)
137
+ "\u04da": "\u00c0" # Ӛ => À (a grave)
138
+ "\u042e": "\u00db" # Ю => Û (u circumflex)
139
+ "\u042e\u0304": "\u00db\u0304" # Ю̄ => Û̄ (u circumflex with macron)
140
+ "\u042f": "\u00c2" # Я => Â (a circumflex)
141
+ "\u0490": "\u0047\u0300" # Ґ => G̀ (g grave)
142
+ "\u0462": "\u011a" # Ѣ => Ě (e caron)
143
+ "\u046a": "\u01cd" # Ѫ => Ǎ (a caron)
144
+ "\u0472": "\u0046\u0300" # Ѳ => F̀ (f grave)
145
+ "\u0474": "\u1ef2" # Ѵ => Ỳ (y grave)
146
+ "\u0430": "a" # а => a
147
+ "\u04d3": "\u00e4" # ӓ => ä
148
+ "\u04d3\u0304": "\u1ea1\u0308" # ӓ̄ => ạ̈
149
+ "\u04d1": "\u0103" # ӑ => ă
150
+ "\u0430\u0304": "\u0101" # а̄ => ā
151
+ "\u04d5": "\u00e6" # ӕ => æ
152
+ "\u0430\u0301": "\u00e1" # а́ => á
153
+ "\u0430\u030a": "\u00e5" # а̊ => å
154
+ "\u0431": "b" # б => b
155
+ "\u0432": "v" # в => v
156
+ "\u0433": "g" # г => g
157
+ "\u0453": "\u01f5" # ѓ => ǵ
158
+ "\u0493": "\u0121" # ғ => ġ
159
+ "\u0495": "\u011f" # ҕ => ğ
160
+ "\u04bb": "\u1e25" # һ => ḥ
161
+ "\u0434": "d" # д => d
162
+ "\u0452": "\u0111" # ђ => đ
163
+ "\u0435": "e" # е => e
164
+ "\u04d7": "\u0115" # ӗ => ĕ
165
+ "\u0451": "\u00eb" # ё => ë
166
+ "\u0454": "\u00ea" # є => ê
167
+ "\u0436": "\u017e" # ж => ž
168
+ "\u0497": "\u017e\u0327" # җ => ž̧
169
+ "\u04dd": "\u007a\u0304" # ӝ => z̄
170
+ "\u04c2": "\u007a\u0306" # ӂ => z̆
171
+ "\u0437": "z" # з => z
172
+ "\u04df": "\u007a\u0308" # ӟ => z̈
173
+ "\u04e1": "\u017a" # ӡ => ź
174
+ "\u0455": "\u1e91" # ѕ => ẑ
175
+ "\u0438": "i" # и => i
176
+ "\u04e3": "\u012b" # ӣ => ī
177
+ "\u0438\u0301": "\u00ed" # и́ => í
178
+ "\u04e5": "\u00ee" # ӥ => î
179
+ "\u0439": "j" # й => j
180
+ "\u0456": "\u00ec" # і => ì
181
+ "\u0457": "\u00ef" # ї => ï
182
+ "\u0456\u0304": "\u01d0" # і̄ => ǐ
183
+ "\u0458": "\u01f0" # ј => ǰ
184
+ "\u0458\u0335": "\u006a\u0301" # ј̵ => j́
185
+ "\u043a": "k" # к => k
186
+ "\u045c": "\u1e31" # ќ => ḱ
187
+ "\u04c4": "\u1e33" # ӄ => ḳ
188
+ "\u049d": "\u006b\u0302" # ҝ => k̂
189
+ "\u04a1": "\u01e9" # ҡ => ǩ
190
+ "\u049f": "\u006b\u0304" # ҟ => k̄
191
+ "\u049b": "\u0137" # қ => ķ
192
+ "\u043a\u0328": "\u006b\u0300" # к̨ => k̀
193
+ "\u051b": "q" # ԛ => q
194
+ "\u043b": "l" # л => l
195
+ "\u0459": "\u006c\u0302" # љ => l̂
196
+ "\u0521": "\u013c" # ԡ => ļ
197
+ "\u043c": "m" # м => m
198
+ "\u043d": "n" # н => n
199
+ "\u045a": "\u006e\u0302" # њ => n̂
200
+ "\u04a3": "\u0146" # ң => ņ
201
+ "\u04ca": "\u1e47" # ӊ => ṇ
202
+ "\u04a5": "\u1e45" # ҥ => ṅ
203
+ "\u050b": "\u01f9" # ԋ => ǹ
204
+ "\u0523": "\u0144" # ԣ => ń
205
+ "\u04c8": "\u0148" # ӈ => ň
206
+ "\u043d\u0304": "\u006e\u0304" # н̄ => n̄
207
+ "\u043e": "o" # о => o
208
+ "\u04e7": "\u00f6" # ӧ => ö
209
+ "\u04e9": "\u00f4" # ө => ô
210
+ "\u04eb": "\u0151" # ӫ => ő
211
+ "\u043e\u0304\u0308": "\u1ecd\u0308" # о̄̈ => ọ̈
212
+ "\u04a9": "\u00f2" # ҩ => ò
213
+ "\u043e\u0301": "\u00f3" # о́ => ó
214
+ "\u043e\u0304": "\u014d" # о̄ => ō
215
+ "\u0153": "\u0153" # œ => œ
216
+ "\u043f": "p" # п => p
217
+ "\u04a7": "\u1e55" # ҧ => ṕ
218
+ "\u0525": "\u0070\u0300" # ԥ => p̀
219
+ "\u0440": "r" # р => r
220
+ "\u0441": "s" # с => s
221
+ "\u04ab": "\u015f" # ҫ => ş
222
+ "\u0441\u0300": "\u0073\u0300" # с̀ => s̀
223
+ "\u0442": "t" # т => t
224
+ "\u045b": "\u0107" # ћ => ć
225
+ "\u050f": "\u0074\u0300" # ԏ => t̀
226
+ "\u0442\u030c": "\u0165" # т̌ => ť
227
+ "\u04ad": "\u0163" # ҭ => ţ
228
+ "\u0443": "u" # у => u
229
+ "\u04f1": "\u00fc" # ӱ => ü
230
+ "\u04ef": "\u016b" # ӯ => ū
231
+ "\u045e": "\u016d" # ў => ŭ
232
+ "\u04f3": "\u0171" # ӳ => ű
233
+ "\u0443\u0301": "\u00fa" # у́ => ú
234
+ "\u04f1\u0304": "\u1ee5\u0308" # ӱ̄ => ụ̈
235
+ "\u04af": "\u00f9" # ү => ù
236
+ "\u04b1": "\u0075\u0307" # ұ => u̇
237
+ "\u051d": "w" # ԝ => w
238
+ "\u0444": "f" # ф => f
239
+ "\u0445": "h" # х => h
240
+ "\u04b3": "\u1e29" # ҳ => ḩ
241
+ "\u0446": "c" # ц => c
242
+ "\u04b5": "\u0063\u0304" # ҵ => c̄
243
+ "\u045f": "\u0064\u0302" # џ => d̂
244
+ "\u0447": "\u010d" # ч => č
245
+ "\u04b7": "\u00e7" # ҷ => ç
246
+ "\u04cc": "\u0063\u0323" # ӌ => c̣
247
+ "\u04f5": "\u0063\u0308" # ӵ => c̈
248
+ "\u04b9": "\u0109" # ҹ => ĉ
249
+ "\u0447\u0300": "\u0063\u0300" # ч̀ => c̀
250
+ "\u04bd": "\u0063\u0306" # ҽ => c̆
251
+ "\u04bf": "\u0063\u0328\u0306" # ҿ => c̨̆
252
+ "\u0448": "\u0161" # ш => š
253
+ "\u0449": "\u015d" # щ => ŝ
254
+ "\u044a": "\u02ba" # ъ => ʺ
255
+ "\u044b": "y" # ы => y
256
+ "\u04f9": "\u00ff" # ӹ => ÿ
257
+ "\u044b\u0304": "\u0233" # ы̄ => ȳ
258
+ "\u044c": "\u02b9" # ь => ʹ
259
+ "\u044d": "\u00e8" # э => è
260
+ "\u04d9": "\u0061\u030b" # ә => a̋
261
+ "\u04db": "\u00e0" # ӛ => à
262
+ "\u044e": "\u00fb" # ю => û
263
+ "\u044e\u0304": "\u00fb\u0304" # ю̄ => û̄
264
+ "\u044f": "\u00e2" # я => â
265
+ "\u0491": "\u0067\u0300" # ґ => g̀
266
+ "\u0463": "\u011b" # ѣ => ě
267
+ "\u046b": "\u01ce" # ѫ => ǎ
268
+ "\u0473": "\u0066\u0300" # ѳ => f̀
269
+ "\u0475": "\u1ef3" # ѵ => ỳ
270
+ "\u04c0": "\u2021" # Ӏ => ‡
271
+ "\u02bc": "\u0060" # ʼ => `
272
+ "\u02ee": "\u00a8" # ˮ => ¨
273
+
@@ -0,0 +1,330 @@
1
+ ---
2
+ authority_id: mext
3
+ id: hepburn
4
+ language: jpn
5
+ source_script: Hrkt
6
+ destination_script: Latn
7
+ name: Romanization of Japanese, Modified Hepburn System
8
+ url: http://www.eki.ee/wgrs/rom2_ja.htm
9
+ creation_date: 1954
10
+ adoption_date: 1954-12-09
11
+ description: |
12
+ Widely used Romanization system in customs, e.g. in passports. In
13
+ international cartographic products the Modified Hepburn System remains
14
+ the most used system.
15
+
16
+ notes:
17
+ - A small-script tu/tsu form (ッ / っ) is inserted between kana symbols to indicate a double consonant (kk, ss, ssh, tt, tts, tch, pp in Hepburn).
18
+ - ン / ん is romanized in modified Hepburn as n’ before y or a vowel letter and as n in all other cases; earlier, m was also used before b, p, or m.
19
+ - Long vowels are expressed in Hepburn by placing a macron (¯) over a vowel.
20
+ - The romanization in parentheses (in modified Hepburn) is used only in those cases where the kana symbol is known to be pronounced in the manner indicated.
21
+ - The combination in parentheses is used to denote the word meaning ‘big, great’.
22
+
23
+ tests:
24
+ - source: おばあさん
25
+ expected: obāsan
26
+ - source: おにいさん
27
+ expected: oniisan
28
+ - source: みずうみ
29
+ expected: mizuumi
30
+ - source: とおまわり
31
+ expected: tōmawari
32
+ - source: べんきょう
33
+ expected: benkyō
34
+ - source: じゃあく
35
+ expected: jaaku
36
+ - source: バレーボール
37
+ expected: barēbōru
38
+ - source: スーパーマン
39
+ expected: sūpāman
40
+
41
+ map:
42
+ characters:
43
+ "あ": "a"
44
+ "い": "i"
45
+ "う": "u"
46
+ "え": "e"
47
+ "お": "o"
48
+ "か": "ka"
49
+ "き": "ki"
50
+ "く": "ku"
51
+ "け":
52
+ - "ke"
53
+ - "ga" # See note 4
54
+ "こ": "ko"
55
+ "さ": "sa"
56
+ "し": "shi"
57
+ "す": "su"
58
+ "せ": "se"
59
+ "そ": "so"
60
+ "た": "ta"
61
+ "ち": "chi"
62
+ "つ": "tsu" # See note 1
63
+ "て": "te"
64
+ "と": "to"
65
+ "な": "na"
66
+ "に": "ni"
67
+ "ぬ": "nu"
68
+ "ね": "ne"
69
+ "の": "no"
70
+ "は":
71
+ - "ha"
72
+ - "wa" # See note 4
73
+ "ひ": "hi"
74
+ "ふ": "fu"
75
+ "へ":
76
+ - "he"
77
+ - "e" # See note 4
78
+ "ほ": "ho"
79
+ "ま": "ma"
80
+ "み": "mi"
81
+ "む": "mu"
82
+ "め": "me"
83
+ "も": "mo"
84
+ "ら": "ra"
85
+ "り": "ri"
86
+ "る": "ru"
87
+ "れ": "re"
88
+ "ろ": "ro"
89
+ "わ": "wa"
90
+ "ん": "n" # See note 2
91
+ "が": "ga"
92
+ "ぎ": "gi"
93
+ "ぐ": "gu"
94
+ "げ": "ge"
95
+ "ご": "go"
96
+ "ざ": "za"
97
+ "じ": "ji"
98
+ "ず": "zu"
99
+ "ぜ": "ze"
100
+ "ぞ": "zo"
101
+ "だ": "da"
102
+ "ぢ": "ji"
103
+ "づ": "zu"
104
+ "で": "de"
105
+ "ど": "do"
106
+ "ば": "ba"
107
+ "び": "bi"
108
+ "ぶ": "bu"
109
+ "べ": "be"
110
+ "ぼ": "bo"
111
+ "ぱ": "pa"
112
+ "ぴ": "pi"
113
+ "ぷ": "pu"
114
+ "ぺ": "pe"
115
+ "ぽ": "po"
116
+ "おぅ": "ō"
117
+ "おお": "ō" # See note 4
118
+ "きゃ": "kya"
119
+ "きゅ": "kyu"
120
+ "きゅぅ": "kyū"
121
+ "きょ": "kyo"
122
+ "きょぅ": "kyō"
123
+ "こぅ": "kō"
124
+ "しゃ": "sha"
125
+ "しゅ": "shu"
126
+ "しゅぅ": "shū"
127
+ "しょ": "sho"
128
+ "しょぅ": "shō"
129
+ "そぅ": "sō"
130
+ "ちゃ": "cha"
131
+ "ちゅ": "chu"
132
+ "ちゅぅ": "chū"
133
+ "ちょ": "cho"
134
+ "ちょぅ": "chō"
135
+ "とぅ": "tō"
136
+ "にゃ": "nya"
137
+ "にゅ": "nyu"
138
+ "にゅぅ": "nyū"
139
+ "にょ": "nyo"
140
+ "にょぅ": "nyō"
141
+ "のぅ": "nō"
142
+ "ひゃ": "hya"
143
+ "ひゅ": "hyu"
144
+ "ひゅぅ": "hyū"
145
+ "ひょ": "hyo"
146
+ "ひょぅ": "hyō"
147
+ "ほぅ":
148
+ - "hō"
149
+ - "ō" # See note 4
150
+ "みゃ": "mya"
151
+ "みゅ": "myu"
152
+ "みゅぅ": "myū"
153
+ "みょ": "myo"
154
+ "みょぅ": "myō"
155
+ "もぅ": "mō"
156
+ "よぅ": "yō"
157
+ "りゃ": "rya"
158
+ "りゅ": "ryu"
159
+ "りゅぅ": "ryū"
160
+ "りょ": "ryo"
161
+ "りょぅ": "ryō"
162
+ "ろぅ": "rō"
163
+ "ぎゃ": "gya"
164
+ "ぎゅ": "gyu"
165
+ "ぎゅぅ": "gyū"
166
+ "ぎょ": "gyo"
167
+ "ぎょぅ": "gyō"
168
+ "ごぅ": "gō"
169
+ "じゃ": "ja"
170
+ "じゅ": "ju"
171
+ "じゅぅ": "jū"
172
+ "じょ": "jo"
173
+ "じょぅ": "jō"
174
+ "ぞぅ": "zō"
175
+ "どぅ": "dō"
176
+ "びゃ": "bya"
177
+ "びゅ": "byu"
178
+ "びゅぅ": "byū"
179
+ "びょ": "byo"
180
+ "びょぅ": "byō"
181
+ "ぼぅ": "bō"
182
+ "ぴゃ": "pya"
183
+ "ぴゅ": "pyu"
184
+ "ぴゅぅ": "pyū"
185
+ "ぴょ": "pyo"
186
+ "ぴょぅ": "pyō"
187
+ "ぽぅ": "pō"
188
+ "ア": "a"
189
+ "イ": "i"
190
+ "ウ": "u"
191
+ "エ": "e"
192
+ "オ": "o"
193
+ "カ": "ka"
194
+ "キ": "ki"
195
+ "ク": "ku"
196
+ "ケ": "ke"
197
+ "コ": "ko"
198
+ "サ": "sa"
199
+ "シ": "shi"
200
+ "ス": "su"
201
+ "セ": "se"
202
+ "ソ": "so"
203
+ "タ": "ta"
204
+ "チ": "chi"
205
+ "ツ": "tsu" # See note 1
206
+ "テ": "te"
207
+ "ト": "to"
208
+ "ナ": "na"
209
+ "ニ": "ni"
210
+ "ヌ": "nu"
211
+ "ネ": "ne"
212
+ "ノ": "no"
213
+ "ハ":
214
+ - "ha"
215
+ - "wa" # See note 4
216
+ "ヒ": "hi"
217
+ "フ": "fu"
218
+ "ヘ":
219
+ - "he"
220
+ - "e" # See note 4
221
+ "ホ": "ho"
222
+ "マ": "ma"
223
+ "ミ": "mi"
224
+ "ム": "mu"
225
+ "メ": "me"
226
+ "モ": "mo"
227
+ "ラ": "ra"
228
+ "リ": "ri"
229
+ "ル": "ru"
230
+ "レ": "re"
231
+ "ロ": "ro"
232
+ "ワ": "wa"
233
+ "ン": "n" # See note 2
234
+ "ガ": "ga"
235
+ "ギ": "gi"
236
+ "グ": "gu"
237
+ "ゲ": "ge"
238
+ "ゴ": "go"
239
+ "ザ": "za"
240
+ "ジ": "ji"
241
+ "ズ": "zu"
242
+ "ゼ": "ze"
243
+ "ゾ": "zo"
244
+ "ダ": "da"
245
+ "ヂ": "ji"
246
+ "ヅ": "zu"
247
+ "デ": "de"
248
+ "ド": "do"
249
+ "バ": "ba"
250
+ "ビ": "bi"
251
+ "ブ": "bu"
252
+ "ベ": "be"
253
+ "ボ": "bo"
254
+ "パ": "pa"
255
+ "ピ": "pi"
256
+ "プ": "pu"
257
+ "ペ": "pe"
258
+ "ポ": "po"
259
+ "オゥ": "ō"
260
+ "オオ": "ō" # See note 4
261
+ "キャ": "kya"
262
+ "キュ": "kyu"
263
+ "キュゥ": "kyū"
264
+ "キョ": "kyo"
265
+ "キョゥ": "kyō"
266
+ "コゥ": "kō"
267
+ "シャ": "sha"
268
+ "シュ": "shu"
269
+ "シュゥ": "shū"
270
+ "ショ": "sho"
271
+ "ショゥ": "shō"
272
+ "ソゥ": "sō"
273
+ "チャ": "cha"
274
+ "チュ": "chu"
275
+ "チュゥ": "chū"
276
+ "チョ": "cho"
277
+ "チョゥ": "chō"
278
+ "トゥ": "tō"
279
+ "ニャ": "nya"
280
+ "ニュ": "nyu"
281
+ "ニュゥ": "nyū"
282
+ "ニョ": "nyo"
283
+ "ニョゥ": "nyō"
284
+ "ノゥ": "nō"
285
+ "ヒャ": "hya"
286
+ "ヒュ": "hyu"
287
+ "ヒュゥ": "hyū"
288
+ "ヒョ": "hyo"
289
+ "ヒョゥ": "hyō"
290
+ "ホゥ":
291
+ - "hō"
292
+ - "ō" # See note 4
293
+ "ミャ": "mya"
294
+ "ミュ": "myu"
295
+ "ミュゥ": "myū"
296
+ "ミョ": "myo"
297
+ "ミョゥ": "myō"
298
+ "モゥ": "mō"
299
+ "ヨゥ": "yō"
300
+ "リャ": "rya"
301
+ "リュ": "ryu"
302
+ "リュゥ": "ryū"
303
+ "リョ": "ryo"
304
+ "リョゥ": "ryō"
305
+ "ロゥ": "rō"
306
+ "ギャ": "gya"
307
+ "ギュ": "gyu"
308
+ "ギュゥ": "gyū"
309
+ "ギョ": "gyo"
310
+ "ギョゥ": "gyō"
311
+ "ゴゥ": "gō"
312
+ "ジャ": "ja"
313
+ "ジュ": "ju"
314
+ "ジュゥ": "jū"
315
+ "ジョ": "jo"
316
+ "ジョゥ": "jō"
317
+ "ゾゥ": "zō"
318
+ "ドゥ": "dō"
319
+ "ビャ": "bya"
320
+ "ビュ": "byu"
321
+ "ビュゥ": "byū"
322
+ "ビョ": "byo"
323
+ "ビョゥ": "byō"
324
+ "ボゥ": "bō"
325
+ "ピャ": "pya"
326
+ "ピュ": "pyu"
327
+ "ピュゥ": "pyū"
328
+ "ピョ": "pyo"
329
+ "ピョゥ": "pyō"
330
+ "ポゥ": "pō"