interscript 0.1.2 → 0.1.3

Sign up to get free protection for your applications and to get access to all the features.
Files changed (120) hide show
  1. checksums.yaml +4 -4
  2. data/README.adoc +246 -14
  3. data/bin/interscript +38 -17
  4. data/bin/setup +8 -0
  5. data/lib/g2pwrapper.py +34 -0
  6. data/lib/interscript.rb +140 -16
  7. data/lib/interscript/command.rb +27 -0
  8. data/lib/interscript/mapping.rb +125 -0
  9. data/lib/interscript/version.rb +1 -1
  10. data/lib/model-7 +0 -0
  11. data/lib/tha-pt-b-7 +0 -0
  12. data/maps/acadsin-zho-Hani-Latn-2002.yaml +38912 -0
  13. data/maps/alalc-bel-cyrl-latn-1997.yaml +125 -0
  14. data/maps/alalc-ben-Beng-Latn-2017.yaml +130 -0
  15. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +94 -0
  16. data/maps/alalc-ell-Grek-Latn-1997.yaml +625 -0
  17. data/maps/alalc-ell-Grek-Latn-2010.yaml +628 -0
  18. data/maps/alalc-kat-Geok-Latn-1997.yaml +112 -0
  19. data/maps/alalc-kat-Geor-Latn-1997.yaml +146 -0
  20. data/maps/alalc-kor-Hang-Latn-1997.yaml +94 -0
  21. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +103 -0
  22. data/maps/alalc-mkd-cyrl-latn-1997.yaml +114 -0
  23. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +114 -0
  24. data/maps/alalc-srp-cyrl-latn-2013.yaml +135 -0
  25. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +141 -0
  26. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +16 -0
  27. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +283 -0
  28. data/maps/{bas-rus-Cyrl-Latn-bss.yaml → bas-rus-Cyrl-Latn-2017-bss.yaml} +57 -31
  29. data/maps/{bas-rus-Cyrl-Latn-oss.yaml → bas-rus-Cyrl-Latn-2017-oss.yaml} +54 -34
  30. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +294 -0
  31. data/maps/bgn-kor-Hang-Latn-1943.yaml +31 -0
  32. data/maps/bgn-kor-Kore-Latn-1943.yaml +31 -0
  33. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +208 -0
  34. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +208 -0
  35. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +1 -2
  36. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +104 -0
  37. data/maps/bgnpcgn-bel-cyrl-latn-1979.yaml +285 -0
  38. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +115 -0
  39. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +10 -64
  40. data/maps/bgnpcgn-chn-Hans-Latn-1979.yaml +7456 -0
  41. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +702 -0
  42. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +20 -0
  43. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +257 -0
  44. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +127 -0
  45. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +43 -0
  46. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +253 -0
  47. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +48 -0
  48. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +48 -0
  49. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +159 -0
  50. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +190 -0
  51. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +145 -64
  52. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +166 -0
  53. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +75 -2
  54. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +208 -0
  55. data/maps/by-bel-Cyrl-Latn-1998.yaml +168 -0
  56. data/maps/by-bel-Cyrl-Latn-2007.yaml +115 -0
  57. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +685 -0
  58. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +681 -0
  59. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +20 -0
  60. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +32 -0
  61. data/maps/ggg-kat-Geor-Latn-2002.yaml +89 -0
  62. data/maps/gki-bel-cyrl-latn-1992.yaml +33 -0
  63. data/maps/gki-bel-cyrl-latn-2000.yaml +201 -0
  64. data/maps/gost-rus-cyrl-latn-16876-71-1983.yaml +186 -0
  65. data/maps/hk-yue-Hani-Latn-1888.yaml +38497 -0
  66. data/maps/icao-bel-Cyrl-Latn-9303.yaml +108 -92
  67. data/maps/icao-bul-Cyrl-Latn-9303.yaml +1 -2
  68. data/maps/icao-heb-Hebr-Latn-9303.yaml +118 -124
  69. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +1 -2
  70. data/maps/icao-per-Arab-Latn-9303.yaml +5 -6
  71. data/maps/icao-rus-Cyrl-Latn-9303.yaml +1 -2
  72. data/maps/icao-srp-Cyrl-Latn-9303.yaml +1 -2
  73. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +1 -2
  74. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +610 -0
  75. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +41 -0
  76. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +62 -0
  77. data/maps/{iso-rus-Cyrl-Latn-iso9.yaml → iso-rus-Cyrl-Latn-9-1995.yaml} +2 -3
  78. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +109 -0
  79. data/maps/kp-kor-Hang-Latn-2002.yaml +901 -0
  80. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +44820 -0
  81. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +411 -0
  82. data/maps/moct-kor-Hang-Latn-2000.yaml +803 -0
  83. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +541 -0
  84. data/maps/nil-kor-Hang-Hang-jamo.yaml +11193 -0
  85. data/maps/odni-kat-Geor-Latn-2015.yaml +88 -0
  86. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +157 -0
  87. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +90 -0
  88. data/maps/royin-tha-Thai-Latn-1968.yaml +179 -0
  89. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +180 -0
  90. data/maps/royin-tha-Thai-Latn-1999.yaml +76 -0
  91. data/maps/{cn-chn-Hans-Latn-pinyin.yaml → sac-zho-Hans-Latn-1979.yaml} +6 -7
  92. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +222 -0
  93. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +193 -0
  94. data/maps/un-bel-Cyrl-Latn-2007.yaml +114 -0
  95. data/maps/un-ben-Beng-Latn-2016.yaml +534 -0
  96. data/maps/un-ell-Grek-Latn-1987-tl.yaml +32 -0
  97. data/maps/un-ell-Grek-Latn-1987-ts.yaml +20 -0
  98. data/maps/un-ell-Grek-Latn-phonetic-1987.yaml +780 -0
  99. data/maps/un-mon-Mong-Latn-2013.yaml +19 -6
  100. data/maps/un-rus-Cyrl-Latn-1987.yaml +166 -0
  101. data/maps/un-ukr-cyrl-latn-1998.yaml +30 -0
  102. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +406 -0
  103. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +386 -0
  104. data/maps/var-kor-Hang-Latn-mr-1939.yaml +1054 -0
  105. data/maps/var-kor-Kore-Hang-2013.yaml +59754 -0
  106. data/maps/var-kor-Kore-Latn-mr-1939.yaml +37 -0
  107. data/maps/var-tha-Thai-Thai-phonemic.yaml +59 -0
  108. data/maps/var-tha-Thai-Zsym-ipa.yaml +301 -0
  109. data/maps/var-zho-Hani-Latn-1979.yaml +38908 -0
  110. data/spec/interscript/mapping_spec.rb +42 -0
  111. data/spec/interscript_spec.rb +20 -5
  112. data/spec/spec_helper.rb +3 -1
  113. metadata +149 -24
  114. data/maps/bgnpcgn-chn-Hans-Latn-pinyin.yaml +0 -7503
  115. data/maps/historic-jpn-Hrkt-Latn-hepburn.yaml +0 -336
  116. data/maps/icao-gre-Grek-Latn-9303.yaml +0 -101
  117. data/maps/mext-jpn-Hrkt-Latn-hepburn.yaml +0 -330
  118. data/maps/mext-jpn-Hrkt-Latn-kunrei.yaml +0 -308
  119. data/maps/un-jpn-Hrkt-Latn-hepburn.yaml +0 -313
  120. data/maps/un-jpn-Hrkt-Latn-kunrei.yaml +0 -354
@@ -20,103 +20,119 @@ description: |
20
20
 
21
21
  This document defines the transliteration mappings used to produce
22
22
  this transcription or transliteration.
23
+
23
24
  tests:
24
- - source:
25
- expected:
25
+ - source: Бабрыковіч Аляксандр
26
+ expected: Babrykovich Aliaksandr
27
+ - source: Міховіч Марыя
28
+ expected: Mikhovich Maryia
29
+ - source: Максім
30
+ expected: Maksim
31
+ - source: Іван
32
+ expected: Ivan
33
+ - source: СВЯТЛАНА
34
+ expected: SVIATLANA
35
+ - source: Ігар
36
+ expected: Ihar
37
+ - source: Палто Алена
38
+ expected: Palto Alena
39
+ - source: Мікалай
40
+ expected: Mikalai
41
+
26
42
  map:
27
43
  # https://www.icao.int/publications/Documents/9303_p3_cons_en.pdf
28
44
  characters:
29
- "\u0027": "", # '
30
- "\u0410": "A", # А
31
- "\u0411": "B", # Б
32
- "\u0414": "D", # Д
33
- "\u0401": "IO", # Ё
34
- "\u0415": "E", # Е
35
- "\u042D": "E", # Э
36
- "\u0424": "F", # Ф
37
- "\u0413": "H", # Г
38
- "\u0418": "I", # И
39
- "\u0419": "I", # Й
40
- "\u041A": "K", # К
41
- "\u041B": "L", # Л
42
- "\u041C": "M", # М
43
- "\u041D": "N", # Н
44
- "\u041E": "O", # О
45
- "\u041F": "P", # П
46
- "\u0420": "R", # Р
47
- "\u0421": "S", # С
48
- "\u0422": "T", # Т
49
- "\u0423": "U", # У
50
- "\u0412": "V", # В
51
- "\u042B": "Y", # Ы
52
- "\u0417": "Z", # З
53
- "\u0427": "CH", # Ч
54
- "\u042F": "IA", # Я
55
- "\u042E": "IU", # Ю
56
- "\u0425": "KH", # Х
57
- "\u0428": "SH", # Ш
58
- "\u0429": "SHCH", # Щ
59
- "\u0426": "TS", # Ц
60
- "\u0416": "ZH", # Ж
61
- "\u0490": "G", # Ґ
62
- "\u040E": "U", # Ў
63
- "\u046A": "U", # Ѫ
64
- "\u0402": "D", # Ђ
65
- "\u0405": "DZ", # Ѕ
66
- "\u0408": "J", # Ј
67
- "\u0409": "LJ", # Љ
68
- "\u040A": "NJ", # Њ
69
- "\u04BA": "C", # Һ
70
- "\u040F": "DZ", # Џ
71
- "\u0404": "IE", # Є
72
- "\u0407": "I", # Ї
73
- "\u0403": "G", # Ѓ
74
- "\u0406": "I", # І
45
+ "\u0027": "" # '
46
+ "\u0410": "A" # А
47
+ "\u0411": "B" # Б
48
+ "\u0414": "D" # Д
49
+ "\u0401": "IO" # Ё
50
+ "\u0415": "E" # Е
51
+ "\u042D": "E" # Э
52
+ "\u0424": "F" # Ф
53
+ "\u0413": "H" # Г
54
+ "\u0418": "I" # И
55
+ "\u0419": "I" # Й
56
+ "\u041A": "K" # К
57
+ "\u041B": "L" # Л
58
+ "\u041C": "M" # М
59
+ "\u041D": "N" # Н
60
+ "\u041E": "O" # О
61
+ "\u041F": "P" # П
62
+ "\u0420": "R" # Р
63
+ "\u0421": "S" # С
64
+ "\u0422": "T" # Т
65
+ "\u0423": "U" # У
66
+ "\u0412": "V" # В
67
+ "\u042B": "Y" # Ы
68
+ "\u0417": "Z" # З
69
+ "\u0427": "CH" # Ч
70
+ "\u042F": "IA" # Я
71
+ "\u042E": "IU" # Ю
72
+ "\u0425": "KH" # Х
73
+ "\u0428": "SH" # Ш
74
+ "\u0429": "SHCH" # Щ
75
+ "\u0426": "TS" # Ц
76
+ "\u0416": "ZH" # Ж
77
+ "\u0490": "G" # Ґ
78
+ "\u040E": "U" # Ў
79
+ "\u046A": "U" # Ѫ
80
+ "\u0402": "D" # Ђ
81
+ "\u0405": "DZ" # Ѕ
82
+ "\u0408": "J" # Ј
83
+ "\u0409": "LJ" # Љ
84
+ "\u040A": "NJ" # Њ
85
+ "\u04BA": "C" # Һ
86
+ "\u040F": "DZ" # Џ
87
+ "\u0404": "IE" # Є
88
+ "\u0407": "I" # Ї
89
+ "\u0403": "G" # Ѓ
90
+ "\u0406": "I" # І
75
91
 
76
- "\u0430": "a", # а
77
- "\u0431": "b", # б
78
- "\u0434": "d", # д
79
- "\u0451": "io", # ё
80
- "\u0435": "e", # e
81
- "\u044D": "e", # э
82
- "\u0444": "f", # ф
83
- "\u0433": "h", # г
84
- "\u0438": "i", # и
85
- "\u0439": "i", # й
86
- "\u043A": "k", # к
87
- "\u043B": "l", # л
88
- "\u043C": "m", # м
89
- "\u043D": "n", # н
90
- "\u043E": "o", # о
91
- "\u043F": "p", # п
92
- "\u0440": "r", # р
93
- "\u0441": "s", # с
94
- "\u0442": "t", # т
95
- "\u0443": "", # у
96
- "\u0432": "v", # в
97
- "\u044B": "y", # ы
98
- "\u0437": "z", # з
99
- "\u0447": "ch", # ч
100
- "\u044F": "ia", # я
101
- "\u044E": "i", # ю
102
- "\u0445": "kh", # х
103
- "\u0448": "sh", # ш
104
- "\u0449": "shch", # щ
105
- "\u0446": "ts", # ц
106
- "\u0436": "zh", # ж
107
- "\u0491": "g", # ґ
108
- "\u045E": "", # ў
109
- "\u046B": "", # ѫ
110
- "\u0452": "d", # ђ
111
- "\u0455": "dz", # ѕ
112
- "\u0458": "j", # ј
113
- "\u0459": "lj", # љ
114
- "\u045A": "nj", # њ
115
- "\u04BB": "c", # һ
116
- "\u045F": "dz", # џ
117
- "\u0454": "ie", # є
118
- "\u0457": "i", # ї
119
- "\u0453": "g", # ѓ
92
+ "\u0430": "a" # а
93
+ "\u0431": "b" # б
94
+ "\u0434": "d" # д
95
+ "\u0451": "io" # ё
96
+ "\u0435": "e" # e
97
+ "\u044D": "e" # э
98
+ "\u0444": "f" # ф
99
+ "\u0433": "h" # г
100
+ "\u0438": "i" # и
101
+ "\u0439": "i" # й
102
+ "\u043A": "k" # к
103
+ "\u043B": "l" # л
104
+ "\u043C": "m" # м
105
+ "\u043D": "n" # н
106
+ "\u043E": "o" # о
107
+ "\u043F": "p" # п
108
+ "\u0440": "r" # р
109
+ "\u0441": "s" # с
110
+ "\u0442": "t" # т
111
+ "\u0443": "" # у
112
+ "\u0432": "v" # в
113
+ "\u044B": "y" # ы
114
+ "\u0437": "z" # з
115
+ "\u0447": "ch" # ч
116
+ "\u044F": "ia" # я
117
+ "\u044E": "i" # ю
118
+ "\u0445": "kh" # х
119
+ "\u0448": "sh" # ш
120
+ "\u0449": "shch" # щ
121
+ "\u0446": "ts" # ц
122
+ "\u0436": "zh" # ж
123
+ "\u0491": "g" # ґ
124
+ "\u045E": "" # ў
125
+ "\u046B": "" # ѫ
126
+ "\u0452": "d" # ђ
127
+ "\u0455": "dz" # ѕ
128
+ "\u0458": "j" # ј
129
+ "\u0459": "lj" # љ
130
+ "\u045A": "nj" # њ
131
+ "\u04BB": "c" # һ
132
+ "\u045F": "dz" # џ
133
+ "\u0454": "ie" # є
134
+ "\u0457": "i" # ї
135
+ "\u0453": "g" # ѓ
120
136
  "\u0456": "i" # і
121
137
 
122
138
 
@@ -21,8 +21,7 @@ description: |
21
21
  This document defines the transliteration mappings used to produce
22
22
  this transcription or transliteration.
23
23
  tests:
24
- - source:
25
- expected:
24
+
26
25
  map:
27
26
  # https://www.icao.int/publications/Documents/9303_p3_cons_en.pdf
28
27
  characters:
@@ -21,137 +21,131 @@ description: |
21
21
  This document defines the transliteration mappings used to produce
22
22
  this transcription or transliteration.
23
23
  tests:
24
- - source:
25
- expected:
24
+
26
25
  map:
27
26
  # https://en.wikipedia.org/wiki/Romanization_of_Hebrew
28
27
 
29
28
  characters:
30
- "\u0027": "", # '
29
+ "\u0027": "" # '
31
30
 
32
31
  # Consonants
33
- "\u05D0": "", # א
34
- "\u05D1": "V", # ב
35
- "\u05D1\u05BC": "B", # בּ
36
- "\uFB31": "B", # בּ
37
- "\u05D2": "G", # ג
38
- "\u05D2\u05BC": "G", # גּ
39
- "\uFB32": "G", # גּ‬‬
40
- "\u05D2\u05F3": "J", # ג׳
41
- "\u05D3": "D", # ד
42
- "\u05D3\u05BC": "D", # דּ
43
- "\uFB33": "D", # דּ
44
- "\u05D3\u05F3": "DH", # ד׳
45
- "\u05D4": "H", # ה
46
- "\u05D4\u05BC": "H", # הּ
47
- "\uFB34": "H", # הּ
48
- "\u05D5": "V", # ו‬
49
- "\u05D5\u202C": "V", # ו‬
50
- "\u05D5\u05BC": "V", # וּ
51
- # "\uFB35": "V", # וּ # To vowels "U"
52
- "\u05D6": "Z", # ז
53
- "\u05D6\u05BC": "Z", # זּ
54
- "\uFB36": "Z", # זּ‬
55
- "\u05D6\u05F3": "ZH", # ז׳
56
- "\u05D7": "CH", # ח
57
- "\u05D8": "T", # ט
58
- "\u05D8\u05BC": "T", # טּ
59
- "\uFB38": "T", # טּ
60
- "\u05D9": "Y", # י
61
- "\u05D9\u05BC": "Y", # יּ
62
- "\u05D9\u05BC" +
63
- "\u202C": "Y", # יּ‬
64
- "\uFB39": "Y", # יּ‬
65
- "\u05DB": "CH", # כ
66
- "\u05DB\u05BC": "CH", # כּ
67
- "\u05DB\u05BC" +
68
- "\u202C": "CH", # כּ
69
- "\uFB3B": "C", #
70
- "\u05DA": "CH", # ך
71
- "\u05DA\u05BC": "CH", # ךּ
72
- "\u05DA\u05BC" +
73
- "\u202C": "CH", # ךּ‬
74
- "\uFB3A": "CH", #
75
- "\u05DC": "L", # ל‬
76
- "\u05DC\u05BC": "L", # לּ
77
- "\uFB3C": "L", #
78
- "\u05DD": "M", # ם
79
- "\u05DE": "M", # מ‬
80
- "\u05DE\u05BC": "M", # מּ
81
- "\uFB3E": "M", # מּ‬
82
- "\u05DF": "N", # ן
83
- "\u05E0": "N", # נ
84
- "\u05E0\u05BC": "N", # נּ
85
- "\uFB40": "N", #
86
- "\u05E1": "S", # ס
87
- "\u05E1\u05BC": "S", # סּ
88
- "\uFB41": "S", #
89
- "\u05E2": "", # ע
90
- "\u05E3": "F", # ף
91
- "\u05E3\u05BC": "P", # Possible problem u05BC # ףּ
92
- "\uFB43": "P", #
93
- "\u05E4": "F", # פ‬
94
- "\u05E4\u05BC": "P", # פּ
95
- "\uFB44": "P", #
96
- "\u05E5": "TZ", # ץ
97
- "\u05E5\u05F3": "TSH", # Possible problem u05F3 # ץ׳
98
- "\u05E6": "TZ", # צ‬
99
- "\u05E6\u05BC": "TZ", # צּ
100
- "\uFB46": "TZ", # צּ‬
101
- "\u05E6\u05F3": "TSH", # Possible problem u05F3 # צ׳
102
- "\u05E7": "Q", # ק
103
- "\u05E7\u05BC": "Q", # קּ
104
- "\uFB47": "Q", # קּ‬
105
- "\u05E8": "R", # ר
106
- "\u05E8\u05BC": "R", # רּ
107
- "\uFB48": "R", #
108
- "\u05E9": "S", # ש
109
- "\u05E9\u05BC": "S", # שּ
110
- "\uFB49": "S", # שּ‬
111
- "\u05E9\u05C2" +
112
- "\u202C": "S", # שׂ
113
- "\uFB2B": "S", #
114
- "\u05E9\u05C1": "SH", # שׁ
115
- "\uFB2A": "SH", #
116
- "\u05E9\u05BC" +
117
- "\u05C2\u202C": "S", # שּׂ‬
118
- "\uFB2D": "S", # שּׂ
119
- "\u05EA": "T", # ת
120
- "\u05EA\u05BC": "T", # תּ
121
- "\uFB4A": "T", # תּ
122
- "\u05EA\u05F3": "T", # ת׳
32
+ "\u05D0": "" # א
33
+ "\u05D1": "V" # ב
34
+ "\u05D1\u05BC": "B" # בּ
35
+ "\uFB31": "B" # בּ
36
+ "\u05D2": "G" # ג
37
+ "\u05D2\u05BC": "G" # גּ
38
+ "\uFB32": "G" # גּ‬‬
39
+ "\u05D2\u05F3": "J" # ג׳
40
+ "\u05D3": "D" # ד
41
+ "\u05D3\u05BC": "D" # דּ
42
+ "\uFB33": "D" # דּ
43
+ "\u05D3\u05F3": "DH" # ד׳
44
+ "\u05D4": "H" # ה
45
+ "\u05D4\u05BC": "H" # הּ
46
+ "\uFB34": "H" # הּ
47
+ "\u05D5": "V" # ו‬
48
+ "\u05D5\u202C": "V" # ו‬
49
+ "\u05D5\u05BC": "V" # וּ
50
+ # "\uFB35": "V" # וּ # To vowels "U"
51
+ "\u05D6": "Z" # ז
52
+ "\u05D6\u05BC": "Z" # זּ
53
+ "\uFB36": "Z" # זּ‬
54
+ "\u05D6\u05F3": "ZH" # ז׳
55
+ "\u05D7": "CH" # ח
56
+ "\u05D8": "T" # ט
57
+ "\u05D8\u05BC": "T" # טּ
58
+ "\uFB38": "T" # טּ
59
+ "\u05D9": "Y" # י
60
+ "\u05D9\u05BC": "Y" # יּ
61
+ "\u05D9\u05BC\u202C": "Y" # יּ‬
62
+ "\uFB39": "Y" # יּ‬
63
+ "\u05DB": "CH" # כ
64
+ "\u05DB\u05BC": "CH" # כּ
65
+ "\u05DB\u05BC\u202C": "CH" # כּ
66
+ "\uFB3B": "C" #
67
+ "\u05DA": "CH" # ך
68
+ "\u05DA\u05BC": "CH" # ךּ
69
+ "\u05DA\u05BC\u202C": "CH" # ךּ‬
70
+ "\uFB3A": "CH" #
71
+ "\u05DC": "L" # ל‬
72
+ "\u05DC\u05BC": "L" # לּ
73
+ "\uFB3C": "L" #
74
+ "\u05DD": "M" # ם
75
+ "\u05DE": "M" # מ‬
76
+ "\u05DE\u05BC": "M" # מּ
77
+ "\uFB3E": "M" # מּ‬
78
+ "\u05DF": "N" # ן
79
+ "\u05E0": "N" # נ
80
+ "\u05E0\u05BC": "N" # נּ
81
+ "\uFB40": "N" #
82
+ "\u05E1": "S" # ס
83
+ "\u05E1\u05BC": "S" # סּ
84
+ "\uFB41": "S" #
85
+ "\u05E2": "" # ע
86
+ "\u05E3": "F" # ף
87
+ "\u05E3\u05BC": "P" # Possible problem u05BC # ףּ
88
+ "\uFB43": "P" #
89
+ "\u05E4": "F" # פ‬
90
+ "\u05E4\u05BC": "P" # פּ
91
+ "\uFB44": "P" #
92
+ "\u05E5": "TZ" # ץ
93
+ "\u05E5\u05F3": "TSH" # Possible problem u05F3 # ץ׳
94
+ "\u05E6": "TZ" # צ‬
95
+ "\u05E6\u05BC": "TZ" # צּ
96
+ "\uFB46": "TZ" # צּ‬
97
+ "\u05E6\u05F3": "TSH" # Possible problem u05F3 # צ׳
98
+ "\u05E7": "Q" # ק
99
+ "\u05E7\u05BC": "Q" # קּ
100
+ "\uFB47": "Q" # קּ‬
101
+ "\u05E8": "R" # ר
102
+ "\u05E8\u05BC": "R" # רּ
103
+ "\uFB48": "R" #
104
+ "\u05E9": "S" # ש
105
+ "\u05E9\u05BC": "S" # שּ
106
+ "\uFB49": "S" # שּ‬
107
+ "\u05E9\u05C2\u202C": "S" # שׂ
108
+ "\uFB2B": "S" #
109
+ "\u05E9\u05C1": "SH" # שׁ
110
+ "\uFB2A": "SH" #
111
+ "\u05E9\u05BC\u05C2\u202C": "S" # שּׂ‬
112
+ "\uFB2D": "S" #
113
+ "\u05EA": "T" # ת
114
+ "\u05EA\u05BC": "T" # תּ
115
+ "\uFB4A": "T" #
116
+ "\u05EA\u05F3": "T" # ת׳
123
117
 
124
118
  # Niqqud vowels
125
- "\u05B0": "E", # ( ְ‬ )
126
- "\u05B1": "E", # ( ֱ )
127
- "\u05B2": "A", # ( ֲ )
128
- "\u05B3": "O", # ( ֲ )
129
- "\u05B4": "I", # ( ִ )
130
- "\u05B5": "E", # ( ֵ )
131
- "\u05B6": "E", # ( ֶ )
132
- "\u05B7": "A", # ( ַ )
133
- "\u05B8": "O", # ( ָ ) # It could be "A" too
134
- "\u05B9": "O", # ( ֹ )
135
- "\u05BB": "U", # ( ֻ )
136
- "\u05D5\u05BC": "U", # ( וּ )
137
- "\uFB35": "U", # ( וּ )
119
+ "\u05B0": "E" # ( ְ‬ )
120
+ "\u05B1": "E" # ( ֱ )
121
+ "\u05B2": "A" # ( ֲ )
122
+ "\u05B3": "O" # ( ֲ )
123
+ "\u05B4": "I" # ( ִ )
124
+ "\u05B5": "E" # ( ֵ )
125
+ "\u05B6": "E" # ( ֶ )
126
+ "\u05B7": "A" # ( ַ )
127
+ "\u05B8": "O" # ( ָ ) # It could be "A" too
128
+ "\u05B9": "O" # ( ֹ )
129
+ "\u05BB": "U" # ( ֻ )
130
+ "\u05D5\u05BC": "U" # ( וּ )
131
+ "\uFB35": "U" # ( וּ )
138
132
 
139
133
  # Diphthongs
140
- "\u05B5\u05D9": "EI", # ( ֵי )
141
- "\u05B6\u05D9": "EI", # ( ֶי )
142
- "\u05B7\u05D9": "AI", # ( ַי )
143
- "\u05B7\u05D9\u05B0": "AI", # ( ַיְ )
144
- "\u05B7\u05D9\u05B0\u202C": "AI", # ( ַיְ‬ )
145
- "\u05B8\u05D9": "AI", # ( ָי )
146
- "\u05B8\u05D9\u202C": "AI", # ( ָי‬ )
147
- "\u05B8\u05D9\u05B0": "AI", # ( ָיְ )
148
- "\u05B8\u05D9\u05B0\u202C": "AI", # ( ָיְ‬ )
149
- "\u05B9\u05D9": "OI", # ( ֹי )
150
- "\u05B9\u05D9\u05B0": "OI", # ( ֹיְ )
151
- "\u05B9\u05D9\u05B0\u202C": "OI", # ( ֹיְ‬ )
152
- "\u05BB\u05D9": "UI", # ( ֻי )
153
- "\u05BB\u05D9\u05B0": "UI", # ( ֻיְ )
154
- "\u05BB\u05D9\u05B0\u202C": "UI", # ( ֻיְ‬ )
155
- "\u05D5\u05BC\u05D9": "UI", # ( וּי )
156
- "\u05D5\u05BC\u05D9\u05B0": "UI", # ( וּיְ )
157
- "\u05D5\u05BC\u05D9\u05B0\u202C": "UI", # ( וּיְ‬ )
134
+ "\u05B5\u05D9": "EI" # ( ֵי )
135
+ "\u05B6\u05D9": "EI" # ( ֶי )
136
+ "\u05B7\u05D9": "AI" # ( ַי )
137
+ "\u05B7\u05D9\u05B0": "AI" # ( ַיְ )
138
+ "\u05B7\u05D9\u05B0\u202C": "AI" # ( ַיְ‬ )
139
+ "\u05B8\u05D9": "AI" # ( ָי )
140
+ "\u05B8\u05D9\u202C": "AI" # ( ָי‬ )
141
+ "\u05B8\u05D9\u05B0": "AI" # ( ָיְ )
142
+ "\u05B8\u05D9\u05B0\u202C": "AI" # ( ָיְ‬ )
143
+ "\u05B9\u05D9": "OI" # ( ֹי )
144
+ "\u05B9\u05D9\u05B0": "OI" # ( ֹיְ )
145
+ "\u05B9\u05D9\u05B0\u202C": "OI" # ( ֹיְ‬ )
146
+ "\u05BB\u05D9": "UI" # ( ֻי )
147
+ "\u05BB\u05D9\u05B0": "UI" # ( ֻיְ )
148
+ "\u05BB\u05D9\u05B0\u202C": "UI" # ( ֻיְ‬ )
149
+ "\u05D5\u05BC\u05D9": "UI" # ( וּי )
150
+ "\u05D5\u05BC\u05D9\u05B0": "UI" # ( וּיְ )
151
+ "\u05D5\u05BC\u05D9\u05B0\u202C": "UI" # ( וּיְ‬ )