interscript-maps 2.2.0 → 2.2.1

Sign up to get free protection for your applications and to get access to all the features.
Files changed (192) hide show
  1. checksums.yaml +4 -4
  2. data/interscript-maps.gemspec +1 -1
  3. data/interscript-maps.yaml +300 -111
  4. data/maps/acadsin-zho-Hani-Latn-2002.imp +2 -2
  5. data/maps/alalc-amh-Ethi-Latn-1997.imp +18 -14
  6. data/maps/alalc-amh-Ethi-Latn-2011.imp +1 -1
  7. data/maps/alalc-ara-Arab-Latn-1997.imp +1 -1
  8. data/maps/alalc-asm-Deva-Latn-1997.imp +1 -1
  9. data/maps/alalc-asm-Deva-Latn-2012.imp +1 -1
  10. data/maps/alalc-aze-Arab-Latn-1997.imp +1 -1
  11. data/maps/alalc-aze-Cyrl-Latn-1997.imp +1 -1
  12. data/maps/alalc-bel-Cyrl-Latn-1997.imp +4 -4
  13. data/maps/alalc-ben-Beng-Latn-1997.imp +1 -1
  14. data/maps/alalc-ben-Beng-Latn-2017.imp +1 -1
  15. data/maps/alalc-bul-Cyrl-Latn-1997.imp +1 -1
  16. data/maps/alalc-div-Thaa-Latn-1997.imp +1 -1
  17. data/maps/alalc-ell-Grek-Latn-1997.imp +1 -1
  18. data/maps/alalc-ell-Grek-Latn-2010.imp +1 -1
  19. data/maps/alalc-guj-Gujr-Latn-1997.imp +1 -1
  20. data/maps/alalc-guj-Gujr-Latn-2011.imp +1 -1
  21. data/maps/alalc-hin-Deva-Latn-1997.imp +1 -1
  22. data/maps/alalc-hin-Deva-Latn-2011.imp +1 -1
  23. data/maps/alalc-kan-Kana-Latn-1997.imp +1 -1
  24. data/maps/alalc-kan-Kana-Latn-2011.imp +1 -1
  25. data/maps/alalc-kat-Geok-Latn-1997.imp +3 -3
  26. data/maps/alalc-kat-Geor-Latn-1997.imp +12 -12
  27. data/maps/alalc-kor-Hang-Latn-1997.imp +1 -1
  28. data/maps/alalc-mal-Mlym-Latn-1997.imp +1 -1
  29. data/maps/alalc-mar-Deva-Latn-1997.imp +1 -1
  30. data/maps/alalc-mar-Deva-Latn-2011.imp +1 -1
  31. data/maps/alalc-mkd-Cyrl-Latn-1997.imp +2 -2
  32. data/maps/alalc-mkd-Cyrl-Latn-2013.imp +2 -2
  33. data/maps/alalc-mon-Cyrl-Latn-1997.imp +3 -3
  34. data/maps/alalc-ori-Orya-Latn-1997.imp +1 -1
  35. data/maps/alalc-ori-Orya-Latn-2011.imp +1 -1
  36. data/maps/alalc-pan-Guru-Latn-1997.imp +1 -1
  37. data/maps/alalc-pan-Guru-Latn-2011.imp +1 -1
  38. data/maps/alalc-per-Arab-Latn-1997.imp +1 -1
  39. data/maps/alalc-pli-Deva-Latn-2012.imp +1 -1
  40. data/maps/alalc-pra-Deva-Latn-2012.imp +1 -1
  41. data/maps/alalc-rus-Cyrl-Latn-1997.imp +2 -2
  42. data/maps/alalc-rus-Cyrl-Latn-2012.imp +1 -1
  43. data/maps/alalc-san-Deva-Latn-2012.imp +1 -1
  44. data/maps/alalc-sin-Sinh-Latn-1997.imp +1 -1
  45. data/maps/alalc-sin-Sinh-Latn-2011.imp +1 -1
  46. data/maps/alalc-srp-Cyrl-Latn-1997.imp +2 -2
  47. data/maps/alalc-srp-Cyrl-Latn-2013.imp +1 -1
  48. data/maps/alalc-tam-Taml-Latn-1997.imp +1 -1
  49. data/maps/alalc-tam-Taml-Latn-2011.imp +1 -1
  50. data/maps/alalc-tel-Telu-Latn-1997.imp +2 -2
  51. data/maps/alalc-tel-Telu-Latn-2011.imp +1 -1
  52. data/maps/alalc-tir-Ethi-Latn-1997.imp +429 -0
  53. data/maps/alalc-tir-Ethi-Latn-2011.imp +85 -0
  54. data/maps/alalc-ukr-Cyrl-Latn-1997.imp +1 -1
  55. data/maps/alalc-ukr-Cyrl-Latn-2011.imp +1 -1
  56. data/maps/apcbg-bul-Cyrl-Latn-1995.imp +7 -4
  57. data/maps/az-aze-Cyrl-Latn-1939.imp +1 -0
  58. data/maps/az-aze-Cyrl-Latn-1958.imp +1 -0
  59. data/maps/bgn-jpn-Hrkt-Latn-1962.imp +5 -5
  60. data/maps/bgn-kor-Hang-Latn-1943.imp +1 -1
  61. data/maps/bgn-kor-Kore-Latn-1943.imp +1 -1
  62. data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +11 -11
  63. data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +1 -1
  64. data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +2 -2
  65. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +2 -2
  66. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +10 -4
  67. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +1 -1
  68. data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +1 -1
  69. data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +4 -4
  70. data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +1 -1
  71. data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +1 -1
  72. data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +1 -1
  73. data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +4 -3
  74. data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +1 -1
  75. data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +1 -1
  76. data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +2 -2
  77. data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +1 -1
  78. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +1 -1
  79. data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +8 -8
  80. data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +2 -2
  81. data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +4 -4
  82. data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +3 -3
  83. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +1 -1
  84. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +4 -4
  85. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +4 -3
  86. data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +1 -1
  87. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +2 -2
  88. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +1 -1
  89. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +3 -3
  90. data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +4 -4
  91. data/maps/bgnpcgn-per-Arab-Latn-1958.imp +19 -19
  92. data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +15 -15
  93. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +15 -15
  94. data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +16 -16
  95. data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +2 -2
  96. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +5 -5
  97. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +1 -1
  98. data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +1 -1
  99. data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +5 -3
  100. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +1 -1
  101. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +1 -1
  102. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +1 -1
  103. data/maps/bgnpcgn-tir-Ethi-Latn-2007.imp +511 -0
  104. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +1 -1
  105. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +1 -1
  106. data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +15 -15
  107. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +3 -3
  108. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +1 -1
  109. data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +1 -1
  110. data/maps/by-bel-Cyrl-Latn-2007.imp +7 -5
  111. data/maps/dos-nep-Deva-Latn-1997.imp +2 -2
  112. data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +1 -1
  113. data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +1 -1
  114. data/maps/ggg-kat-Geor-Latn-2002.imp +3 -3
  115. data/maps/gki-bel-Cyrl-Latn-2000.imp +1 -1
  116. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +1 -1
  117. data/maps/iso-ara-Arab-Latn-233-1984.imp +14 -14
  118. data/maps/iso-ben-Beng-Latn-15919-2001.imp +1 -1
  119. data/maps/iso-prs-Arab-Latn-233-3-1999.imp +14 -14
  120. data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +5 -5
  121. data/maps/mext-jpn-Hrkt-Latn-1954.imp +2 -1
  122. data/maps/moct-kor-Hang-Latn-2000.imp +1 -1
  123. data/maps/mofa-jpn-Hrkt-Latn-1989.imp +1 -1
  124. data/maps/mv-div-Thaa-Latn-1987.imp +1 -1
  125. data/maps/mvd-bel-Cyrl-Latn-2008.imp +5 -5
  126. data/maps/mvd-bel-Cyrl-Latn-2010.imp +2 -5
  127. data/maps/mvd-rus-Cyrl-Latn-2008.imp +4 -3
  128. data/maps/mvd-rus-Cyrl-Latn-2010.imp +2 -5
  129. data/maps/odni-ara-Arab-Latn-2004.imp +1 -1
  130. data/maps/odni-ara-Arab-Latn-2015.imp +1 -1
  131. data/maps/odni-aze-Cyrl-Latn-2015.imp +1 -1
  132. data/maps/odni-bel-Cyrl-Latn-2015.imp +1 -1
  133. data/maps/odni-bul-Cyrl-Latn-2005.imp +2 -2
  134. data/maps/odni-bul-Cyrl-Latn-2015.imp +1 -1
  135. data/maps/odni-che-Cyrl-Latn-2015.imp +1 -1
  136. data/maps/odni-fas-Arab-Latn-2004.imp +14 -14
  137. data/maps/odni-fas-Arab-Latn-2015.imp +15 -15
  138. data/maps/odni-hin-Deva-Latn-2004.imp +20 -20
  139. data/maps/odni-hin-Deva-Latn-2015.imp +25 -26
  140. data/maps/odni-kat-Geor-Latn-2015.imp +2 -3
  141. data/maps/odni-kaz-Cyrl-Latn-2015.imp +1 -1
  142. data/maps/odni-kir-Cyrl-Latn-2015.imp +1 -1
  143. data/maps/odni-kor-Hang-Latn-2015.imp +1 -1
  144. data/maps/odni-mkd-Cyrl-Latn-2005.imp +1 -1
  145. data/maps/odni-mkd-Cyrl-Latn-2015.imp +1 -1
  146. data/maps/odni-prs-Arab-Latn-2015.imp +1 -1
  147. data/maps/odni-pus-Arab-Latn-2011.imp +1 -1
  148. data/maps/odni-rus-Cyrl-Latn-2015.imp +1 -1
  149. data/maps/odni-srp-Cyrl-Latn-2005.imp +2 -2
  150. data/maps/odni-srp-Cyrl-Latn-2015.imp +8 -8
  151. data/maps/odni-tat-Cyrl-Latn-2015.imp +1 -1
  152. data/maps/odni-tgk-Cyrl-Latn-2015.imp +1 -1
  153. data/maps/odni-tuk-Cyrl-Latn-2015.imp +1 -1
  154. data/maps/odni-uig-Cyrl-Latn-2015.imp +1 -1
  155. data/maps/odni-ukr-Cyrl-Latn-2015.imp +1 -1
  156. data/maps/odni-urd-Arab-Latn-2015.imp +21 -21
  157. data/maps/odni-uzb-Cyrl-Latn-2015.imp +1 -1
  158. data/maps/ses-ara-Arab-Latn-1930.imp +14 -14
  159. data/maps/un-amh-Ethi-Latn-2016.imp +1 -1
  160. data/maps/un-ara-Arab-Latn-1971.imp +5 -5
  161. data/maps/un-ara-Arab-Latn-1972.imp +4 -4
  162. data/maps/un-ara-Arab-Latn-2017.imp +15 -15
  163. data/maps/un-asm-Beng-Latn-1972.imp +1 -1
  164. data/maps/un-bel-Cyrl-Latn-2007.imp +2 -2
  165. data/maps/un-ben-Beng-Latn-2016.imp +1 -1
  166. data/maps/un-bul-Cyrl-Latn-1977.imp +197 -0
  167. data/maps/un-ell-Grek-Latn-1987-phonetic.imp +5 -1
  168. data/maps/un-ell-Grek-Latn-1987-tl.imp +1 -1
  169. data/maps/un-ell-Grek-Latn-1987-ts.imp +2 -2
  170. data/maps/un-guj-Gujr-Latn-1972.imp +1 -1
  171. data/maps/un-hin-Deva-Latn-2016.imp +1 -1
  172. data/maps/un-kan-Kana-Latn-2016.imp +1 -1
  173. data/maps/un-mal-Mlym-Latn-1972.imp +1 -1
  174. data/maps/un-mar-Deva-Latn-2016.imp +1 -1
  175. data/maps/un-mkd-Cyrl-Latn-1977.imp +119 -0
  176. data/maps/un-mon-Mong-Latn-general-2013.imp +1 -1
  177. data/maps/un-mon-Mong-Latn-phonetic-2013.imp +1 -1
  178. data/maps/un-nep-Deva-Latn-1972.imp +1 -1
  179. data/maps/un-nep-Deva-Latn-2013.imp +1 -1
  180. data/maps/un-ori-Orya-Latn-1972.imp +1 -1
  181. data/maps/un-pan-Guru-Latn-1972.imp +1 -1
  182. data/maps/un-prs-Arab-Latn-1967.imp +15 -15
  183. data/maps/un-rus-Cyrl-Latn-1987.imp +1 -1
  184. data/maps/un-sin-Sinh-Latn-1972.imp +1 -1
  185. data/maps/un-srp-Cyrl-Latn-1997.imp +47 -0
  186. data/maps/un-tam-Taml-Latn-1972.imp +1 -1
  187. data/maps/un-tel-Telu-Latn-1972.imp +1 -1
  188. data/maps/un-ukr-Cyrl-Latn-1998.imp +1 -1
  189. data/maps/un-ukr-Cyrl-Latn-2012.imp +1 -1
  190. data/maps/un-urd-Arab-Latn-1972.imp +15 -15
  191. data/maps/var-amh-Ethi-Latn-eae-2003.imp +48 -43
  192. metadata +7 -1
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:ron
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: CYRILLIC - ROMAN BGN/PCGN 2002 Agreement
7
+ name: Table of Correspondences for Moldovan (Cyrillic-Roman) (2002 Agreement)
8
8
  url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/816780/TABLE_OF_CORRESPONDENCES_FOR_MOLDOVAN.pdf
9
9
  creation_date: 2002
10
10
  confirmation_date: 2019
@@ -14,7 +14,7 @@ metadata {
14
14
  and the current Roman alphabet. When Moldovan Roman-alphabet spellings are not available, this table
15
15
  can be used to convert Moldovan Cyrillic spellings. It should be noted that Moldovan is little used as a
16
16
  language label now, and is usually considered as Romanian.
17
-
17
+
18
18
  notes:
19
19
  - | # 1
20
20
  This Roman-script form is used before e, i and iu.
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:rue
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: ROMANIZATION OF RUSYN, BGN/PCGN 2016 System
7
+ name: Romanization of Rusyn (2016)
8
8
  url: https://geonames.nga.mil/gns/html/Romanization/ROMANIZATION%20OF%20RUSYN.pdf
9
9
  creation_date: 2016
10
10
  confirmation_date: 2017
@@ -14,17 +14,17 @@ metadata {
14
14
  The Rusyn alphabet is almost identical to the Ukrainian alphabet, but contains three characters not
15
15
  present in the Ukrainian alphabet: ё, ы, and ъ. These letters are also absent from the alphabet used by
16
16
  Pannonian Rusyn. This table applies to both dialects of Rusyn.
17
-
17
+
18
18
  notes:
19
19
  - |
20
20
  The letters ё, ы, and ъ are present in the orthography of the Carpatho‐Rusyn variant of the Rusyn
21
21
  language. This variant is predominant among Rusyn speakers in Ukraine, Poland, Slovakia, Hungary, and
22
22
  Romania. The letters are absent from the orthography of Pannonian Rusyn, which is predominant in
23
23
  Serbia and Croatia.
24
-
24
+
25
25
  - |
26
26
  Unicode for Latin‐script characters: Ž/ž (017D, 017E); Č/č (010C, 010D); Š/š (0160, 0161); ’ (0027).
27
-
27
+
28
28
  - |
29
29
  The Romanization columns show only lowercase forms but, when romanizing, uppercase and
30
30
  lowercase Roman letters as appropriate should be used.
@@ -91,7 +91,7 @@ stage {
91
91
  sub "Я", "Ya" # Я
92
92
  sub "Ь", "'" # Ь => '
93
93
  sub "Ъ", "'" # Ъ => '
94
-
94
+
95
95
  sub "а", "a" # а
96
96
  sub "б", "b" # б
97
97
  sub "в", "v" # в
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:rus
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: ROMANIZATION OF RUSSIAN, BGN/PCGN 1947 System
7
+ name: Romanization of Russian (1947)
8
8
  url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/807920/ROMANIZATION_OF_RUSSIAN.pdf
9
9
  creation_date: 1947
10
10
  confirmation_date: 2019-06
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:sme
5
5
  source_script: Latn
6
6
  destination_script: Latn
7
- name: BGN/PCGN Northern Sami (North Lappish) 1984 Roman-Script Spelling Convention Agreement
7
+ name: Roman-Script Spelling Convention of Northern Sami (North Lappish) (1984 Agreement)
8
8
  url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/693794/ROMAN-SCRIPT_SPELLING_CONVENTIONS.pdf
9
9
  creation_date: 1984
10
10
 
@@ -4,15 +4,17 @@ metadata {
4
4
  language: iso-639-2:srp
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: TRANSLITERATION OF SERBIAN CYRILLIC
7
+ name: Transliteration of Serbian Cyrillic
8
8
  creation_date: 1962
9
9
  confirmation_date: 1962
10
10
  description: |
11
11
  Serbo-Croatian, the official national language of Yugoslavia, is a single literary language.
12
+
12
13
  In Serbian areas it is written in the cyrillic (Serbian) alphabet, while in Croatian areas it is
13
14
  written in the roman (Croatian) alphabet.
14
- Both the BGN and PCGN use the standard Croation equivalents for fomanizing the Serbian cyrillic
15
- alphabet whenether romanized names are not available.
15
+
16
+ Both the BGN and PCGN use the standard Croatian equivalents for romanizing the Serbian cyrillic
17
+ alphabet whenever romanized names are not available.
16
18
 
17
19
  notes:
18
20
  - The digraph dj(Dj) will occasionally be found as the Croatian equivalent of ђ(Ђ),
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:srp
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: ROMANIZATION OF SERBIAN, BGN/PCGN 2005 System
7
+ name: Table of Correspondences for Serbian (Cyrillic-Roman) (2005 Agreement)
8
8
  url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/816783/TABLE_OF_CORRESPONDENCES_FOR_SERBIAN.pdf
9
9
  creation_date: 2005
10
10
  confirmation_date: 2019-06
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:tat
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: TATAR TABLE OF CORRESPONDENCES CYRILLIC - ROMAN BGN/PCGN 2007 Agreement
7
+ name: Table of Correspondences for Tatar (Cyrillic-Roman) (2007 Agreement)
8
8
  url: https://geonames.nga.mil/gns/html/Romanization/TABLE%20OF%20CORRESPONDENCES%20FOR%20TATAR.pdf
9
9
  creation_date: 2007
10
10
  confirmation_date: 2017-11
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:tgk
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: BGN/PCGN Romanization System -- Tajik (1994)
7
+ name: Romanization of Tajik (1994)
8
8
  url: https://geonames.nga.mil/gns/html/Romanization/ROMANIZATION%20OF%20TAJIK.pdf
9
9
  creation_date: 1994
10
10
  confirmation_date: 2017-11
@@ -0,0 +1,511 @@
1
+ metadata {
2
+ authority_id: bgnpcgn
3
+ id: 2007
4
+ language: iso-639-2:tir
5
+ source_script: Ethi
6
+ destination_script: Latn
7
+ name: Romanization of Tigrinya (2007)
8
+ url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/693783/ROMANIZATION_OF_TIGRINYA.pdf
9
+ creation_date: 2007
10
+ description: |
11
+ The BGN/PCGN system for Tigrinya is designed for use in romanizing
12
+ geographical names written in Tigrinya (Ge’ez) characters. The Roman letters
13
+ and letter combinations shown as equivalents to the Tigrinya characters
14
+ reflect modern Tigrinya pronunciation, while taking into account some
15
+ conscious archaisms based on Ge’ez and liturgical practices.
16
+
17
+ notes:
18
+ - |
19
+ Where consonant character sequences give rise to the romanizations
20
+ k-h, n-y, z-h and s-h, a hyphen may be added between them to differentiate
21
+ those romanizations from the digraphs kh, ny, zh and sh.
22
+
23
+ - |
24
+ Where possible, consonant gemination should be reflected. Though not
25
+ evident from the Ge’ez script, this may be ascertained from a reference
26
+ source, such as the Tigrinya-English dictionary, Thomas Leiper Kane,
27
+ Dunwoody Press, Springfield, VA, 2000.
28
+
29
+ - |
30
+ An inventory of letter-diacritic combinations, with their Unicode
31
+ encoding, in addition to the unmodified letters of the basic Roman script
32
+ is:
33
+ All apostrophes appearing in romanization are U+2019, except as they
34
+ appear in row 21, which are U+2018.
35
+ Ĭ (U+012C) ĭ (U+012D)
36
+ Ḥ (U+0048+0323) ḥ (U+0068+0323)
37
+
38
+ - |
39
+ The Romanization column shows only lowercase forms but, when
40
+ romanizing, uppercase and lowercase Roman letters as appropriate should be
41
+ used.
42
+
43
+ - |
44
+ Table footnote 1. The 6th-order characters should be romanized either with
45
+ or without the letter ĭ, depending on pronunciation.
46
+
47
+ - |
48
+ Table footnote 2. Forms of the consonant character ሠ are understood to be
49
+ becoming obsolete in Tigrinya.
50
+
51
+ - |
52
+ Table footnote 3. The vowel characters in row 17 should be romanized with
53
+ the apostrophe unless appearing as a word-initial.
54
+
55
+ - |
56
+ Table footnote 4. Forms of the character አ are understood to be falling into
57
+ disuse in Tigrinya.
58
+ }
59
+
60
+ tests {
61
+ test "የዜግነት ክብር በ ኢትዮጵያችን ጸንቶ", "yeziegĭnetĭ kĭbĭrĭ be ’itĭyop’ĭyachĭnĭ ts’enĭto"
62
+ test "ታየ ሕዝባዊነት ዳር እስከዳር በርቶ", "taye ḥĭzĭbawinetĭ darĭ ’ĭsĭkedarĭ berĭto"
63
+ test "ለሰላም ለፍትህ ለሕዝቦች ነጻነት", "leselamĭ lefĭtĭhĭ leḥĭzĭbochĭ nets’anetĭ"
64
+ test "በእኩልነት በፍቅር ቆመናል ባንድነት", "be’ĭkulĭnetĭ befĭk’ĭrĭ k’omenalĭ banĭdĭnetĭ"
65
+ test "መሠረተ ፅኑ ሰብዕናን ያልሻርን", "meserete ts’ĭnu sebĭ‘ĭnanĭ yalĭsharĭnĭ"
66
+ test "ሕዝቦች ነን ለሥራ በሥራ የኖርን", "ḥĭzĭbochĭ nenĭ lesĭra besĭra yenorĭnĭ"
67
+ test "ድንቅ የባህል መድረክ ያኩሪ ቅርስ ባለቤት", "dĭnĭk’ĭ yebahĭlĭ medĭrekĭ yakuri k’ĭrĭsĭ balebietĭ"
68
+ test "የተፈጥሮ ጸጋ የጀግና ሕዝብ እናት", "yetefet’ĭro ts’ega yejegĭna ḥĭzĭbĭ ’ĭnatĭ"
69
+ test "እንጠብቅሻለን አለብን አደራ", "’ĭnĭt’ebĭk’ĭshalenĭ ’elebĭnĭ ’edera"
70
+ test "ኢትዮጵያችን ኑሪ እኛም ባንቺ እንኩራ", "’itĭyop’ĭyachĭnĭ nuri ’ĭnyamĭ banĭchi ’ĭnĭkura"
71
+ test "ቋንቋ የድምጽ, የምልክት ወይም የምስል ቅንብር ሆኖ", "k’wanĭk’wa yedĭmĭts’ĭ, yemĭlĭkĭtĭ weyĭmĭ yemĭsĭlĭ k’ĭnĭbĭrĭ hono"
72
+ test "ለማሰብ ወይም የታሰበን ሃሳብ ለሌላ ለማስተላለፍ የሚረዳ መሳሪያ ነው", "lemasebĭ weyĭmĭ yetasebenĭ hasabĭ leliela lemasĭtelalefĭ yemireda mesariya newĭ"
73
+ test "በአጭሩ ቋንቋ የምልክቶች ስርዓትና እኒህን ምልክቶች ለማቀናበር", "be’ech’ĭru k’wanĭk’wa yemĭlĭkĭtochĭ sĭrĭ‘atĭna ’ĭnihĭnĭ mĭlĭkĭtochĭ lemak’enaberĭ"
74
+ test "የሚያስፈልጉ ህጎች ጥንቅር ነው. ቋንቋወችን ለመፈረጅ እንዲሁም", "yemiyasĭfelĭgu hĭgochĭ t’ĭnĭk’ĭrĭ newĭ. k’wanĭk’wawechĭnĭ lemeferejĭ ’ĭnĭdihumĭ"
75
+ test "ለምክፈል የሚያስችሉ መስፈርቶችን ለማስቀመጥ ባለው ችግር", "lemĭkĭfelĭ yemiyasĭchĭlu mesĭferĭtochĭnĭ lemasĭk’emet’ĭ balewĭ chĭgĭrĭ"
76
+ test "ምክንያት በአሁኑ ሰዓት በርግጠኝነት ስንት ቋንቋ በዓለም ላይ", "mĭkĭnĭyatĭ be’ehunu se‘atĭ berĭgĭt’enyĭnetĭ sĭnĭtĭ k’wanĭk’wa be‘alemĭ layĭ"
77
+ test "እንዳለ ማወቅ አስቸጋሪ ነው", "’ĭnĭdale mawek’ĭ ’esĭchegari newĭ"
78
+ test "አሰላ", "’esela"
79
+ test "አሶሳ", "’esosa"
80
+ test "አንኮበር", "’enĭkoberĭ"
81
+ test "አክሱም", "’ekĭsumĭ"
82
+ test "አዋሳ", "’ewasa"
83
+ test "አዲስ ዘመን (ከተማ)", "’edisĭ zemenĭ (ketema)"
84
+ test "አዲግራት", "’edigĭratĭ"
85
+ test "አዳማ", "’edama"
86
+ test "ደምበጫ", "demĭbech’a"
87
+ test "ደርባ", "derĭba"
88
+ test "ደብረ ማርቆስ", "debĭre marĭk’osĭ"
89
+ test "ደብረ ብርሃን", "debĭre bĭrĭhanĭ"
90
+ test "ደብረ ታቦር (ከተማ)", "debĭre taborĭ (ketema)"
91
+ test "ደብረ ዘይት", "debĭre zeyĭtĭ"
92
+ test "ደገሃቡር", "degehaburĭ"
93
+ test "ወልቂጤ", "welĭk’it’ie"
94
+ test "ወልወል", "welĭwelĭ"
95
+ test "ወልደያ", "welĭdeya"
96
+ test "ናይሎ ሳህራን", "nayĭlo sahĭranĭ"
97
+ test "አኙዋክኛ", "’enyuwakĭnya"
98
+ test "ኡዱክኛ", "’udukĭnya"
99
+ test "ኦፓኛ", "’opanya"
100
+ test "ጉምዝኛ", "gumĭzĭnya"
101
+ test "አፋርኛ", "’efarĭnya"
102
+ test "አላባኛ", "’elabanya"
103
+ test "አርቦርኛ", "’erĭborĭnya"
104
+ test "ባይሶኛ", "bayĭsonya"
105
+ test "ቡሳኛ", "busanya"
106
+ test "ሁለተኛ ጥፋት ከገበያ ማንቀላፋት", "huletenya t’ĭfatĭ kegebeya manĭk’elafatĭ"
107
+ test "ሁሉም ከልኩ አያልፍም", "hulumĭ kelĭku ’eyalĭfĭmĭ"
108
+ test "አልሞት ባይ ተጋዳይ", "’elĭmotĭ bayĭ tegadayĭ"
109
+ test "ውርድ ከራሴ", "wĭrĭdĭ kerasie"
110
+ test "ፀጉር መሰንጠቅ", "ts’egurĭ mesenĭt’ek’ĭ"
111
+ test "ግንትር ፀሐይ", "gĭnĭtĭrĭ ts’eḥeyĭ"
112
+ test "በሬ ወለደ", "berie welede"
113
+ test "ራስ ሳይጠና ጉተና", "rasĭ sayĭt’ena gutena"
114
+ test "ለሆዴ ጠግቤ በልብሴ አንግቤ", "lehodie t’egĭbie belĭbĭsie ’enĭgĭbie"
115
+ test "ለልጅ ከሳቁለት ለውሻ ከሮጡለት", "lelĭjĭ kesak’uletĭ lewĭsha kerot’uletĭ"
116
+ test "መልካም ባል መጥፎ ሴት ይገራል", "melĭkamĭ balĭ met’ĭfo sietĭ yĭgeralĭ"
117
+ test "ሆድና ግንባር አይሸሸግም", "hodĭna gĭnĭbarĭ ’eyĭsheshegĭmĭ"
118
+ test "ቀሊል አማት ሲሶ በትር አላት", "k’elilĭ ’ematĭ siso betĭrĭ ’elatĭ"
119
+ test "ጨው ለራስህ ብለህ ጣፍጥ አለበለዚያ ድንጋይ ነው ብለው ይወረውሩሀል", "ch’ewĭ lerasĭhĭ bĭlehĭ t’afĭt’ĭ ’elebeleziya dĭnĭgayĭ newĭ bĭlewĭ yĭwerewĭruhelĭ"
120
+ test "ጀምሮ ይጨርሳል አልሞ ይተኩሳል", "jemĭro yĭch’erĭsalĭ ’elĭmo yĭtekusalĭ"
121
+ }
122
+
123
+ stage {
124
+
125
+ # CHARACTERS
126
+ parallel {
127
+ sub "\u1200", "he" # ሀ
128
+ sub "\u1201", "hu" # ሁ
129
+ sub "\u1202", "hi" # ሂ
130
+ sub "\u1203", "ha" # ሃ
131
+ sub "\u1204", "hie" # ሄ
132
+ sub "\u1205", any(["hĭ", "h"]) # ህ
133
+ sub "\u1206", "ho" # ሆ
134
+
135
+ sub "\u1208", "le" # ለ
136
+ sub "\u1209", "lu" # ሉ
137
+ sub "\u120A", "li" # ሊ
138
+ sub "\u120B", "la" # ላ
139
+ sub "\u120C", "lie" # ሌ
140
+ sub "\u120D", any(["lĭ", "l"]) # ል
141
+ sub "\u120E", "lo" # ሎ
142
+
143
+ sub "\u1210", "ḥe" # ሐ
144
+ sub "\u1211", "ḥu" # ሑ
145
+ sub "\u1212", "ḥi" # ሒ
146
+ sub "\u1213", "ḥa" # ሓ
147
+ sub "\u1214", "ḥie" # ሔ
148
+ sub "\u1215", any(["ḥĭ", "ḥ"]) # ሕ
149
+ sub "\u1216", "ḥo" # ሖ
150
+
151
+ sub "\u1218", "me" # መ
152
+ sub "\u1219", "mu" # ሙ
153
+ sub "\u121A", "mi" # ሚ
154
+ sub "\u121B", "ma" # ማ
155
+ sub "\u121C", "mie" # ሜ
156
+ sub "\u121D", any(["mĭ", "m"]) # ም
157
+ sub "\u121E", "mo" # ሞ
158
+
159
+ # TODO: NOTE 2:
160
+ # Where possible, consonant gemination should be reflected. Though not
161
+ # evident from the Ge’ez script, this may be ascertained from a reference
162
+ # source, such as the Tigrinya-English dictionary, Thomas Leiper Kane,
163
+ # Dunwoody Press, Springfield, VA, 2000.
164
+ sub "\u1220", "se" # ሠ
165
+ sub "\u1221", "su" # ሡ
166
+ sub "\u1222", "si" # ሢ
167
+ sub "\u1223", "sa" # ሣ
168
+ sub "\u1224", "sie" # ሤ
169
+ sub "\u1225", any(["sĭ", "s"]) # ሥ
170
+ sub "\u1226", "so" # ሦ
171
+
172
+ sub "\u1228", "re" # ረ
173
+ sub "\u1229", "ru" # ሩ
174
+ sub "\u122A", "ri" # ሪ
175
+ sub "\u122B", "ra" # ራ
176
+ sub "\u122C", "rie" # ሬ
177
+ sub "\u122D", any(["rĭ", "r"]) # ር
178
+ sub "\u122E", "ro" # ሮ
179
+
180
+ sub "\u1230", "se" # ሰ
181
+ sub "\u1231", "su" # ሱ
182
+ sub "\u1232", "si" # ሲ
183
+ sub "\u1233", "sa" # ሳ
184
+ sub "\u1234", "sie" # ሴ
185
+ sub "\u1235", any(["sĭ", "s"]) # ስ
186
+ sub "\u1236", "so" # ሶ
187
+
188
+ sub "\u1238", "she" # ሸ
189
+ sub "\u1239", "shu" # ሹ
190
+ sub "\u123A", "shi" # ሺ
191
+ sub "\u123B", "sha" # ሻ
192
+ sub "\u123C", "shie" # ሼ
193
+ sub "\u123D", any(["shĭ", "sh"]) # ሽ
194
+ sub "\u123E", "sho" # ሾ
195
+
196
+ sub "\u1240", "k’e" # ቀ
197
+ sub "\u1241", "k’u" # ቁ
198
+ sub "\u1242", "k’i" # ቂ
199
+ sub "\u1243", "k’a" # ቃ
200
+ sub "\u1244", "k’ie" # ቄ
201
+ sub "\u1245", any(["k’ĭ", "k’"]) # ቅ
202
+ sub "\u1246", "k’o" # ቆ
203
+
204
+ sub "\u1250", "kh’e" # ቐ
205
+ sub "\u1251", "kh’u" # ቑ
206
+ sub "\u1252", "kh’i" # ቒ
207
+ sub "\u1253", "kh’a" # ቓ
208
+ sub "\u1254", "kh’ie" # ቔ
209
+ sub "\u1255", any(["kh’ĭ", "kh’"]) # ቕ
210
+ sub "\u1256", "kh’o" # ቖ
211
+
212
+ sub "\u1260", "be" # በ
213
+ sub "\u1261", "bu" # ቡ
214
+ sub "\u1262", "bi" # ቢ
215
+ sub "\u1263", "ba" # ባ
216
+ sub "\u1264", "bie" # ቤ
217
+ sub "\u1265", any(["bĭ", "b"]) # ብ
218
+ sub "\u1266", "bo" # ቦ
219
+
220
+ sub "\u1270", "te" # ተ
221
+ sub "\u1271", "tu" # ቱ
222
+ sub "\u1272", "ti" # ቲ
223
+ sub "\u1273", "ta" # ታ
224
+ sub "\u1274", "tie" # ቴ
225
+ sub "\u1275", any(["tĭ", "t"]) # ት
226
+ sub "\u1276", "to" # ቶ
227
+
228
+ sub "\u1278", "che" # ቸ
229
+ sub "\u1279", "chu" # ቹ
230
+ sub "\u127A", "chi" # ቺ
231
+ sub "\u127B", "cha" # ቻ
232
+ sub "\u127C", "chie" # ቼ
233
+ sub "\u127D", any(["chĭ", "ch"]) # ች
234
+ sub "\u127E", "cho" # ቾ
235
+
236
+ sub "\u1280", "ḥe" # ኀ
237
+ sub "\u1281", "ḥu" # ኁ
238
+ sub "\u1282", "ḥi" # ኂ
239
+ sub "\u1283", "ḥa" # ኃ
240
+ sub "\u1284", "ḥie" # ኄ
241
+ sub "\u1285", any(["ḥĭ", "ḥ"]) # ኅ
242
+ sub "\u1286", "ḥo" # ኆ
243
+
244
+ sub "\u1290", "ne" # ነ
245
+ sub "\u1291", "nu" # ኑ
246
+ sub "\u1292", "ni" # ኒ
247
+ sub "\u1293", "na" # ና
248
+ sub "\u1294", "nie" # ኔ
249
+ sub "\u1295", any(["nĭ", "n"]) # ን
250
+ sub "\u1296", "no" # ኖ
251
+
252
+ sub "\u1298", "nye" # ኘ
253
+ sub "\u1299", "nyu" # ኙ
254
+ sub "\u129A", "nyi" # ኚ
255
+ sub "\u129B", "nya" # ኛ
256
+ sub "\u129C", "nyie" # ኜ
257
+ sub "\u129D", any(["nyĭ", "ny"]) # ኝ
258
+ sub "\u129E", "nyo" # ኞ
259
+
260
+ # NOTE 3 The vowel characters in row 17 should be romanized with the
261
+ # apostrophe unless appearing as a word-initial.
262
+ # NOTE 4 Forms of the character አ are understood to be falling into disuse
263
+ # in Tigrinya.
264
+ sub "\u12A0", "’e" # አ
265
+ sub "\u12A1", "’u" # ኡ
266
+ sub "\u12A2", "’i" # ኢ
267
+ sub "\u12A3", "’a" # ኣ
268
+ sub "\u12A4", "’ie" # ኤ
269
+ sub "\u12A5", any(["’ĭ", "ĭ"]) # እ
270
+ sub "\u12A6", "’o" # ኦ
271
+
272
+ sub "\u12A8", "ke" # ከ
273
+ sub "\u12A9", "ku" # ኩ
274
+ sub "\u12AA", "ki" # ኪ
275
+ sub "\u12AB", "ka" # ካ
276
+ sub "\u12AC", "kie" # ኬ
277
+ sub "\u12AD", any(["kĭ", "k"]) # ክ
278
+ sub "\u12AE", "ko" # ኮ
279
+
280
+ sub "\u12B8", "khe" # ኸ
281
+ sub "\u12B9", "khu" # ኹ
282
+ sub "\u12BA", "khi" # ኺ
283
+ sub "\u12BB", "kha" # ኻ
284
+ sub "\u12BC", "khie" # ኼ
285
+ sub "\u12BD", any(["khĭ", "kh"]) # ኽ
286
+ sub "\u12BE", "kho" # ኾ
287
+
288
+ sub "\u12C8", "we" # ወ
289
+ sub "\u12C9", "wu" # ዉ
290
+ sub "\u12CA", "wi" # ዊ
291
+ sub "\u12CB", "wa" # ዋ
292
+ sub "\u12CC", "wie" # ዌ
293
+ sub "\u12CD", any(["wĭ", "w"]) # ው
294
+ sub "\u12CE", "wo" # ዎ
295
+
296
+ sub "\u12D0", "‘e" # ዐ
297
+ sub "\u12D1", "‘u" # ዑ
298
+ sub "\u12D2", "‘i" # ዒ
299
+ sub "\u12D3", "‘a" # ዓ
300
+ sub "\u12D4", "‘ie" # ዔ
301
+ sub "\u12D5", any(["‘ĭ", "‘"]) # ዕ
302
+ sub "\u12D6", "‘o" # ዖ
303
+
304
+ sub "\u12D8", "ze" # ዘ
305
+ sub "\u12D9", "zu" # ዙ
306
+ sub "\u12DA", "zi" # ዚ
307
+ sub "\u12DB", "za" # ዛ
308
+ sub "\u12DC", "zie" # ዜ
309
+ sub "\u12DD", any(["zĭ", "z"]) # ዝ
310
+ sub "\u12DE", "zo" # ዞ
311
+
312
+ sub "\u12E0", "zhe" # ዠ
313
+ sub "\u12E1", "zhu" # ዡ
314
+ sub "\u12E2", "zhi" # ዢ
315
+ sub "\u12E3", "zha" # ዣ
316
+ sub "\u12E4", "zhie" # ዤ
317
+ sub "\u12E5", any(["zhĭ", "zh"]) # ዥ
318
+ sub "\u12E6", "zho" # ዦ
319
+
320
+ sub "\u12E8", "ye" # የ
321
+ sub "\u12E9", "yu" # ዩ
322
+ sub "\u12EA", "yi" # ዪ
323
+ sub "\u12EB", "ya" # ያ
324
+ sub "\u12EC", "yie" # ዬ
325
+ sub "\u12ED", any(["yĭ", "y"]) # ይ
326
+ sub "\u12EE", "yo" # ዮ
327
+
328
+ sub "\u12F0", "de" # ደ
329
+ sub "\u12F1", "du" # ዱ
330
+ sub "\u12F2", "di" # ዲ
331
+ sub "\u12F3", "da" # ዳ
332
+ sub "\u12F4", "die" # ዴ
333
+ sub "\u12F5", any(["dĭ", "d"]) # ድ
334
+ sub "\u12F6", "do" # ዶ
335
+
336
+ sub "\u1300", "je" # ጀ
337
+ sub "\u1301", "ju" # ጁ
338
+ sub "\u1302", "ji" # ጂ
339
+ sub "\u1303", "ja" # ጃ
340
+ sub "\u1304", "jie" # ጄ
341
+ sub "\u1305", any(["jĭ", "j"]) # ጅ
342
+ sub "\u1306", "jo" # ጆ
343
+
344
+ sub "\u1308", "ge" # ገ
345
+ sub "\u1309", "gu" # ጉ
346
+ sub "\u130A", "gi" # ጊ
347
+ sub "\u130B", "ga" # ጋ
348
+ sub "\u130C", "gie" # ጌ
349
+ sub "\u130D", any(["gĭ", "g"]) # ግ
350
+ sub "\u130E", "go" # ጎ
351
+
352
+ sub "\u1320", "t’e" # ጠ
353
+ sub "\u1321", "t’u" # ጡ
354
+ sub "\u1322", "t’i" # ጢ
355
+ sub "\u1323", "t’a" # ጣ
356
+ sub "\u1324", "t’ie" # ጤ
357
+ sub "\u1325", any(["t’ĭ", "t’"]) # ጥ
358
+ sub "\u1326", "t’o" # ጦ
359
+
360
+ sub "\u1328", "ch’e" # ጨ
361
+ sub "\u1329", "ch’u" # ጩ
362
+ sub "\u132A", "ch’i" # ጪ
363
+ sub "\u132B", "ch’a" # ጫ
364
+ sub "\u132C", "ch’ie" # ጬ
365
+ sub "\u132D", any(["ch’ĭ", "ch’"]) # ጭ
366
+ sub "\u132E", "ch’o" # ጮ
367
+
368
+ sub "\u1330", "p’e" # ጰ
369
+ sub "\u1331", "p’u" # ጱ
370
+ sub "\u1332", "p’i" # ጲ
371
+ sub "\u1333", "p’a" # ጳ
372
+ sub "\u1334", "p’ie" # ጴ
373
+ sub "\u1335", any(["p’ĭ", "p’"]) # ጵ
374
+ sub "\u1336", "p’o" # ጶ
375
+
376
+ sub "\u1338", "ts’e" # ጸ
377
+ sub "\u1339", "ts’u" # ጹ
378
+ sub "\u133A", "ts’i" # ጺ
379
+ sub "\u133B", "ts’a" # ጻ
380
+ sub "\u133C", "ts’ie" # ጼ
381
+ sub "\u133D", any(["ts’ĭ", "ts’"]) # ጽ
382
+ sub "\u133E", "ts’o" # ጾ
383
+
384
+ sub "\u1340", "ts’e" # ፀ
385
+ sub "\u1341", "ts’u" # ፁ
386
+ sub "\u1342", "ts’i" # ፂ
387
+ sub "\u1343", "ts’a" # ፃ
388
+ sub "\u1344", "ts’ie" # ፄ
389
+ sub "\u1345", any(["ts’ĭ", "ts’"]) # ፅ
390
+ sub "\u1346", "ts’o" # ፆ
391
+
392
+ sub "\u1348", "fe" # ፈ
393
+ sub "\u1349", "fu" # ፉ
394
+ sub "\u134A", "fi" # ፊ
395
+ sub "\u134B", "fa" # ፋ
396
+ sub "\u134C", "fie" # ፌ
397
+ sub "\u134D", any(["fĭ", "f"]) # ፍ
398
+ sub "\u134E", "fo" # ፎ
399
+
400
+ sub "\u1350", "pe" # ፐ
401
+ sub "\u1351", "pu" # ፑ
402
+ sub "\u1352", "pi" # ፒ
403
+ sub "\u1353", "pa" # ፓ
404
+ sub "\u1354", "pie" # ፔ
405
+ sub "\u1355", any(["pĭ", "p"]) # ፕ
406
+ sub "\u1356", "po" # ፖ
407
+
408
+ sub "\u1268", "ve" # ቨ
409
+ sub "\u1269", "vu" # ቩ
410
+ sub "\u126A", "vi" # ቪ
411
+ sub "\u126B", "va" # ቫ
412
+ sub "\u126C", "vie" # ቬ
413
+ sub "\u126D", any(["vĭ", "v"]) # ቭ
414
+ sub "\u126E", "vo" # ቮ
415
+
416
+ # Combinations with W (Labialized Consonants)
417
+
418
+ sub "\u1248", "k’we" # ቈ
419
+ sub "\u124a", "k’wi" # ቊ
420
+ sub "\u124b", "k’wa" # ቋ
421
+ sub "\u124c", "k’wie" # ቌ
422
+ sub "\u124d", any(["k’wĭ", "k’w"]) # ቍ
423
+
424
+ sub "\u1288", "ḥwe" # ኈ
425
+ sub "\u128a", "ḥwi" # ኊ
426
+ sub "\u128b", "ḥwa" # ኋ
427
+ sub "\u128c", "ḥwie" # ኌ
428
+ sub "\u128d", any(["ḥwĭ", "ḥw"]) # ኍ
429
+
430
+ sub "\u12b0", "kwe" # ኰ
431
+ sub "\u12b2", "kwi" # ኲ
432
+ sub "\u12b3", "kwa" # ኳ
433
+ sub "\u12b4", "kwie" # ኴ
434
+ sub "\u12b5", any(["kwĭ", "kw"]) # ኵ
435
+
436
+ sub "\u1310", "gwe" # ጐ
437
+ sub "\u1312", "gwi" # ጒ
438
+ sub "\u1313", "gwa" # ጓ
439
+ sub "\u1314", "gwie" # ጔ
440
+ sub "\u1315", any(["gwĭ", "gw"]) # ጕ
441
+
442
+ sub "\u12c0", "khwe" # ዀ
443
+ sub "\u12c2", "khwi" # ዂ
444
+ sub "\u12c3", "khwa" # ዃ
445
+ sub "\u12c4", "khwie" # ዄ
446
+ sub "\u12c5", any(["khwĭ", "khw"]) # ዅ
447
+
448
+ sub "\u1258", "kh’e" # ቘ
449
+ sub "\u125a", "kh’i" # ቚ
450
+ sub "\u125b", "kh’a" # ቛ
451
+ sub "\u125c", "kh’ie" # ቜ
452
+ sub "\u125d", any(["kh’ĭ", "kh’"]) # ቝ
453
+
454
+ sub "\u120f", "lwa" # ሏ
455
+ sub "\u121f", "mwa" # ሟ
456
+ sub "\u122f", "rwa" # ሯ
457
+ sub "\u1237", "swa" # ሷ
458
+ sub "\u123f", "shwa" # ሿ
459
+ sub "\u1267", "bwa" # ቧ
460
+ sub "\u1277", "twa" # ቷ
461
+ sub "\u127f", "chwa" # ቿ
462
+
463
+ sub "\u1297", "nwa" # ኗ
464
+ sub "\u129f", "nywa" # ኟ
465
+ sub "\u12df", "zwa" # ዟ
466
+ sub "\u12e7", "zhwa" # ዧ
467
+ sub "\u12f7", "dwa" # ዷ
468
+ sub "\u1307", "jwa" # ጇ
469
+ sub "\u1327", "t’wa" # ጧ
470
+ sub "\u132f", "ch’wa" # ጯ
471
+ sub "\u133f", "ts’wa" # ጿ
472
+ sub "\u134f", "fwa" # ፏ
473
+
474
+ # Numerals
475
+
476
+ sub "\u1369", "1" # ፩
477
+ sub "\u136A", "2" # ፪
478
+ sub "\u136B", "3" # ፫
479
+ sub "\u136C", "4" # ፬
480
+ sub "\u136D", "5" # ፭
481
+ sub "\u136E", "6" # ፮
482
+ sub "\u136F", "7" # ፯
483
+ sub "\u1370", "8" # ፰
484
+ sub "\u1371", "9" # ፱
485
+ sub "\u1372", "10" # ፲
486
+ sub "\u1372\u1369", "11" # ፲፩
487
+ sub "\u1373", "20" # ፳
488
+ sub "\u1373\u1369", "21" # ፳፩
489
+ sub "\u1374", "30" # ፴
490
+ sub "\u1375", "40" # ፵
491
+ sub "\u1376", "50" # ፶
492
+ sub "\u1377", "60" # ፷
493
+ sub "\u1379", "80" # ፹
494
+ sub "\u137A", "90" # ፺
495
+ sub "\u137B", "100" # ፻
496
+
497
+ # These two rules are not defined in the system.
498
+ # sub "\u1372\u137B", "1000" # ፲፻
499
+ # sub "\u137B\u137B", "10000" # ፻፻
500
+
501
+ # Punctuation
502
+
503
+ sub "፡", " " # Word Break (space)
504
+ sub "፣", "," # Comma
505
+ sub "፤", ";" # Semicolon
506
+ sub "።", "." # Period
507
+
508
+ }
509
+
510
+ }
511
+