interscript-maps 2.1.0 → 2.3.1a

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (258)
  1. checksums.yaml +4 -4
  2. data/interscript-maps.gemspec +1 -1
  3. data/interscript-maps.yaml +330 -111
  4. data/maps/acadsin-zho-Hani-Latn-2002.imp +2 -2
  5. data/maps/alalc-amh-Ethi-Latn-1997.imp +18 -14
  6. data/maps/alalc-amh-Ethi-Latn-2011.imp +1 -1
  7. data/maps/alalc-ara-Arab-Latn-1997.imp +1 -1
  8. data/maps/alalc-asm-Deva-Latn-1997.imp +1 -1
  9. data/maps/alalc-asm-Deva-Latn-2012.imp +1 -1
  10. data/maps/alalc-aze-Arab-Latn-1997.imp +1 -1
  11. data/maps/alalc-aze-Cyrl-Latn-1997.imp +1 -1
  12. data/maps/alalc-bel-Cyrl-Latn-1997.imp +4 -4
  13. data/maps/alalc-ben-Beng-Latn-1997.imp +1 -1
  14. data/maps/alalc-ben-Beng-Latn-2017.imp +1 -1
  15. data/maps/alalc-bul-Cyrl-Latn-1997.imp +1 -1
  16. data/maps/alalc-div-Thaa-Latn-1997.imp +1 -1
  17. data/maps/alalc-div-Thaa-Latn-2012.imp +74 -0
  18. data/maps/alalc-ell-Grek-Latn-1997.imp +1 -1
  19. data/maps/alalc-ell-Grek-Latn-2010.imp +1 -1
  20. data/maps/alalc-guj-Gujr-Latn-1997.imp +1 -1
  21. data/maps/alalc-guj-Gujr-Latn-2011.imp +1 -1
  22. data/maps/alalc-hin-Deva-Latn-1997.imp +1 -1
  23. data/maps/alalc-hin-Deva-Latn-2011.imp +1 -1
  24. data/maps/alalc-kan-Kana-Latn-1997.imp +1 -1
  25. data/maps/alalc-kan-Kana-Latn-2011.imp +1 -1
  26. data/maps/alalc-kat-Geok-Latn-1997.imp +3 -4
  27. data/maps/alalc-kat-Geok-Latn-2011.imp +31 -0
  28. data/maps/alalc-kat-Geor-Latn-1997.imp +12 -13
  29. data/maps/alalc-kat-Geor-Latn-2011.imp +52 -0
  30. data/maps/alalc-kor-Hang-Latn-1997.imp +1 -1
  31. data/maps/alalc-mal-Mlym-Latn-1997.imp +1 -1
  32. data/maps/alalc-mal-Mlym-Latn-2012.imp +1 -1
  33. data/maps/alalc-mar-Deva-Latn-1997.imp +1 -1
  34. data/maps/alalc-mar-Deva-Latn-2011.imp +1 -1
  35. data/maps/alalc-mkd-Cyrl-Latn-1997.imp +2 -2
  36. data/maps/alalc-mkd-Cyrl-Latn-2013.imp +2 -2
  37. data/maps/alalc-mon-Cyrl-Latn-1997.imp +3 -3
  38. data/maps/alalc-ori-Orya-Latn-1997.imp +1 -1
  39. data/maps/alalc-ori-Orya-Latn-2011.imp +1 -1
  40. data/maps/alalc-pan-Guru-Latn-1997.imp +1 -1
  41. data/maps/alalc-pan-Guru-Latn-2011.imp +1 -1
  42. data/maps/alalc-per-Arab-Latn-1997.imp +1 -1
  43. data/maps/alalc-pli-Deva-Latn-2012.imp +1 -1
  44. data/maps/alalc-pra-Deva-Latn-2012.imp +1 -1
  45. data/maps/alalc-rus-Cyrl-Latn-1997.imp +2 -2
  46. data/maps/alalc-rus-Cyrl-Latn-2012.imp +1 -1
  47. data/maps/alalc-san-Deva-Latn-2012.imp +1 -1
  48. data/maps/alalc-sin-Sinh-Latn-1997.imp +1 -1
  49. data/maps/alalc-sin-Sinh-Latn-2011.imp +1 -1
  50. data/maps/alalc-srp-Cyrl-Latn-1997.imp +2 -2
  51. data/maps/alalc-srp-Cyrl-Latn-2013.imp +1 -1
  52. data/maps/alalc-tam-Taml-Latn-1997.imp +1 -1
  53. data/maps/alalc-tam-Taml-Latn-2011.imp +1 -1
  54. data/maps/alalc-tel-Telu-Latn-1997.imp +2 -2
  55. data/maps/alalc-tel-Telu-Latn-2011.imp +1 -1
  56. data/maps/alalc-tir-Ethi-Latn-1997.imp +429 -0
  57. data/maps/alalc-tir-Ethi-Latn-2011.imp +85 -0
  58. data/maps/alalc-ukr-Cyrl-Latn-1997.imp +1 -1
  59. data/maps/alalc-ukr-Cyrl-Latn-2011.imp +1 -1
  60. data/maps/apcbg-bul-Cyrl-Latn-1995.imp +7 -4
  61. data/maps/az-aze-Cyrl-Latn-1939.imp +1 -0
  62. data/maps/az-aze-Cyrl-Latn-1958.imp +1 -0
  63. data/maps/bas-rus-Cyrl-Latn-2017-bss.imp +1 -1
  64. data/maps/bas-rus-Cyrl-Latn-2017-oss.imp +1 -1
  65. data/maps/bgn-jpn-Hrkt-Latn-1962.imp +5 -5
  66. data/maps/bgn-kor-Hang-Latn-1943.imp +1 -1
  67. data/maps/bgn-kor-Kore-Latn-1943.imp +1 -1
  68. data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +11 -11
  69. data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +1 -1
  70. data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +2 -2
  71. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +2 -2
  72. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.imp +1 -1
  73. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.imp +4 -1
  74. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +10 -4
  75. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +1 -1
  76. data/maps/bgnpcgn-che-Cyrl-Latn-2008.imp +2 -1
  77. data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +1 -1
  78. data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +4 -4
  79. data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +1 -1
  80. data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +1 -1
  81. data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +1 -1
  82. data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +4 -3
  83. data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +1 -1
  84. data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +1 -1
  85. data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +2 -2
  86. data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +1 -1
  87. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +1 -1
  88. data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +8 -8
  89. data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +2 -2
  90. data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +4 -4
  91. data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +3 -3
  92. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +1 -1
  93. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +5 -5
  94. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +5 -5
  95. data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +1 -1
  96. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +2 -2
  97. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +1 -1
  98. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +3 -3
  99. data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +4 -4
  100. data/maps/bgnpcgn-per-Arab-Latn-1958.imp +19 -19
  101. data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +15 -15
  102. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +15 -15
  103. data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +16 -16
  104. data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +2 -2
  105. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +5 -5
  106. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +1 -1
  107. data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +1 -1
  108. data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +5 -3
  109. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +1 -1
  110. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +1 -1
  111. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +1 -1
  112. data/maps/bgnpcgn-tir-Ethi-Latn-2007.imp +511 -0
  113. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +1 -1
  114. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +1 -1
  115. data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +15 -15
  116. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +3 -3
  117. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +1 -1
  118. data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +1 -1
  119. data/maps/bis-asm-Beng-Latn-13194-1991.imp +1 -1
  120. data/maps/bis-ben-Beng-Latn-13194-1991.imp +1 -1
  121. data/maps/bis-dev-Deva-Latn-13194-1991.imp +1 -1
  122. data/maps/bis-guj-Gujr-Latn-13194-1991.imp +1 -1
  123. data/maps/bis-kan-Kana-Latn-13194-1991.imp +1 -1
  124. data/maps/bis-mlm-Mlym-Latn-13194-1991.imp +1 -1
  125. data/maps/bis-ori-Orya-Latn-13194-1991.imp +1 -1
  126. data/maps/bis-pnj-Guru-Latn-13194-1991.imp +1 -1
  127. data/maps/bis-tel-Telu-Latn-13194-1991.imp +1 -1
  128. data/maps/bis-tml-Taml-Latn-13194-1991.imp +1 -1
  129. data/maps/by-bel-Cyrl-Latn-2007.imp +7 -5
  130. data/maps/din-hin-Deva-Latn-33904-2018.imp +1 -1
  131. data/maps/din-kat-Geor-Latn-32707-2010.imp +12 -12
  132. data/maps/din-mar-Deva-Latn-33904-2018.imp +1 -1
  133. data/maps/din-nep-Deva-Latn-33904-2018.imp +1 -1
  134. data/maps/din-pli-Deva-Latn-33904-2018.imp +1 -1
  135. data/maps/din-pra-Deva-Latn-33904-2018.imp +1 -1
  136. data/maps/din-san-Deva-Latn-33904-2018.imp +1 -1
  137. data/maps/dos-nep-Deva-Latn-1997.imp +2 -2
  138. data/maps/elot-ell-Grek-Latn-743-1982-tl.imp +1 -2
  139. data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +1 -1
  140. data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +1 -1
  141. data/maps/elot-ell-Grek-Latn-743-2001-ts.imp +1 -1
  142. data/maps/ggg-kat-Geor-Latn-2002.imp +3 -3
  143. data/maps/gki-bel-Cyrl-Latn-2000.imp +1 -1
  144. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +1 -1
  145. data/maps/iso-ara-Arab-Latn-233-1984.imp +15 -15
  146. data/maps/iso-ara-Arab-Latn-233-2-1993.imp +1 -1
  147. data/maps/iso-asm-Beng-Latn-15919-2001.imp +1 -1
  148. data/maps/iso-ben-Beng-Latn-15919-2001.imp +1 -1
  149. data/maps/iso-ell-Grek-Latn-843-1997-t1.imp +1 -1
  150. data/maps/iso-ell-Grek-Latn-843-1997-t2.imp +1 -1
  151. data/maps/iso-guj-Gujr-Latn-15919-2001.imp +1 -1
  152. data/maps/iso-hin-Deva-Latn-15919-2001.imp +1 -1
  153. data/maps/iso-inc-Deva-Latn-15919-2001.imp +1 -1
  154. data/maps/iso-jpn-Hrkt-Latn-3602-1989.imp +1 -1
  155. data/maps/iso-kan-Kana-Latn-15919-2001.imp +1 -1
  156. data/maps/iso-kat-Geor-Latn-9984-1996.imp +12 -12
  157. data/maps/iso-kor-Hang-Latn-1996-method1.imp +1 -1
  158. data/maps/iso-kor-Hang-Latn-1996-method2.imp +1 -1
  159. data/maps/iso-mal-Mlym-Latn-15919-2001.imp +2 -2
  160. data/maps/iso-mar-Deva-Latn-15919-2001.imp +1 -1
  161. data/maps/iso-nep-Deva-Latn-15919-2001.imp +1 -1
  162. data/maps/iso-ori-Orya-Latn-15919-2001.imp +1 -1
  163. data/maps/iso-pan-Guru-Latn-15919-2001.imp +1 -1
  164. data/maps/iso-pli-Beng-Latn-15919-2001.imp +1 -1
  165. data/maps/iso-pli-Deva-Latn-15919-2001.imp +1 -1
  166. data/maps/iso-pli-Sinh-Latn-15919-2001.imp +1 -1
  167. data/maps/iso-pli-Thai-Latn-15919-2001.imp +1 -1
  168. data/maps/iso-pra-Deva-Latn-15919-2001.imp +1 -1
  169. data/maps/iso-prs-Arab-Latn-233-3-1999.imp +16 -16
  170. data/maps/iso-rus-Cyrl-Latn-9-1995.imp +1 -1
  171. data/maps/iso-san-Deva-Latn-15919-2001.imp +1 -1
  172. data/maps/iso-tam-Taml-Latn-15919-2001.imp +1 -1
  173. data/maps/iso-tel-Telu-Latn-15919-2001.imp +1 -1
  174. data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +5 -5
  175. data/maps/mext-jpn-Hrkt-Latn-1954.imp +2 -1
  176. data/maps/moct-kor-Hang-Latn-2000.imp +1 -1
  177. data/maps/mofa-jpn-Hrkt-Latn-1989.imp +1 -1
  178. data/maps/mv-div-Thaa-Latn-1987.imp +1 -1
  179. data/maps/mvd-bel-Cyrl-Latn-2008.imp +5 -5
  180. data/maps/mvd-bel-Cyrl-Latn-2010.imp +2 -5
  181. data/maps/mvd-rus-Cyrl-Latn-2008.imp +4 -3
  182. data/maps/mvd-rus-Cyrl-Latn-2010.imp +2 -5
  183. data/maps/odni-ara-Arab-Latn-2004.imp +1 -2
  184. data/maps/odni-ara-Arab-Latn-2015.imp +2 -2
  185. data/maps/odni-aze-Cyrl-Latn-2015.imp +1 -1
  186. data/maps/odni-bel-Cyrl-Latn-2015.imp +2 -4
  187. data/maps/odni-bul-Cyrl-Latn-2005.imp +2 -2
  188. data/maps/odni-bul-Cyrl-Latn-2015.imp +1 -3
  189. data/maps/odni-che-Cyrl-Latn-2015.imp +1 -2
  190. data/maps/odni-fas-Arab-Latn-2004.imp +14 -15
  191. data/maps/odni-fas-Arab-Latn-2015.imp +17 -17
  192. data/maps/odni-hin-Deva-Latn-2004.imp +20 -21
  193. data/maps/odni-hin-Deva-Latn-2015.imp +26 -27
  194. data/maps/odni-kat-Geor-Latn-2015.imp +3 -5
  195. data/maps/odni-kaz-Cyrl-Latn-2015.imp +1 -1
  196. data/maps/odni-kir-Cyrl-Latn-2015.imp +1 -1
  197. data/maps/odni-kor-Hang-Latn-2015.imp +2 -2
  198. data/maps/odni-mkd-Cyrl-Latn-2005.imp +1 -1
  199. data/maps/odni-mkd-Cyrl-Latn-2015.imp +1 -1
  200. data/maps/odni-prs-Arab-Latn-2004.imp +0 -1
  201. data/maps/odni-prs-Arab-Latn-2015.imp +2 -2
  202. data/maps/odni-pus-Arab-Latn-2011.imp +1 -2
  203. data/maps/odni-rus-Cyrl-Latn-2015.imp +1 -3
  204. data/maps/odni-srp-Cyrl-Latn-2005.imp +1 -2
  205. data/maps/odni-srp-Cyrl-Latn-2015.imp +7 -9
  206. data/maps/odni-tat-Cyrl-Latn-2015.imp +1 -1
  207. data/maps/odni-tgk-Cyrl-Latn-2015.imp +1 -1
  208. data/maps/odni-tuk-Cyrl-Latn-2015.imp +1 -2
  209. data/maps/odni-uig-Cyrl-Latn-2015.imp +1 -1
  210. data/maps/odni-ukr-Cyrl-Latn-2015.imp +2 -4
  211. data/maps/odni-urd-Arab-Latn-2015.imp +21 -22
  212. data/maps/odni-uzb-Cyrl-Latn-2015.imp +1 -3
  213. data/maps/ses-ara-Arab-Latn-1930.imp +17 -60
  214. data/maps/un-amh-Ethi-Latn-2016.imp +1 -1
  215. data/maps/un-ara-Arab-Latn-1971.imp +6 -6
  216. data/maps/un-ara-Arab-Latn-1972.imp +5 -5
  217. data/maps/un-ara-Arab-Latn-2017.imp +16 -16
  218. data/maps/un-asm-Beng-Latn-1972.imp +1 -1
  219. data/maps/un-bel-Cyrl-Latn-2007.imp +2 -2
  220. data/maps/un-ben-Beng-Latn-2016.imp +1 -1
  221. data/maps/un-bul-Cyrl-Latn-1977.imp +197 -0
  222. data/maps/un-ell-Grek-Latn-1987-phonetic.imp +5 -1
  223. data/maps/un-ell-Grek-Latn-1987-tl.imp +1 -1
  224. data/maps/un-ell-Grek-Latn-1987-ts.imp +2 -2
  225. data/maps/un-guj-Gujr-Latn-1972.imp +1 -1
  226. data/maps/un-hin-Deva-Latn-2016.imp +2 -2
  227. data/maps/un-kan-Kana-Latn-2016.imp +2 -2
  228. data/maps/un-mal-Mlym-Latn-1972.imp +1 -1
  229. data/maps/un-mar-Deva-Latn-2016.imp +2 -2
  230. data/maps/un-mkd-Cyrl-Latn-1977.imp +119 -0
  231. data/maps/un-mon-Mong-Latn-general-2013.imp +1 -1
  232. data/maps/un-mon-Mong-Latn-phonetic-2013.imp +1 -1
  233. data/maps/un-nep-Deva-Latn-1972.imp +2 -2
  234. data/maps/un-nep-Deva-Latn-2013.imp +2 -2
  235. data/maps/un-ori-Orya-Latn-1972.imp +2 -2
  236. data/maps/un-pan-Guru-Latn-1972.imp +1 -1
  237. data/maps/un-prs-Arab-Latn-1967.imp +15 -15
  238. data/maps/un-rus-Cyrl-Latn-1987.imp +2 -2
  239. data/maps/un-sin-Sinh-Latn-1972.imp +16 -4
  240. data/maps/un-srp-Cyrl-Latn-1997.imp +47 -0
  241. data/maps/un-tam-Taml-Latn-1972.imp +1 -1
  242. data/maps/un-tel-Telu-Latn-1972.imp +1 -1
  243. data/maps/un-ukr-Cyrl-Latn-1998.imp +1 -1
  244. data/maps/un-ukr-Cyrl-Latn-2012.imp +1 -1
  245. data/maps/un-urd-Arab-Latn-1972.imp +16 -16
  246. data/maps/var-amh-Ethi-Latn-eae-2003.imp +48 -43
  247. data/maps/var-ara-Arab-Arab-rababa.imp +25 -0
  248. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.imp +1 -1
  249. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.imp +1 -1
  250. data/maps/var-kor-Hang-Latn-mr-1939.imp +1 -1
  251. data/maps/var-kor-Kore-Latn-mr-1939.imp +1 -1
  252. data/maps/var-mar-Deva-Latn-hunterian-1872.imp +0 -1
  253. data/maps/var-mon-Mong-Latn-1930.imp +1 -1
  254. data/maps/var-mon-Mong-Latn-lessing.imp +2 -2
  255. data/maps/var-mon-Mong-Latn-vpmc.imp +2 -2
  256. data/maps/var-pra-Deva-Latn-iast-1912.imp +1 -1
  257. data/maps/var-san-Deva-Latn-iast-1912.imp +1 -1
  258. metadata +13 -3
@@ -4,9 +4,9 @@ metadata {
4
4
  language: iso-639-2:zho
5
5
  source_script: Hani
6
6
  destination_script: Latn
7
- name: Chinese Tongyong Pinyin Academica Sinica 2002 System
7
+ name: Tongyong Pinyin System (2002)
8
8
  url:
9
- description: Chinese Tongyong Pinyin Academica Sinica 2002 System
9
+ description: Academia Sinica Tongyong Pinyin System (2002)
10
10
  }
11
11
 
12
12
  tests {
@@ -4,14 +4,18 @@ metadata {
4
4
  language: iso-639-2:amh
5
5
  source_script: Ethi
6
6
  destination_script: Latn
7
- name: ALA-LC Romanization Table -- Amharic (1997)
7
+ name: Romanization Table -- Amharic (1997)
8
8
  url: http://catdir.loc.gov/catdir/cpso/romanization/amharic.pdf
9
9
  creation_date: 1997
10
10
  description: |
11
- ALA-LC Romanization Tables: Transliteration Schemes for Non-Roman Scripts. Randal K. Berry (ed.). Library of Congress, 1997.
12
-
11
+ ALA-LC Romanization Tables: Transliteration Schemes for Non-Roman Scripts.
12
+ Randal K. Berry (ed.). Library of Congress, 1997.
13
+
13
14
  notes:
14
- - The Ethiopic script used for Amharic is also used for other languages, including Ge’ez, Argobba, Gurage, and Tigre. Ge’ez, which is chiefly a liturgical language, uses only 26 basic letter forms from this table.
15
+ - |
16
+ The Ethiopic script used for Amharic is also used for other languages,
17
+ including Ge’ez, Argobba, Gurage, and Tigre. Ge’ez, which is chiefly a
18
+ liturgical language, uses only 26 basic letter forms from this table.
15
19
  }
16
20
 
17
21
  tests {
@@ -319,17 +323,17 @@ stage {
319
323
  sub "ቬ", "vé"
320
324
  sub "ቭ", any(["ve", "v"])
321
325
  sub "ቮ", "vo"
322
-
326
+
323
327
  sub "ቈ", "qwa"
324
328
  sub "ቊ", "qwi"
325
329
  sub "ቋ", "qwā"
326
330
  sub "ቌ", "qwé"
327
331
  sub "ቍ", "qwe"
328
- sub "ኈ", "hwa"
329
- sub "ኊ", "hwi"
330
- sub "ኋ", "hwā"
331
- sub "ኌ", "hwé"
332
- sub "ኍ", "hwe"
332
+ sub "ኈ", "ẖwa"
333
+ sub "ኊ", "ẖwi"
334
+ sub "ኋ", "ẖwā"
335
+ sub "ኌ", "ẖwé"
336
+ sub "ኍ", "ẖwe"
333
337
  sub "ኰ", "kwa"
334
338
  sub "ኲ", "kwi"
335
339
  sub "ኳ", "kwā"
@@ -340,7 +344,7 @@ stage {
340
344
  sub "ጓ", "gwā"
341
345
  sub "ጔ", "gwé"
342
346
  sub "ጕ", "gwe"
343
-
347
+
344
348
  sub "ሏ", "lwa"
345
349
  sub "ቧ", "bwa"
346
350
  sub "ዟ", "zwa"
@@ -361,12 +365,12 @@ stage {
361
365
  sub "ሿ", "šwa"
362
366
  sub "ኟ", "ñwa"
363
367
  sub "ጇ", "ǧwa"
364
-
368
+
365
369
  sub "ፙ", "mya"
366
370
  sub "ፚ", "fya"
367
-
371
+
368
372
  sub "ኧ", "ă"
369
-
373
+
370
374
  sub "፩", "1"
371
375
  sub "፪", "2"
372
376
  sub "፫", "3"
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:amh
5
5
  source_script: Ethi
6
6
  destination_script: Latn
7
- name: ALA-LC Romanization Table -- Amharic (2011)
7
+ name: Romanization Table -- Amharic (2011)
8
8
  url: https://www.loc.gov/catdir/cpso/romanization/amharic.pdf
9
9
  creation_date: 2011
10
10
  description: ''
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:ara
5
5
  source_script: Arab
6
6
  destination_script: Latn
7
- name: ALA-LC Romanization Table -- Arabic (1997)
7
+ name: Romanization Table -- Arabic (1997)
8
8
  url: http://catdir.loc.gov/catdir/cpso/romanization/arabic.pdf
9
9
  creation_date: 1997
10
10
  description: |
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:asm
5
5
  source_script: Deva
6
6
  destination_script: Latn
7
- name: Assamese Romanization, 1997
7
+ name: Romanization Table -- Assamese (1997)
8
8
  url: http://catdir.loc.gov/catdir/cpso/romanization/assamese.pdf
9
9
  creation_date: 1997
10
10
  description: |
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:asm
5
5
  source_script: Deva
6
6
  destination_script: Latn
7
- name: Assamese Romanization, 2012
7
+ name: Romanization Table -- Assamese (2012)
8
8
  url: https://www.loc.gov/catdir/cpso/romanization/assamese.pdf
9
9
  creation_date: 1997
10
10
  description: |
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:aze
5
5
  source_script: Arab
6
6
  destination_script: Latn
7
- name: ALA-LC Romanization Table -- azerbaij (1997)
7
+ name: Romanization Table -- azerbaij (1997)
8
8
  url: http://catdir.loc.gov/catdir/cpso/romanization/azerbaij.pdf
9
9
  creation_date: 1997
10
10
  description: |
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:aze
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: ALA-LC Romanization Table -- Azerbaijani (1997)
7
+ name: Romanization Table -- Azerbaijani (1997)
8
8
  url: https://transliteration.eki.ee/pdf/Azerbaijani.pdf
9
9
  creation_date: 1997
10
10
  description: |
@@ -4,10 +4,10 @@ metadata {
4
4
  language: iso-639-2:bel
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: ALA-LC Romanization Table -- Byelorussian (1997)
7
+ name: Romanization Table -- Byelorussian (1997)
8
8
  url: http://catdir.loc.gov/catdir/cpso/romanization/beloruss.pdf
9
9
  creation_date: 1997
10
-
10
+
11
11
  notes:
12
12
  - Ґ letter found in Old Belarusian and in modern publications in Tarashkevitsa orthography.
13
13
  - Do not confuse with the digraph кг (also romanized as “kh”). Manual review may be needed when transcribing data in vernacular characters in order to distinguish х from кг.
@@ -43,7 +43,7 @@ stage {
43
43
  sub "\u00B4", "" # official english Apostrophe
44
44
  sub "\u02BC", ""
45
45
  sub "\u0027", "" # from belarussian keyboard
46
-
46
+
47
47
  # Characters
48
48
  sub "\u0410", "A" # A
49
49
  sub "\u0411", "B" # Б
@@ -78,7 +78,7 @@ stage {
78
78
  sub "\u042D", "Ė" # Э : Ė
79
79
  sub "\u042E", "I͡U" # Ю : I͡U
80
80
  sub "\u042F", "I͡A" # Я : I͡A
81
-
81
+
82
82
  sub "\u0430", "a" # а
83
83
  sub "\u0431", "b" # б
84
84
  sub "\u0432", "v" # в
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:ben
5
5
  source_script: Beng
6
6
  destination_script: Latn
7
- name: Bengali Romanization, 1997
7
+ name: Romanization Table -- Bengali (1997)
8
8
  url: http://catdir.loc.gov/catdir/cpso/romanization/bengali.pdf
9
9
  creation_date: 1997
10
10
  description: |
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:ben
5
5
  source_script: Beng
6
6
  destination_script: Latn
7
- name: Bengali Romanization, 2017
7
+ name: Romanization Table -- Bengali (2017)
8
8
  url: https://www.loc.gov/catdir/cpso/romanization/bengali.pdf
9
9
  creation_date: 2017
10
10
  description: |
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:bul
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: ALA-LC Romanization Table -- Bulgarian (1997)
7
+ name: Romanization Table -- Bulgarian (1997)
8
8
  url: http://www.rechtertie.nl/databases/judd/downloads/Bulgarian.pdf
9
9
  creation_date: 1997
10
10
 
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:div
5
5
  source_script: Thaa
6
6
  destination_script: Latn
7
- name: ALA-Library of Congress Divehi Romanization 1997 System
7
+ name: Romanization Table -- Divehi (1997)
8
8
  url: http://catdir.loc.gov/catdir/cpso/romanization/divehi.pdf
9
9
  creation_date: 1997
10
10
  description: |
@@ -0,0 +1,74 @@
1
+ metadata {
2
+ authority_id: alalc
3
+ id: 2012
4
+ language: iso-639-2:div
5
+ source_script: Thaa
6
+ destination_script: Latn
7
+ name: Romanization Table -- Divehi (2012)
8
+ url: https://www.loc.gov/catdir/cpso/romanization/divehi.pdf
9
+ creation_date: 2012
10
+ description: |
11
+ ALA-Library of Congress Divehi Romanization 2012 System
12
+
13
+ notes:
14
+
15
+ - |
16
+ Romanize ށް as ḫ when it doubles the following consonant or is used as a glottal stop.
17
+ aḫvana އަށްވަނަ
18
+ maśaḫ މަށަށް
19
+ - |
20
+ When used in medial position without ް (sukūn), romanize ނ as ṁ.
21
+ aṁga އަނގަ
22
+ haṁdu ހަނދު
23
+ - |
24
+ Romanization of އ.
25
+ (a) When used in the initial position with any vowel sign, do not romanize.
26
+ ata އަތަ
27
+ idu އިދު
28
+ umuru އުމުރު
29
+ egahugi އެގަހުގި
30
+ (b) When used in the medial position with any vowel sign, romanize as ’.
31
+ ha’hūnu ހައިހޫނު
32
+ fa’isa ފައިސަ
33
+ k’īn ކްއީން
34
+ (c) When a consonant follows އް in medial position, double it in romanization.
35
+ cappalu ޗައްޕަލު
36
+ appacci އައްޕައްޗި
37
+ (d) When used in final position with ް (sukūn), romanize as h.
38
+ boh ބޮއް
39
+ biheh ބިހެއް
40
+ - |
41
+ Romanize ތް followed by another ތ as t̤ .
42
+ at̤teri އަތްތެރި
43
+ - |
44
+ Only the vowel forms that appear at the beginning of a syllable are listed.
45
+ When the vowels follow a consonant, އ is not used and the vowel signs are added to the consonant forms.
46
+ Do not distinguish between the two in romanization.
47
+ - |
48
+ ް (called sukūn) generally indicates omission of an inherent vowel associated with a consonant.
49
+ For its other uses, see Notes 1, 3, and 4.
50
+ }
51
+
52
+ tests {
53
+ test "މަށަށް", "maśaḫ"
54
+ test "އަނގަ", "aṁga"
55
+ test "ހަނދު", "haṁdu"
56
+ test "އަތަ", "ata"
57
+ test "އިދު", "idu"
58
+ test "އުމުރު", "umuru"
59
+ test "އެގަހުގި", "egahugi"
60
+ test "ފައިސަ", "faʼisa"
61
+ test "ބޮއް", "boh"
62
+ test "ބިހެއް", "biheh"
63
+ test "އަތްތެރި", "at̤teri"
64
+ test "ޗައްޕަލު", "cappalu"
65
+ test "އައްޕައްޗި", "appacci"
66
+ }
67
+
68
+ dependency "alalc-div-Thaa-Latn-1997", as: thaalatn
69
+
70
+ stage {
71
+
72
+ run map.thaalatn.stage.main
73
+
74
+ }
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:ell
5
5
  source_script: Grek
6
6
  destination_script: Latn
7
- name: Greek Romanization, 1997
7
+ name: Romanization Table -- Greek (1997)
8
8
  url: http://catdir.loc.gov/catdir/cpso/romanization/greek.pdf
9
9
  creation_date: 1997
10
10
  description: |
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:ell
5
5
  source_script: Grek
6
6
  destination_script: Latn
7
- name: Greek Romanization, 2010
7
+ name: Romanization Table -- Greek (2010)
8
8
  url: http://catdir.loc.gov/catdir/cpso/romanization/greek.pdf
9
9
  creation_date: 2010
10
10
  description: |
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:guj
5
5
  source_script: Gujr
6
6
  destination_script: Latn
7
- name: Gujarati Romanization, 1997
7
+ name: Romanization Table -- Gujarati (1997)
8
8
  url: http://catdir.loc.gov/catdir/cpso/romanization/gujarati.pdf
9
9
  creation_date: 1997
10
10
  description: |
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:guj
5
5
  source_script: Gujr
6
6
  destination_script: Latn
7
- name: Gujarati Romanization, 2011
7
+ name: Romanization Table -- Gujarati (2011)
8
8
  url: https://www.loc.gov/catdir/cpso/romanization/gujarati.pdf
9
9
  creation_date: 2011
10
10
  description: |
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:hin
5
5
  source_script: Deva
6
6
  destination_script: Latn
7
- name: Hindi Romanization, 1997
7
+ name: Romanization Table -- Hindi (1997)
8
8
  url: http://catdir.loc.gov/catdir/cpso/romanization/hindi.pdf
9
9
  creation_date: 1997
10
10
  description: |
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:hin
5
5
  source_script: Deva
6
6
  destination_script: Latn
7
- name: Hindi Romanization, 2011
7
+ name: Romanization Table -- Hindi (2011)
8
8
  url: https://www.loc.gov/catdir/cpso/romanization/hindi.pdf
9
9
  creation_date: 1997
10
10
  description: |
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:kan
5
5
  source_script: Kana
6
6
  destination_script: Latn
7
- name: Kannada Romanization, 1997
7
+ name: Romanization Table -- Kannada (1997)
8
8
  url: http://catdir.loc.gov/catdir/cpso/romanization/kannada.pdf
9
9
  creation_date: 1997
10
10
  description: |
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:kan
5
5
  source_script: Kana
6
6
  destination_script: Latn
7
- name: Kannada Romanization, 2011
7
+ name: Romanization Table -- Kannada (2011)
8
8
  url: http://catdir.loc.gov/catdir/cpso/romanization/kannada.pdf
9
9
  creation_date: 2011
10
10
  description: |
@@ -4,13 +4,12 @@ metadata {
4
4
  language: iso-639-2:kat
5
5
  source_script: Geok
6
6
  destination_script: Latn
7
- name: ALA-LC Georgian System (1997)
8
- url: https://www.loc.gov/catdir/cpso/romanization/georgian.pdf
7
+ name: Romanization Table -- Georgian Khutsuri (1997)
8
+ url: http://catdir.loc.gov/catdir/cpso/romanization/georgian.pdf
9
9
  creation_date: 1997
10
10
  confirmation_date: 1997
11
11
  description: |
12
12
  Values are shown for the Khutsuri alphabet.
13
-
14
13
  notes:
15
14
  }
16
15
 
@@ -64,7 +63,7 @@ stage {
64
63
  sub "\u10c3", "W" # Ⴣ
65
64
  sub "\u10c4", "X̣" # Ⴤ
66
65
  sub "\u10c5", "Ō" # Ⴥ
67
-
66
+
68
67
  sub "\u2d00", "a" # ⴀ
69
68
  sub "\u2d01", "b" # ⴁ
70
69
  sub "\u2d02", "g" # ⴂ
@@ -0,0 +1,31 @@
1
+ metadata {
2
+ authority_id: alalc
3
+ id: 2011
4
+ language: iso-639-2:kat
5
+ source_script: Geok
6
+ destination_script: Latn
7
+ name: Romanization Table -- Georgian Khutsuri (2011)
8
+ url: https://www.loc.gov/catdir/cpso/romanization/georgian.pdf
9
+ creation_date: 2011
10
+ confirmation_date: 2011
11
+ description: |
12
+ Values are shown for the Khutsuri alphabet.
13
+ notes:
14
+ }
15
+
16
+ tests {
17
+ test "ႼႨႢႬႨ", "CIGNI"
18
+ test "ⴜⴈⴂⴌⴈ", "cigni"
19
+ test "ႱႭႪႭႫႭႬ", "SOLOMON"
20
+ test "ⴑⴍⴊⴍⴋⴍⴌ", "solomon"
21
+ test "ႠႡႰႠჀႠႫ", "ABRAHAM"
22
+ }
23
+
24
+
25
+ dependency "alalc-kat-Geok-Latn-1997", as: geoklatn
26
+
27
+ stage {
28
+
29
+ run map.geoklatn.stage.main
30
+
31
+ }
@@ -4,14 +4,13 @@ metadata {
4
4
  language: iso-639-2:kat
5
5
  source_script: Geor
6
6
  destination_script: Latn
7
- name: ALA-LC Georgian System (1997)
8
- url: https://www.loc.gov/catdir/cpso/romanization/georgian.pdf
7
+ name: Romanization Table -- Georgian Mkhedruli (1997)
8
+ url: http://catdir.loc.gov/catdir/cpso/romanization/georgian.pdf
9
9
  creation_date: 1997
10
10
  confirmation_date: 1997
11
11
  description: |
12
12
  Values are shown for the older Khutsuri and the modern Mkhedruli alphabets.
13
13
  There are no upper case letters in Mkhedruli.
14
-
15
14
  notes:
16
15
  }
17
16
 
@@ -54,27 +53,27 @@ stage {
54
53
  sub "\u10d4", "e" # ე
55
54
  sub "\u10d5", "v" # ვ
56
55
  sub "\u10d6", "z" # ზ
57
-
56
+
58
57
  sub "\u10f1", "ē" # ჱ
59
-
58
+
60
59
  sub "\u10d7", "tʻ" # თ
61
60
  sub "\u10d8", "i" # ი
62
61
  sub "\u10d9", "k" # კ
63
62
  sub "\u10da", "l" # ლ
64
63
  sub "\u10db", "m" # მ
65
64
  sub "\u10dc", "n" # ნ
66
-
65
+
67
66
  sub "\u10f2", "y" # ჲ
68
-
67
+
69
68
  sub "\u10dd", "o" # ო
70
69
  sub "\u10de", "p" # პ
71
70
  sub "\u10df", "ž" # ჟ
72
71
  sub "\u10e0", "r" # რ
73
72
  sub "\u10e1", "s" # ს
74
73
  sub "\u10e2", "t" # ტ
75
-
74
+
76
75
  sub "\u10f3", "w" # ჳ
77
-
76
+
78
77
  sub "\u10e3", "u" # უ
79
78
  sub "\u10e4", "pʻ" # ფ
80
79
  sub "\u10e5", "kʻ" # ქ
@@ -87,14 +86,14 @@ stage {
87
86
  sub "\u10ec", "c" # წ
88
87
  sub "\u10ed", "č" # ჭ
89
88
  sub "\u10ee", "x" # ხ
90
-
89
+
91
90
  sub "\u10f4", "x̣" # ჴ
92
-
91
+
93
92
  sub "\u10ef", "j" # ჯ
94
93
  sub "\u10f0", "h" # ჰ
95
-
94
+
96
95
  sub "\u10f5", "ō" # ჵ
97
-
96
+
98
97
  sub "\u10f6", "f" # ჶ
99
98
  sub "\u10f7", "ĕ" # ჷ
100
99
  sub "\u10f8", "ʻ" # ჸ