interscript-maps 2.0.5

Sign up to get free protection for your applications and to get access to all the features.
Files changed (291) hide show
  1. checksums.yaml +7 -0
  2. data/README.adoc +28 -0
  3. data/interscript-maps.gemspec +28 -0
  4. data/interscript-maps.yaml +235 -0
  5. data/libs/posix.iml +11 -0
  6. data/libs/unicode.iml +13 -0
  7. data/libs/var-Cyrl.iml +7 -0
  8. data/libs/var-kor.iml +17 -0
  9. data/maps-staging/royin-tha-Thai-Latn-1939-generic.imp +98 -0
  10. data/maps-staging/royin-tha-Thai-Latn-1968.imp +156 -0
  11. data/maps-staging/royin-tha-Thai-Latn-1999-chained.imp +161 -0
  12. data/maps-staging/royin-tha-Thai-Latn-1999.imp +78 -0
  13. data/maps-staging/var-tha-Thai-Thai-phonemic.imp +53 -0
  14. data/maps-staging/var-tha-Thai-Zsym-ipa.imp +273 -0
  15. data/maps/acadsin-zho-Hani-Latn-2002.imp +27515 -0
  16. data/maps/alalc-amh-Ethi-Latn-1997.imp +392 -0
  17. data/maps/alalc-amh-Ethi-Latn-2011.imp +85 -0
  18. data/maps/alalc-ara-Arab-Latn-1997.imp +1171 -0
  19. data/maps/alalc-asm-Deva-Latn-1997.imp +214 -0
  20. data/maps/alalc-asm-Deva-Latn-2012.imp +53 -0
  21. data/maps/alalc-aze-Arab-Latn-1997.imp +321 -0
  22. data/maps/alalc-aze-Cyrl-Latn-1997.imp +101 -0
  23. data/maps/alalc-bel-Cyrl-Latn-1997.imp +118 -0
  24. data/maps/alalc-ben-Beng-Latn-1997.imp +225 -0
  25. data/maps/alalc-ben-Beng-Latn-2017.imp +135 -0
  26. data/maps/alalc-bul-Cyrl-Latn-1997.imp +110 -0
  27. data/maps/alalc-div-Thaa-Latn-1997.imp +171 -0
  28. data/maps/alalc-ell-Grek-Latn-1997.imp +381 -0
  29. data/maps/alalc-ell-Grek-Latn-2010.imp +382 -0
  30. data/maps/alalc-guj-Gujr-Latn-1997.imp +223 -0
  31. data/maps/alalc-guj-Gujr-Latn-2011.imp +57 -0
  32. data/maps/alalc-hin-Deva-Latn-1997.imp +248 -0
  33. data/maps/alalc-hin-Deva-Latn-2011.imp +63 -0
  34. data/maps/alalc-kan-Kana-Latn-1997.imp +233 -0
  35. data/maps/alalc-kan-Kana-Latn-2011.imp +58 -0
  36. data/maps/alalc-kat-Geok-Latn-1997.imp +109 -0
  37. data/maps/alalc-kat-Geor-Latn-1997.imp +104 -0
  38. data/maps/alalc-kor-Hang-Latn-1997.imp +68 -0
  39. data/maps/alalc-mal-Mlym-Latn-1997.imp +260 -0
  40. data/maps/alalc-mal-Mlym-Latn-2012.imp +65 -0
  41. data/maps/alalc-mar-Deva-Latn-1997.imp +178 -0
  42. data/maps/alalc-mar-Deva-Latn-2011.imp +51 -0
  43. data/maps/alalc-mkd-Cyrl-Latn-1997.imp +125 -0
  44. data/maps/alalc-mkd-Cyrl-Latn-2013.imp +113 -0
  45. data/maps/alalc-mon-Cyrl-Latn-1997.imp +161 -0
  46. data/maps/alalc-ori-Orya-Latn-1997.imp +234 -0
  47. data/maps/alalc-ori-Orya-Latn-2011.imp +59 -0
  48. data/maps/alalc-pan-Guru-Latn-1997.imp +241 -0
  49. data/maps/alalc-pan-Guru-Latn-2011.imp +71 -0
  50. data/maps/alalc-per-Arab-Latn-1997.imp +318 -0
  51. data/maps/alalc-pli-Deva-Latn-2012.imp +140 -0
  52. data/maps/alalc-pra-Deva-Latn-2012.imp +52 -0
  53. data/maps/alalc-rus-Cyrl-Latn-1997.imp +165 -0
  54. data/maps/alalc-rus-Cyrl-Latn-2012.imp +107 -0
  55. data/maps/alalc-san-Deva-Latn-2012.imp +207 -0
  56. data/maps/alalc-sin-Sinh-Latn-1997.imp +246 -0
  57. data/maps/alalc-sin-Sinh-Latn-2011.imp +63 -0
  58. data/maps/alalc-srp-Cyrl-Latn-1997.imp +124 -0
  59. data/maps/alalc-srp-Cyrl-Latn-2013.imp +115 -0
  60. data/maps/alalc-tam-Taml-Latn-1997.imp +52 -0
  61. data/maps/alalc-tam-Taml-Latn-2011.imp +49 -0
  62. data/maps/alalc-tel-Telu-Latn-1997.imp +237 -0
  63. data/maps/alalc-tel-Telu-Latn-2011.imp +58 -0
  64. data/maps/alalc-ukr-Cyrl-Latn-1997.imp +123 -0
  65. data/maps/alalc-ukr-Cyrl-Latn-2011.imp +32 -0
  66. data/maps/apcbg-bul-Cyrl-Latn-1995.imp +194 -0
  67. data/maps/az-aze-Cyrl-Latn-1939.imp +105 -0
  68. data/maps/az-aze-Cyrl-Latn-1958.imp +50 -0
  69. data/maps/bas-rus-Cyrl-Latn-2017-bss.imp +160 -0
  70. data/maps/bas-rus-Cyrl-Latn-2017-oss.imp +165 -0
  71. data/maps/bgn-jpn-Hrkt-Latn-1962.imp +288 -0
  72. data/maps/bgn-kor-Hang-Latn-1943.imp +31 -0
  73. data/maps/bgn-kor-Kore-Latn-1943.imp +33 -0
  74. data/maps/bgna-bul-Cyrl-Latn-2006.imp +119 -0
  75. data/maps/bgna-bul-Cyrl-Latn-2009.imp +119 -0
  76. data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +393 -0
  77. data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +472 -0
  78. data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +125 -0
  79. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +111 -0
  80. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.imp +169 -0
  81. data/maps/bgnpcgn-bal-Arab-Latn-2008.imp +296 -0
  82. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.imp +200 -0
  83. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +137 -0
  84. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +38 -0
  85. data/maps/bgnpcgn-che-Cyrl-Latn-2008.imp +176 -0
  86. data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +56 -0
  87. data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +90 -0
  88. data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +71 -0
  89. data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +443 -0
  90. data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +269 -0
  91. data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +41 -0
  92. data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +28 -0
  93. data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +111 -0
  94. data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +42 -0
  95. data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +32 -0
  96. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +191 -0
  97. data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +116 -0
  98. data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +43 -0
  99. data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +193 -0
  100. data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +170 -0
  101. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +177 -0
  102. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +40 -0
  103. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +41 -0
  104. data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +240 -0
  105. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +132 -0
  106. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +174 -0
  107. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +168 -0
  108. data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +208 -0
  109. data/maps/bgnpcgn-per-Arab-Latn-1958.imp +312 -0
  110. data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +552 -0
  111. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +445 -0
  112. data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +289 -0
  113. data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +165 -0
  114. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +133 -0
  115. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +195 -0
  116. data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +48 -0
  117. data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +55 -0
  118. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +146 -0
  119. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +185 -0
  120. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +188 -0
  121. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +136 -0
  122. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +88 -0
  123. data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +333 -0
  124. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +145 -0
  125. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +74 -0
  126. data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +7463 -0
  127. data/maps/bis-asm-Beng-Latn-13194-1991.imp +154 -0
  128. data/maps/bis-ben-Beng-Latn-13194-1991.imp +151 -0
  129. data/maps/bis-dev-Deva-Latn-13194-1991.imp +178 -0
  130. data/maps/bis-guj-Gujr-Latn-13194-1991.imp +172 -0
  131. data/maps/bis-kan-Kana-Latn-13194-1991.imp +166 -0
  132. data/maps/bis-mlm-Mlym-Latn-13194-1991.imp +170 -0
  133. data/maps/bis-ori-Orya-Latn-13194-1991.imp +168 -0
  134. data/maps/bis-pnj-Guru-Latn-13194-1991.imp +169 -0
  135. data/maps/bis-tel-Telu-Latn-13194-1991.imp +165 -0
  136. data/maps/bis-tml-Taml-Latn-13194-1991.imp +149 -0
  137. data/maps/by-bel-Cyrl-Latn-1998.imp +123 -0
  138. data/maps/by-bel-Cyrl-Latn-2007.imp +77 -0
  139. data/maps/din-grc-Grek-Latn-31634-2011-t1.imp +627 -0
  140. data/maps/din-hin-Deva-Latn-33904-2018.imp +101 -0
  141. data/maps/din-kat-Geor-Latn-32707-2010.imp +103 -0
  142. data/maps/din-mar-Deva-Latn-33904-2018.imp +83 -0
  143. data/maps/din-nep-Deva-Latn-33904-2018.imp +110 -0
  144. data/maps/din-pli-Deva-Latn-33904-2018.imp +72 -0
  145. data/maps/din-pra-Deva-Latn-33904-2018.imp +66 -0
  146. data/maps/din-san-Deva-Latn-33904-2018.imp +294 -0
  147. data/maps/din-tam-Taml-Latn-33903-2016.imp +187 -0
  148. data/maps/dos-nep-Deva-Latn-1997.imp +47 -0
  149. data/maps/elot-ell-Grek-Latn-743-1982-tl.imp +399 -0
  150. data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +397 -0
  151. data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +34 -0
  152. data/maps/elot-ell-Grek-Latn-743-2001-ts.imp +178 -0
  153. data/maps/ggg-kat-Geor-Latn-2002.imp +75 -0
  154. data/maps/gki-bel-Cyrl-Latn-1992.imp +44 -0
  155. data/maps/gki-bel-Cyrl-Latn-2000.imp +159 -0
  156. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +179 -0
  157. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.imp +132 -0
  158. data/maps/hk-yue-Hani-Latn-1888.imp +29201 -0
  159. data/maps/icao-bel-Cyrl-Latn-9303.imp +136 -0
  160. data/maps/icao-bul-Cyrl-Latn-9303.imp +127 -0
  161. data/maps/icao-fas-Arab-Latn-9303.imp +112 -0
  162. data/maps/icao-heb-Hebr-Latn-9303.imp +160 -0
  163. data/maps/icao-mkd-Cyrl-Latn-9303.imp +126 -0
  164. data/maps/icao-rus-Cyrl-Latn-9303.imp +126 -0
  165. data/maps/icao-srp-Cyrl-Latn-9303.imp +126 -0
  166. data/maps/icao-ukr-Cyrl-Latn-9303.imp +127 -0
  167. data/maps/iso-ara-Arab-Latn-233-1984.imp +301 -0
  168. data/maps/iso-asm-Beng-Latn-15919-2001.imp +73 -0
  169. data/maps/iso-ben-Beng-Latn-15919-2001.imp +171 -0
  170. data/maps/iso-ell-Grek-Latn-843-1997-t1.imp +365 -0
  171. data/maps/iso-ell-Grek-Latn-843-1997-t2.imp +43 -0
  172. data/maps/iso-guj-Gujr-Latn-15919-2001.imp +214 -0
  173. data/maps/iso-hin-Deva-Latn-15919-2001.imp +73 -0
  174. data/maps/iso-inc-Deva-Latn-15919-2001.imp +61 -0
  175. data/maps/iso-jpn-Hrkt-Latn-3602-1989.imp +59 -0
  176. data/maps/iso-kan-Kana-Latn-15919-2001.imp +212 -0
  177. data/maps/iso-kat-Geor-Latn-9984-1996.imp +103 -0
  178. data/maps/iso-kor-Hang-Latn-1996-method1.imp +140 -0
  179. data/maps/iso-kor-Hang-Latn-1996-method2.imp +132 -0
  180. data/maps/iso-mal-Mlym-Latn-15919-2001.imp +276 -0
  181. data/maps/iso-mar-Deva-Latn-15919-2001.imp +68 -0
  182. data/maps/iso-nep-Deva-Latn-15919-2001.imp +75 -0
  183. data/maps/iso-ori-Orya-Latn-15919-2001.imp +188 -0
  184. data/maps/iso-pan-Guru-Latn-15919-2001.imp +217 -0
  185. data/maps/iso-pli-Beng-Latn-15919-2001.imp +66 -0
  186. data/maps/iso-pli-Deva-Latn-15919-2001.imp +68 -0
  187. data/maps/iso-pli-Sinh-Latn-15919-2001.imp +211 -0
  188. data/maps/iso-pli-Thai-Latn-15919-2001.imp +47 -0
  189. data/maps/iso-pra-Deva-Latn-15919-2001.imp +60 -0
  190. data/maps/iso-prs-Arab-Latn-233-3-1999.imp +352 -0
  191. data/maps/iso-rus-Cyrl-Latn-9-1995.imp +279 -0
  192. data/maps/iso-san-Deva-Latn-15919-2001.imp +215 -0
  193. data/maps/iso-tam-Taml-Latn-15919-2001.imp +153 -0
  194. data/maps/iso-tel-Telu-Latn-15919-2001.imp +214 -0
  195. data/maps/iso-tha-Thai-Latn-11940-1998.imp +114 -0
  196. data/maps/kp-kor-Hang-Latn-2002.imp +540 -0
  197. data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +29005 -0
  198. data/maps/masm-mon-Cyrl-Latn-5217-2012.imp +136 -0
  199. data/maps/masm-mon-Latn-Cyrl-5217-2012.imp +162 -0
  200. data/maps/mext-jpn-Hrkt-Latn-1954.imp +403 -0
  201. data/maps/moct-kor-Hang-Latn-2000.imp +475 -0
  202. data/maps/mofa-jpn-Hrkt-Latn-1989.imp +484 -0
  203. data/maps/mv-div-Thaa-Latn-1987.imp +144 -0
  204. data/maps/mvd-bel-Cyrl-Latn-2008.imp +224 -0
  205. data/maps/mvd-bel-Cyrl-Latn-2010.imp +64 -0
  206. data/maps/mvd-rus-Cyrl-Latn-2008.imp +110 -0
  207. data/maps/mvd-rus-Cyrl-Latn-2010.imp +40 -0
  208. data/maps/odni-ara-Arab-Latn-2004.imp +106 -0
  209. data/maps/odni-ara-Arab-Latn-2015.imp +281 -0
  210. data/maps/odni-aze-Cyrl-Latn-2015.imp +158 -0
  211. data/maps/odni-bel-Cyrl-Latn-2015.imp +138 -0
  212. data/maps/odni-bul-Cyrl-Latn-2005.imp +90 -0
  213. data/maps/odni-bul-Cyrl-Latn-2015.imp +103 -0
  214. data/maps/odni-che-Cyrl-Latn-2015.imp +165 -0
  215. data/maps/odni-fas-Arab-Latn-2004.imp +268 -0
  216. data/maps/odni-fas-Arab-Latn-2015.imp +398 -0
  217. data/maps/odni-hin-Deva-Latn-2004.imp +180 -0
  218. data/maps/odni-hin-Deva-Latn-2015.imp +256 -0
  219. data/maps/odni-kat-Geor-Latn-2015.imp +76 -0
  220. data/maps/odni-kaz-Cyrl-Latn-2015.imp +164 -0
  221. data/maps/odni-kir-Cyrl-Latn-2015.imp +149 -0
  222. data/maps/odni-kor-Hang-Latn-2015.imp +307 -0
  223. data/maps/odni-mkd-Cyrl-Latn-2005.imp +28 -0
  224. data/maps/odni-mkd-Cyrl-Latn-2015.imp +124 -0
  225. data/maps/odni-prs-Arab-Latn-2004.imp +120 -0
  226. data/maps/odni-prs-Arab-Latn-2015.imp +225 -0
  227. data/maps/odni-pus-Arab-Latn-2011.imp +327 -0
  228. data/maps/odni-rus-Cyrl-Latn-2015.imp +79 -0
  229. data/maps/odni-srp-Cyrl-Latn-2005.imp +35 -0
  230. data/maps/odni-srp-Cyrl-Latn-2015.imp +130 -0
  231. data/maps/odni-tat-Cyrl-Latn-2015.imp +157 -0
  232. data/maps/odni-tgk-Cyrl-Latn-2015.imp +161 -0
  233. data/maps/odni-tuk-Cyrl-Latn-2015.imp +159 -0
  234. data/maps/odni-uig-Cyrl-Latn-2015.imp +151 -0
  235. data/maps/odni-ukr-Cyrl-Latn-2015.imp +136 -0
  236. data/maps/odni-urd-Arab-Latn-2015.imp +220 -0
  237. data/maps/odni-uzb-Cyrl-Latn-2015.imp +165 -0
  238. data/maps/sac-zho-Hans-Latn-1979.imp +20940 -0
  239. data/maps/sasm-mon-Mong-Latn-general-1978.imp +294 -0
  240. data/maps/sasm-mon-Mong-Latn-phonetic-1978.imp +261 -0
  241. data/maps/ses-ara-Arab-Latn-1930.imp +225 -0
  242. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.imp +171 -0
  243. data/maps/ua-ukr-Cyrl-Latn-1996.imp +149 -0
  244. data/maps/ua-ukr-Cyrl-Latn-2007.imp +69 -0
  245. data/maps/ua-ukr-Cyrl-Latn-2010.imp +128 -0
  246. data/maps/un-amh-Ethi-Latn-2016.imp +483 -0
  247. data/maps/un-ara-Arab-Latn-1971.imp +137 -0
  248. data/maps/un-ara-Arab-Latn-1972.imp +155 -0
  249. data/maps/un-ara-Arab-Latn-2017.imp +375 -0
  250. data/maps/un-asm-Beng-Latn-1972.imp +188 -0
  251. data/maps/un-bel-Cyrl-Latn-2007.imp +78 -0
  252. data/maps/un-ben-Beng-Latn-2016.imp +516 -0
  253. data/maps/un-ell-Grek-Latn-1987-phonetic.imp +437 -0
  254. data/maps/un-ell-Grek-Latn-1987-tl.imp +27 -0
  255. data/maps/un-ell-Grek-Latn-1987-ts.imp +269 -0
  256. data/maps/un-guj-Gujr-Latn-1972.imp +196 -0
  257. data/maps/un-hin-Deva-Latn-2016.imp +356 -0
  258. data/maps/un-kan-Kana-Latn-2016.imp +214 -0
  259. data/maps/un-mal-Mlym-Latn-1972.imp +215 -0
  260. data/maps/un-mar-Deva-Latn-2016.imp +96 -0
  261. data/maps/un-mon-Mong-Latn-general-2013.imp +170 -0
  262. data/maps/un-mon-Mong-Latn-phonetic-2013.imp +170 -0
  263. data/maps/un-nep-Deva-Latn-1972.imp +295 -0
  264. data/maps/un-nep-Deva-Latn-2013.imp +62 -0
  265. data/maps/un-ori-Orya-Latn-1972.imp +208 -0
  266. data/maps/un-pan-Guru-Latn-1972.imp +321 -0
  267. data/maps/un-prs-Arab-Latn-1967.imp +214 -0
  268. data/maps/un-rus-Cyrl-Latn-1987.imp +96 -0
  269. data/maps/un-sin-Sinh-Latn-1972.imp +193 -0
  270. data/maps/un-tam-Taml-Latn-1972.imp +173 -0
  271. data/maps/un-tel-Telu-Latn-1972.imp +229 -0
  272. data/maps/un-ukr-Cyrl-Latn-1998.imp +58 -0
  273. data/maps/un-ukr-Cyrl-Latn-2012.imp +95 -0
  274. data/maps/un-urd-Arab-Latn-1972.imp +290 -0
  275. data/maps/var-amh-Ethi-Latn-eae-2003.imp +414 -0
  276. data/maps/var-gez-Ethi-Latn-eae-2003.imp +54 -0
  277. data/maps/var-hin-Deva-Latn-hunterian-1872.imp +212 -0
  278. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.imp +399 -0
  279. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.imp +382 -0
  280. data/maps/var-kor-Hang-Hang-jamo.imp +11196 -0
  281. data/maps/var-kor-Hang-Latn-mr-1939.imp +574 -0
  282. data/maps/var-kor-Kore-Hang-2013.imp +59764 -0
  283. data/maps/var-kor-Kore-Latn-mr-1939.imp +36 -0
  284. data/maps/var-mar-Deva-Latn-hunterian-1872.imp +39 -0
  285. data/maps/var-mon-Mong-Latn-1930.imp +101 -0
  286. data/maps/var-mon-Mong-Latn-lessing.imp +181 -0
  287. data/maps/var-mon-Mong-Latn-vpmc.imp +182 -0
  288. data/maps/var-pra-Deva-Latn-iast-1912.imp +36 -0
  289. data/maps/var-san-Deva-Latn-iast-1912.imp +147 -0
  290. data/maps/var-zho-Hani-Latn-wd-1979.imp +27549 -0
  291. metadata +335 -0
@@ -0,0 +1,356 @@
1
+ metadata {
2
+ authority_id: ungegn
3
+ id: 2016
4
+ language: iso-639-2:hin
5
+ source_script: Deva
6
+ destination_script: Latn
7
+ name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Hindi Romanization, 1972
8
+ url: https://www.eki.ee/wgrs/rom1_hi.pdf
9
+ creation_date: 1972
10
+ confirmation_date: 2016
11
+ description: |
12
+ The United Nations recommended system was approved in 1972 (II/11) and amended in 1977
13
+ (III/12), based on a report prepared by D. N. Sharma. The tables and their corrections were
14
+ published in volume II of the conference reports.
15
+
16
+ There is no evidence of the use of the system either in India or in international cartographic
17
+ products. It was stated in 1987 that the appropriate resolution had not been implemented in
18
+ India and the Hunterian system was still in use in large-scale mapping.
19
+
20
+ Hindi uses the alphasyllabic script Devanāgarī whereby each character represents a syllable
21
+ rather than one sound. Vowels and diphthongs are marked in two ways: as independent
22
+ characters (used syllable-initially) and in an abbreviated form, to denote vowels after
23
+ consonants. The romanization table is unambiguous but the user would have to recognize
24
+ many ligatures not given in the original table (only three are given). The system is mostly
25
+ reversible but there may exist some ambiguities in the romanization of vowels (independent
26
+ vs. abbreviated characters) and consonants.
27
+
28
+ notes:
29
+ - |
30
+ It is recommended that the vowel अ (a) should always be romanized except when it ends a
31
+ name. If a name ends with a consonant, the consonant should carry a sub-macron. Such
32
+ cases, however, will be very rare. For example, कानपुर Kānapur (not Kānapura), जगत्
33
+ Jagat.
34
+ - |
35
+ If each letter of a digraph or any two parts of a trigraph has a distinct independent sound
36
+ then it should be indicated by a hyphen, thus d-h.
37
+
38
+ ######################################## Additional Note ############################################################
39
+ # It is recommended that the vowel अ (a) should always be romanized except when it ends a #
40
+ # name. In the scheme we are not yet able to detect a name. Analysing language pattern and the example #
41
+ # we found that actually when a word ends with a consonant it should be transliterated without the vowel in it. #
42
+ # so we are applying this rule as if a word ends with a consonant, in this case we are removing the ending 'a'. #
43
+ #####################################################################################################################
44
+ }
45
+
46
+ tests {
47
+ test "दिल्ली", "dillī"
48
+ test "भारत", "bhārat"
49
+ test "परिपक्क", "paripakk"
50
+ test "जगत्", "jagat"
51
+ test "संख्या", "saṁkhyā"
52
+ test "गंभीर मरीजों के मामले में भारत दूसरे नंबर पर", "gaṁbhīr marījoṁ ke māmale meṁ bhārat dūsare naṁbar par"
53
+ test "कोरोना अपडेट्स", "koronā apaḍeṭs"
54
+ test "सीडीसी चीफ का बयान अहम", "sīḍīsī chīph kā bayān aham"
55
+ test "गूगल प्ले स्टोर पर पेटीएम की वापसी", "gūgal ple sṭor par peṭīem kī vāpasī"
56
+ test "भारत में गैंबलिंग की इजाजत नहीं", "bhārat meṁ gaiṁbaliṁg kī ijājat nahīṁ"
57
+ test "कोरोना वैक्सीन मुद्दे पर घिरे राष्ट्रपति; जो बाइडेन बोले- मुझे और देश को वैज्ञानिकों पर भरोसा है, डोनाल्ड ट्रम्प पर नहीं", "koronā vaiksīn mudde par ghire rāṣhṭrapati; jo bāiḍen bole- mujhe aur desh ko vaijñānikoṁ par bharosā hai, ḍonālḍ ṭramp par nahīṁ"
58
+ test "गूगल की कार्रवाई पर पेटीएम ने कहा था कि ऐप को अस्थायी तौर पर प्ले-स्टोर से हटाया गया है, आपके पैसे सुरक्षित हैं", "gūgal kī kārravāī par peṭīem ne kahā thā ki aip ko asthāyī taur par ple-sṭor se haṭāyā gayā hai, āpake paise surakṣhit haiṁ"
59
+ }
60
+
61
+
62
+ aliases {
63
+ def_alias deva_characters_1, any("\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d")
64
+ }
65
+
66
+ stage {
67
+
68
+ # RULES
69
+ sub "क" + maybe("="), "k", after: deva_characters_1
70
+ sub "क", "k", after: boundary
71
+
72
+ sub "ख" + maybe("="), "kh", after: deva_characters_1
73
+ sub "ख", "kh", after: boundary
74
+
75
+ sub "ग" + maybe("="), "g", after: deva_characters_1
76
+ sub "ग", "g", after: boundary
77
+
78
+ sub "घ" + maybe("="), "gh", after: deva_characters_1
79
+ sub "घ", "gh", after: boundary
80
+
81
+ sub "ङ" + maybe("="), "ṅ", after: deva_characters_1
82
+ sub "ङ", "ṅ", after: boundary
83
+
84
+ sub "च" + maybe("="), "ch", after: deva_characters_1
85
+ sub "च", "ch", after: boundary
86
+
87
+ sub "छ" + maybe("="), "chh", after: deva_characters_1
88
+ sub "छ", "chh", after: boundary
89
+
90
+ sub "ज" + maybe("="), "j", after: deva_characters_1
91
+ sub "ज", "j", after: boundary
92
+
93
+ sub "झ" + maybe("="), "jh", after: deva_characters_1
94
+ sub "झ", "jh", after: boundary
95
+
96
+ sub "ञ" + maybe("="), "ñ", after: deva_characters_1
97
+ sub "ञ", "ñ", after: boundary
98
+
99
+ sub "ट" + maybe("="), "ṭ", after: deva_characters_1
100
+ sub "ट", "ṭ", after: boundary
101
+
102
+ sub "ठ" + maybe("="), "ṭh", after: deva_characters_1
103
+ sub "ठ", "ṭh", after: boundary
104
+
105
+ sub "ड" + maybe("="), "ḍ", after: deva_characters_1
106
+ sub "ड", "ḍ", after: boundary
107
+
108
+ sub "ढ" + maybe("="), "ḍh", after: deva_characters_1
109
+ sub "ढ", "ḍh", after: boundary
110
+
111
+ sub "ण" + maybe("="), "ṇ", after: deva_characters_1
112
+ sub "ण", "ṇ", after: boundary
113
+
114
+ sub "त" + maybe("="), "t", after: deva_characters_1
115
+ sub "त", "t", after: boundary
116
+
117
+ sub "थ" + maybe("="), "th", after: deva_characters_1
118
+ sub "थ", "th", after: boundary
119
+
120
+ sub "द" + maybe("="), "d", after: deva_characters_1
121
+ sub "द", "d", after: boundary
122
+
123
+ sub "ध" + maybe("="), "dh", after: deva_characters_1
124
+ sub "ध", "dh", after: boundary
125
+
126
+ sub "न" + maybe("="), "n", after: deva_characters_1
127
+ sub "न", "n", after: boundary
128
+
129
+ sub "प" + maybe("="), "p", after: deva_characters_1
130
+ sub "प", "p", after: boundary
131
+
132
+ sub "फ" + maybe("="), "ph", after: deva_characters_1
133
+ sub "फ", "ph", after: boundary
134
+
135
+ sub "ब" + maybe("="), "b", after: deva_characters_1
136
+ sub "ब", "b", after: boundary
137
+
138
+ sub "भ" + maybe("="), "bh", after: deva_characters_1
139
+ sub "भ", "bh", after: boundary
140
+
141
+ sub "म" + maybe("="), "m", after: deva_characters_1
142
+ sub "म", "m", after: boundary
143
+
144
+ sub "य" + maybe("="), "y", after: deva_characters_1
145
+ sub "य", "y", after: boundary
146
+
147
+ sub "र" + maybe("="), "r", after: deva_characters_1
148
+ sub "र", "r", after: boundary
149
+
150
+ sub "ल" + maybe("="), "l", after: deva_characters_1
151
+ sub "ल", "l", after: boundary
152
+
153
+ sub "व" + maybe("="), "v", after: deva_characters_1
154
+ sub "व", "v", after: boundary
155
+
156
+ sub "श" + maybe("="), "sh", after: deva_characters_1
157
+ sub "श", "sh", after: boundary
158
+
159
+ sub "ष" + maybe("="), "ṣh", after: deva_characters_1
160
+ sub "ष", "ṣh", after: boundary
161
+
162
+ sub "स" + maybe("="), "s", after: deva_characters_1
163
+ sub "स", "s", after: boundary
164
+
165
+ sub "क़" + maybe("="), "q", after: deva_characters_1
166
+ sub "क़", "q", after: boundary
167
+
168
+ sub "ख़" + maybe("="), "ḳh", after: deva_characters_1
169
+ sub "ख़", "ḳh", after: boundary
170
+
171
+ sub "ग़" + maybe("="), "g", after: deva_characters_1
172
+ sub "ग़", "g", after: boundary
173
+
174
+ sub "ज़" + maybe("="), "z", after: deva_characters_1
175
+ sub "ज़", "z", after: boundary
176
+
177
+ sub "ड़" + maybe("="), "ṙ", after: deva_characters_1
178
+ sub "ड़", "ṙ", after: boundary
179
+
180
+ sub "ढ़" + maybe("="), "ṙh", after: deva_characters_1
181
+ sub "ढ़", "ṙh", after: boundary
182
+
183
+ sub "फ़" + maybe("="), "f", after: deva_characters_1
184
+ sub "फ़", "f", after: boundary
185
+
186
+ sub "ह" + maybe("="), "h", after: deva_characters_1
187
+ sub "ह", "h", after: boundary
188
+
189
+
190
+ # CHARACTERS
191
+ parallel {
192
+
193
+ # I. Independent vowel characters
194
+ sub "अ", "a"
195
+ sub "आ", "ā"
196
+ sub "इ", "i"
197
+ sub "ई", "ī"
198
+ sub "उ", "u"
199
+ sub "ऊ", "ū"
200
+ sub "ऋ", "ṛ"
201
+ sub "ॠ", "ṝ"
202
+ sub "ऌ", "l̤"
203
+ sub "ए", "e"
204
+ sub "ऐ", "ai"
205
+ sub "ओ", "o"
206
+ sub "औ", "au"
207
+
208
+ # II. Abbreviated vowel characters
209
+
210
+ sub "ा", "ā" # का
211
+ sub "ॉ", "ā̆ " # additional mark: कॉ
212
+ sub "ि", "i" # कि i
213
+ sub "ी", "ī" # की
214
+ sub "ु", "u" # कु
215
+ sub "ू", "ū" # कू
216
+ sub "ृ", "ṛ" # कृ
217
+ sub "े", "e" # के
218
+ sub "ै", "ai" # कै
219
+ sub "ो", "o" # को
220
+ sub "ौ", "au" # कौ
221
+
222
+
223
+ # Consonants (see Note 1)
224
+
225
+ # Gutturals
226
+ sub "क", "ka"
227
+ sub "ख", "kha"
228
+ sub "ग", "ga"
229
+ sub "घ", "gha"
230
+ sub "ङ", "ṅa"
231
+
232
+ # Palatals
233
+ sub "च", "cha"
234
+ sub "छ", "chha"
235
+ sub "ज", "ja"
236
+ sub "झ", "jha"
237
+ sub "ञ", "ña"
238
+
239
+ # Cerebrals
240
+ sub "ट", "ṭa"
241
+ sub "ठ", "ṭha"
242
+ sub "ड", "ḍa"
243
+ sub "ढ", "ḍha"
244
+ sub "ण", "ṇa"
245
+
246
+ # Dentals
247
+ sub "त", "ta"
248
+ sub "थ", "tha"
249
+ sub "द", "da"
250
+ sub "ध", "dha"
251
+ sub "न", "na"
252
+
253
+ # Labials
254
+ sub "प", "pa"
255
+ sub "फ", "pha"
256
+ sub "ब", "ba"
257
+ sub "भ", "bha"
258
+ sub "म", "ma"
259
+
260
+ # Semivowels
261
+ sub "य", "ya"
262
+ sub "र", "ra"
263
+ sub "ल", "la"
264
+ sub "व", "va"
265
+
266
+ # Sibilants
267
+ sub "श", "sha"
268
+ sub "ष", "ṣha"
269
+ sub "स", "sa"
270
+
271
+ # Dotted variants
272
+ sub "क़", "qa"
273
+ sub "ख़", "ḳha"
274
+ sub "ग़", "ġa"
275
+ sub "ज़", "za"
276
+ sub "ड़", "ṙa"
277
+ sub "ढ़", "ṙha"
278
+ sub "फ़", "fa"
279
+
280
+
281
+ # Aspirate
282
+ sub "ह", "ha"
283
+
284
+ # Anusvāra
285
+ sub "ं", "ṁ"
286
+
287
+ # Anunāsika
288
+ sub "ँ", "m̐"
289
+
290
+ # halanta
291
+ sub "्", ""
292
+
293
+ # bisharga
294
+ sub "ः", "ḥ"
295
+
296
+ # V. Ligatures (to cover all ligatures in Unicode)
297
+ # Implementing pronunciation without a vowel: क् k.
298
+
299
+ # Gutturals
300
+ sub "क्", "k"
301
+ sub "ख्", "kh"
302
+ sub "ग्", "g"
303
+ sub "घ्", "gh"
304
+ sub "ङ्", "ṅ"
305
+
306
+ # Palatals
307
+ sub "च्", "ch"
308
+ sub "छ्", "chh"
309
+ sub "ज्", "j"
310
+ sub "झ्", "jh"
311
+ sub "ञ्", "ñ"
312
+
313
+ # Cerebrals
314
+ sub "ट्", "ṭ"
315
+ sub "ठ्", "ṭh"
316
+ sub "ड्", "ḍ"
317
+ sub "ढ्", "ḍh"
318
+ sub "ण्", "ṇ"
319
+
320
+ # Dentals
321
+ sub "त्", "t"
322
+ sub "थ्", "th"
323
+ sub "द्", "d"
324
+ sub "ध्", "dh"
325
+ sub "न्", "n"
326
+
327
+ # Labials
328
+ sub "प्", "p"
329
+ sub "फ्", "ph"
330
+ sub "ब्", "b"
331
+ sub "भ्", "bh"
332
+ sub "म्", "m"
333
+
334
+ # Semivowels
335
+ sub "य्", "y"
336
+ sub "र्", "r"
337
+ sub "ल्", "l"
338
+ sub "व्", "v"
339
+
340
+ # Sibilants
341
+ sub "श्", "sh"
342
+ sub "ष्", "ṣh"
343
+ sub "स्", "s"
344
+
345
+ # Dotted variants
346
+ sub "क़्", "q"
347
+ sub "ख़्", "ḳh"
348
+ sub "ग़्", "ġ"
349
+ sub "ज़्", "z"
350
+ sub "ड़्", "ṙ"
351
+ sub "ढ़्", "ṙh"
352
+ sub "फ़्", "f"
353
+ }
354
+ compose
355
+ }
356
+
@@ -0,0 +1,214 @@
1
+ metadata {
2
+ authority_id: ungegn
3
+ id: 2016
4
+ language: iso-639-2:kan
5
+ source_script: Kana
6
+ destination_script: Latn
7
+ name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Kannada Romanization, 1972
8
+ url: https://www.eki.ee/wgrs/rom1_kn.pdf
9
+ creation_date: 1972
10
+ confirmation_date: 2016
11
+ description: |
12
+ The United Nations recommended system was approved in 1972 (II/11) and amended in 1977
13
+ (III/12), based on a report prepared by D. N. Sharma. The tables and their corrections were
14
+ published in volume II of the conference reports.
15
+
16
+ There is no evidence of the use of the system either in India or in international cartographic
17
+ products.
18
+
19
+ Kannada uses an alphasyllabic script whereby each character represents a syllable rather than
20
+ one sound. Vowels and diphthongs are marked in two ways: as independent characters (used
21
+ syllable-initially) and in an abbreviated form, to denote vowels after consonants. The
22
+ romanization table is unambiguous. The system is mostly reversible but there may exist some
23
+ ambiguities in the romanization of vowels (independent vs. abbreviated characters) and
24
+ consonants (combinations with subscript consonants vs. character sequences).
25
+
26
+ notes:
27
+ - |
28
+ While most consonants have a diacritic in the upper right corner of the character (like ಕ),
29
+ some do not, e.g. ಖ kha, ಜ ja, ನ na, ಬ ba, ಲ la.
30
+ - |
31
+ Combinations with r as the first component are written by adding a special symbol after the
32
+ second consonant: ರ್ಗ rga.
33
+ }
34
+
35
+ tests {
36
+ test "ಕರ್ಣಾಟಕ", "karṇāṭaka"
37
+ test "ಬೆಂಗಳೂರು", "bĕṁgaḷūru"
38
+ test "ಮಹಾರಾಷ್ಟ್ರದ ಯಾವುದೇ ಪ್ರಕರಣದ ತನಿಖೆಗೆ ಇನ್ನು ಸಿಬಿಐ ಪಡೆಯಬೇಕು ಅನುಮತಿ", "mahārāṣhṭrada yāvude prakaraṇada tanikhĕgĕ innu sibiai paḍĕyabeku anumati"
39
+ test "ಹರಕು ಬಾಯಿ: ಈಶ್ವರಪ್ಪಗೆ ಶಾಸಕ ಯತ್ನಾಳ ತಿರುಗೇಟು", "haraku bāyi: īshvarappagĕ shāsaka yatnāḷa tirugeṭu"
40
+ test "ಹಾಥರಸ್‌ ಪ್ರಕರಣ: ೨೯ರಂದು ರಾಷ್ಟ್ರವ್ಯಾಪಿ ಪ್ರತಿಭಟನೆಗೆ ಮಹಿಳಾ ಸಂಘಟನೆಗಳ ಕರೆ", "hātharas prakaraṇa: 29raṁdu rāṣhṭravyāpi pratibhaṭanĕgĕ mahiḷā saṁghaṭanĕgaḷa karĕ"
41
+ test "ಪೊಲೀಸ್‌ ಮಕ್ಕಳ ಶಾಲೆ ಮುಚ್ಚುವ ಯತ್ನಕ್ಕೆ ಹೊರಟ್ಟಿ ತೀವ್ರ ವಿರೋಧ", "pŏlīs makkaḷa shālĕ muchchuva yatnakkĕ hŏraṭṭi tīvra virodha"
42
+ test "ಅಮೆರಿಕ ಅಧ್ಯಕ್ಷೀಯ ಚುನಾವಣೆ: ಟ್ರಂಪ್‌–ಬೈಡನ್‌ ಅಂತಿಮ ಮುಖಾಮುಖಿಗೆ ವೇದಿಕೆ ಸಿದ್ಧ", "amĕrika adhyakṣhīya chunāvaṇĕ: ṭraṁp–baiḍan aṁtima mukhāmukhigĕ vedikĕ siddha"
43
+ test "ಅಂಜನಾದ್ರಿ ಆಂಜನೇಯನ ದರ್ಶನ ಪಡೆದ ಪವರ್ ಸ್ಟಾರ್ ಪುನೀತ್ ರಾಜ್ ಕುಮಾರ್", "aṁjanādri āṁjaneyana darshana paḍĕda pavar sṭār punīt rāj kumār"
44
+ test "ಇನ್ನು ಹಿಂದೂ ದೇವಸ್ಥಾನದ ಧಾರ್ಮಿಕ ಕಾರ್ಯದಲ್ಲಿ ಭಾಗಿಯಾಗಿದ್ದಕ್ಕೆ ಮೋಯಿದ್ದೀನ್ ಬಾವಾಗೆ ಬೆದರಿಕೆ ಒಡ್ಡಲಾಗಿದೆ", "innu hiṁdū devasthānada dhārmika kāryadalli bhāgiyāgiddakkĕ moyiddīn bāvāgĕ bĕdarikĕ ŏḍḍalāgidĕ"
45
+ test "ಇದು ಮೋದಿ ದೇಶ - ದನ ತಿಂದು ಹೋದ್ರೆ ಹುಷಾರ್ : ದೇಗುಲಕ್ಕೆ ಹೋಗಿದ್ದ ಬಾವಾಗೆ ಬೆದರಿಕೆ", "idu modi desha - dana tiṁdu hodrĕ huṣhār : degulakkĕ hogidda bāvāgĕ bĕdarikĕ"
46
+ }
47
+
48
+ aliases {
49
+ def_alias characters_set1, any("\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd")
50
+ }
51
+
52
+ stage {
53
+
54
+ # RULES
55
+ # to cover diacritic and vowel less consonants
56
+ sub "ಕ", "k", after: characters_set1
57
+ sub "ಖ", "kh", after: characters_set1
58
+ sub "ಗ", "g", after: characters_set1
59
+ sub "ಘ", "gh", after: characters_set1
60
+ sub "ಙ", "ṅ", after: characters_set1
61
+ sub "ಚ", "ch", after: characters_set1
62
+ sub "ಛ", "chh", after: characters_set1
63
+ sub "ಜ", "j", after: characters_set1
64
+ sub "ಝ", "jh", after: characters_set1
65
+ sub "ಞ", "ñ", after: characters_set1
66
+ sub "ಟ", "ṭ", after: characters_set1
67
+ sub "ಠ", "ṭh", after: characters_set1
68
+ sub "ಡ", "ḍ", after: characters_set1
69
+ sub "ಢ", "ḍh", after: characters_set1
70
+ sub "ಣ", "ṇ", after: characters_set1
71
+ sub "ತ", "t", after: characters_set1
72
+ sub "ಥ", "th", after: characters_set1
73
+ sub "ದ", "d", after: characters_set1
74
+ sub "ಧ", "dh", after: characters_set1
75
+ sub "ನ", "n", after: characters_set1
76
+ sub "ಪ", "p", after: characters_set1
77
+ sub "ಫ", "ph", after: characters_set1
78
+ sub "ಬ", "b", after: characters_set1
79
+ sub "ಭ", "bh", after: characters_set1
80
+ sub "ಮ", "m", after: characters_set1
81
+ sub "ಯ", "y", after: characters_set1
82
+ sub "ರ", "r", after: characters_set1
83
+ sub "ಲ", "l", after: characters_set1
84
+ sub "ಳ", "ḷ", after: characters_set1
85
+ sub "ವ", "v", after: characters_set1
86
+ sub "ಶ", "sh", after: characters_set1
87
+ sub "ಷ", "ṣh", after: characters_set1
88
+ sub "ಸ", "s", after: characters_set1
89
+ sub "ಹ", "h", after: characters_set1
90
+
91
+
92
+ # CHARACTERS
93
+ parallel {
94
+ sub "ಅ", "a"
95
+ sub "ಆ", "ā"
96
+ sub "ಇ", "i"
97
+ sub "ಈ", "ī"
98
+ sub "ಉ", "u"
99
+ sub "ಊ", "ū"
100
+ sub "ಋ", "ṛ"
101
+
102
+ sub "ಎ", "ĕ"
103
+ sub "ಏ", "e"
104
+ sub "ಐ", "ai"
105
+
106
+ sub "ಒ", "ŏ"
107
+ sub "ಓ", "o"
108
+ sub "ಔ", "au"
109
+
110
+ # Gutturals
111
+ sub "ಕ", "ka"
112
+ sub "ಖ", "kha"
113
+ sub "ಗ", "ga"
114
+ sub "ಘ", "gha"
115
+ sub "ಙ", "ṅa"
116
+
117
+ # Palatals
118
+ sub "ಚ", "cha"
119
+ sub "ಛ", "chha"
120
+ sub "ಜ", "ja"
121
+ sub "ಝ", "jha"
122
+ sub "ಞ", "ña"
123
+
124
+ # Cerebrals
125
+ sub "ಟ", "ṭa"
126
+ sub "ಠ", "ṭha"
127
+ sub "ಡ", "ḍa"
128
+ sub "ಢ", "ḍha"
129
+ sub "ಣ", "ṇa"
130
+
131
+ # Dentals
132
+ sub "ತ", "ta"
133
+ sub "ಥ", "tha"
134
+ sub "ದ", "da"
135
+ sub "ಧ", "dha"
136
+ sub "ನ", "na"
137
+
138
+ # Labials
139
+ sub "ಪ", "pa"
140
+ sub "ಫ", "pha"
141
+ sub "ಬ", "ba"
142
+ sub "ಭ", "bha"
143
+ sub "ಮ", "ma"
144
+
145
+ # Semivowels
146
+ sub "ಯ", "ya"
147
+ sub "ರ", "ra"
148
+ sub "ಲ", "la"
149
+ sub "ಳ", "ḷa"
150
+
151
+
152
+ sub "ವ", "va"
153
+
154
+ # Sibilants
155
+ sub "ಶ", "sha"
156
+ sub "ಷ", "ṣha"
157
+ sub "ಸ", "sa"
158
+
159
+
160
+ # Aspirate
161
+ sub "ಹ", "ha"
162
+
163
+
164
+ # Bisarga
165
+ sub "ಃ", "ḥ"
166
+
167
+ # Anusvāra
168
+ sub "ಂ", "ṁ"
169
+
170
+ sub "\u0cbc", "" #nukta
171
+
172
+ # Medials (needed for connecting consonants)
173
+ sub "ಾ", "ā"
174
+ sub "ಿ", "i"
175
+ sub "ೀ", "ī"
176
+ sub "ು", "u"
177
+ sub "ೂ", "ū"
178
+ sub "ೃ", "ṛ"
179
+
180
+
181
+ sub "ೆ", "ĕ"
182
+ sub "ೇ", "e"
183
+ sub "ೈ", "ai"
184
+
185
+
186
+ sub "ೊ", "ŏ"
187
+ sub "ೋ", "o"
188
+ sub "ೌ", "au"
189
+
190
+
191
+ sub "्", ""
192
+ sub "़", ""
193
+ sub "್", "" # used for pronunciation without vowel
194
+ sub "‍", "" # no need for zero with joiner
195
+ sub "‌", "" # no need for zero with non joiner
196
+
197
+
198
+
199
+ # Digits
200
+
201
+ sub "೦", "0"
202
+ sub "೧", "1"
203
+ sub "೨", "2"
204
+ sub "೩", "3"
205
+ sub "೪", "4"
206
+ sub "೫", "5"
207
+ sub "೬", "6"
208
+ sub "೭", "7"
209
+ sub "೮", "8"
210
+ sub "೯", "9"
211
+ }
212
+
213
+ compose
214
+ }