interscript-maps 2.0.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (291) hide show
  1. checksums.yaml +7 -0
  2. data/README.adoc +28 -0
  3. data/interscript-maps.gemspec +28 -0
  4. data/interscript-maps.yaml +235 -0
  5. data/libs/posix.iml +11 -0
  6. data/libs/unicode.iml +13 -0
  7. data/libs/var-Cyrl.iml +7 -0
  8. data/libs/var-kor.iml +17 -0
  9. data/maps-staging/royin-tha-Thai-Latn-1939-generic.imp +98 -0
  10. data/maps-staging/royin-tha-Thai-Latn-1968.imp +156 -0
  11. data/maps-staging/royin-tha-Thai-Latn-1999-chained.imp +161 -0
  12. data/maps-staging/royin-tha-Thai-Latn-1999.imp +78 -0
  13. data/maps-staging/var-tha-Thai-Thai-phonemic.imp +53 -0
  14. data/maps-staging/var-tha-Thai-Zsym-ipa.imp +273 -0
  15. data/maps/acadsin-zho-Hani-Latn-2002.imp +27515 -0
  16. data/maps/alalc-amh-Ethi-Latn-1997.imp +392 -0
  17. data/maps/alalc-amh-Ethi-Latn-2011.imp +85 -0
  18. data/maps/alalc-ara-Arab-Latn-1997.imp +1171 -0
  19. data/maps/alalc-asm-Deva-Latn-1997.imp +214 -0
  20. data/maps/alalc-asm-Deva-Latn-2012.imp +53 -0
  21. data/maps/alalc-aze-Arab-Latn-1997.imp +321 -0
  22. data/maps/alalc-aze-Cyrl-Latn-1997.imp +101 -0
  23. data/maps/alalc-bel-Cyrl-Latn-1997.imp +118 -0
  24. data/maps/alalc-ben-Beng-Latn-1997.imp +225 -0
  25. data/maps/alalc-ben-Beng-Latn-2017.imp +135 -0
  26. data/maps/alalc-bul-Cyrl-Latn-1997.imp +110 -0
  27. data/maps/alalc-div-Thaa-Latn-1997.imp +171 -0
  28. data/maps/alalc-ell-Grek-Latn-1997.imp +381 -0
  29. data/maps/alalc-ell-Grek-Latn-2010.imp +382 -0
  30. data/maps/alalc-guj-Gujr-Latn-1997.imp +223 -0
  31. data/maps/alalc-guj-Gujr-Latn-2011.imp +57 -0
  32. data/maps/alalc-hin-Deva-Latn-1997.imp +248 -0
  33. data/maps/alalc-hin-Deva-Latn-2011.imp +63 -0
  34. data/maps/alalc-kan-Kana-Latn-1997.imp +233 -0
  35. data/maps/alalc-kan-Kana-Latn-2011.imp +58 -0
  36. data/maps/alalc-kat-Geok-Latn-1997.imp +109 -0
  37. data/maps/alalc-kat-Geor-Latn-1997.imp +104 -0
  38. data/maps/alalc-kor-Hang-Latn-1997.imp +68 -0
  39. data/maps/alalc-mal-Mlym-Latn-1997.imp +260 -0
  40. data/maps/alalc-mal-Mlym-Latn-2012.imp +65 -0
  41. data/maps/alalc-mar-Deva-Latn-1997.imp +178 -0
  42. data/maps/alalc-mar-Deva-Latn-2011.imp +51 -0
  43. data/maps/alalc-mkd-Cyrl-Latn-1997.imp +125 -0
  44. data/maps/alalc-mkd-Cyrl-Latn-2013.imp +113 -0
  45. data/maps/alalc-mon-Cyrl-Latn-1997.imp +161 -0
  46. data/maps/alalc-ori-Orya-Latn-1997.imp +234 -0
  47. data/maps/alalc-ori-Orya-Latn-2011.imp +59 -0
  48. data/maps/alalc-pan-Guru-Latn-1997.imp +241 -0
  49. data/maps/alalc-pan-Guru-Latn-2011.imp +71 -0
  50. data/maps/alalc-per-Arab-Latn-1997.imp +318 -0
  51. data/maps/alalc-pli-Deva-Latn-2012.imp +140 -0
  52. data/maps/alalc-pra-Deva-Latn-2012.imp +52 -0
  53. data/maps/alalc-rus-Cyrl-Latn-1997.imp +165 -0
  54. data/maps/alalc-rus-Cyrl-Latn-2012.imp +107 -0
  55. data/maps/alalc-san-Deva-Latn-2012.imp +207 -0
  56. data/maps/alalc-sin-Sinh-Latn-1997.imp +246 -0
  57. data/maps/alalc-sin-Sinh-Latn-2011.imp +63 -0
  58. data/maps/alalc-srp-Cyrl-Latn-1997.imp +124 -0
  59. data/maps/alalc-srp-Cyrl-Latn-2013.imp +115 -0
  60. data/maps/alalc-tam-Taml-Latn-1997.imp +52 -0
  61. data/maps/alalc-tam-Taml-Latn-2011.imp +49 -0
  62. data/maps/alalc-tel-Telu-Latn-1997.imp +237 -0
  63. data/maps/alalc-tel-Telu-Latn-2011.imp +58 -0
  64. data/maps/alalc-ukr-Cyrl-Latn-1997.imp +123 -0
  65. data/maps/alalc-ukr-Cyrl-Latn-2011.imp +32 -0
  66. data/maps/apcbg-bul-Cyrl-Latn-1995.imp +194 -0
  67. data/maps/az-aze-Cyrl-Latn-1939.imp +105 -0
  68. data/maps/az-aze-Cyrl-Latn-1958.imp +50 -0
  69. data/maps/bas-rus-Cyrl-Latn-2017-bss.imp +160 -0
  70. data/maps/bas-rus-Cyrl-Latn-2017-oss.imp +165 -0
  71. data/maps/bgn-jpn-Hrkt-Latn-1962.imp +288 -0
  72. data/maps/bgn-kor-Hang-Latn-1943.imp +31 -0
  73. data/maps/bgn-kor-Kore-Latn-1943.imp +33 -0
  74. data/maps/bgna-bul-Cyrl-Latn-2006.imp +119 -0
  75. data/maps/bgna-bul-Cyrl-Latn-2009.imp +119 -0
  76. data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +393 -0
  77. data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +472 -0
  78. data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +125 -0
  79. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +111 -0
  80. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.imp +169 -0
  81. data/maps/bgnpcgn-bal-Arab-Latn-2008.imp +296 -0
  82. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.imp +200 -0
  83. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +137 -0
  84. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +38 -0
  85. data/maps/bgnpcgn-che-Cyrl-Latn-2008.imp +176 -0
  86. data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +56 -0
  87. data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +90 -0
  88. data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +71 -0
  89. data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +443 -0
  90. data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +269 -0
  91. data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +41 -0
  92. data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +28 -0
  93. data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +111 -0
  94. data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +42 -0
  95. data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +32 -0
  96. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +191 -0
  97. data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +116 -0
  98. data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +43 -0
  99. data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +193 -0
  100. data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +170 -0
  101. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +177 -0
  102. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +40 -0
  103. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +41 -0
  104. data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +240 -0
  105. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +132 -0
  106. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +174 -0
  107. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +168 -0
  108. data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +208 -0
  109. data/maps/bgnpcgn-per-Arab-Latn-1958.imp +312 -0
  110. data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +552 -0
  111. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +445 -0
  112. data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +289 -0
  113. data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +165 -0
  114. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +133 -0
  115. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +195 -0
  116. data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +48 -0
  117. data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +55 -0
  118. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +146 -0
  119. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +185 -0
  120. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +188 -0
  121. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +136 -0
  122. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +88 -0
  123. data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +333 -0
  124. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +145 -0
  125. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +74 -0
  126. data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +7463 -0
  127. data/maps/bis-asm-Beng-Latn-13194-1991.imp +154 -0
  128. data/maps/bis-ben-Beng-Latn-13194-1991.imp +151 -0
  129. data/maps/bis-dev-Deva-Latn-13194-1991.imp +178 -0
  130. data/maps/bis-guj-Gujr-Latn-13194-1991.imp +172 -0
  131. data/maps/bis-kan-Kana-Latn-13194-1991.imp +166 -0
  132. data/maps/bis-mlm-Mlym-Latn-13194-1991.imp +170 -0
  133. data/maps/bis-ori-Orya-Latn-13194-1991.imp +168 -0
  134. data/maps/bis-pnj-Guru-Latn-13194-1991.imp +169 -0
  135. data/maps/bis-tel-Telu-Latn-13194-1991.imp +165 -0
  136. data/maps/bis-tml-Taml-Latn-13194-1991.imp +149 -0
  137. data/maps/by-bel-Cyrl-Latn-1998.imp +123 -0
  138. data/maps/by-bel-Cyrl-Latn-2007.imp +77 -0
  139. data/maps/din-grc-Grek-Latn-31634-2011-t1.imp +627 -0
  140. data/maps/din-hin-Deva-Latn-33904-2018.imp +101 -0
  141. data/maps/din-kat-Geor-Latn-32707-2010.imp +103 -0
  142. data/maps/din-mar-Deva-Latn-33904-2018.imp +83 -0
  143. data/maps/din-nep-Deva-Latn-33904-2018.imp +110 -0
  144. data/maps/din-pli-Deva-Latn-33904-2018.imp +72 -0
  145. data/maps/din-pra-Deva-Latn-33904-2018.imp +66 -0
  146. data/maps/din-san-Deva-Latn-33904-2018.imp +294 -0
  147. data/maps/din-tam-Taml-Latn-33903-2016.imp +187 -0
  148. data/maps/dos-nep-Deva-Latn-1997.imp +47 -0
  149. data/maps/elot-ell-Grek-Latn-743-1982-tl.imp +399 -0
  150. data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +397 -0
  151. data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +34 -0
  152. data/maps/elot-ell-Grek-Latn-743-2001-ts.imp +178 -0
  153. data/maps/ggg-kat-Geor-Latn-2002.imp +75 -0
  154. data/maps/gki-bel-Cyrl-Latn-1992.imp +44 -0
  155. data/maps/gki-bel-Cyrl-Latn-2000.imp +159 -0
  156. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +179 -0
  157. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.imp +132 -0
  158. data/maps/hk-yue-Hani-Latn-1888.imp +29201 -0
  159. data/maps/icao-bel-Cyrl-Latn-9303.imp +136 -0
  160. data/maps/icao-bul-Cyrl-Latn-9303.imp +127 -0
  161. data/maps/icao-fas-Arab-Latn-9303.imp +112 -0
  162. data/maps/icao-heb-Hebr-Latn-9303.imp +160 -0
  163. data/maps/icao-mkd-Cyrl-Latn-9303.imp +126 -0
  164. data/maps/icao-rus-Cyrl-Latn-9303.imp +126 -0
  165. data/maps/icao-srp-Cyrl-Latn-9303.imp +126 -0
  166. data/maps/icao-ukr-Cyrl-Latn-9303.imp +127 -0
  167. data/maps/iso-ara-Arab-Latn-233-1984.imp +301 -0
  168. data/maps/iso-asm-Beng-Latn-15919-2001.imp +73 -0
  169. data/maps/iso-ben-Beng-Latn-15919-2001.imp +171 -0
  170. data/maps/iso-ell-Grek-Latn-843-1997-t1.imp +365 -0
  171. data/maps/iso-ell-Grek-Latn-843-1997-t2.imp +43 -0
  172. data/maps/iso-guj-Gujr-Latn-15919-2001.imp +214 -0
  173. data/maps/iso-hin-Deva-Latn-15919-2001.imp +73 -0
  174. data/maps/iso-inc-Deva-Latn-15919-2001.imp +61 -0
  175. data/maps/iso-jpn-Hrkt-Latn-3602-1989.imp +59 -0
  176. data/maps/iso-kan-Kana-Latn-15919-2001.imp +212 -0
  177. data/maps/iso-kat-Geor-Latn-9984-1996.imp +103 -0
  178. data/maps/iso-kor-Hang-Latn-1996-method1.imp +140 -0
  179. data/maps/iso-kor-Hang-Latn-1996-method2.imp +132 -0
  180. data/maps/iso-mal-Mlym-Latn-15919-2001.imp +276 -0
  181. data/maps/iso-mar-Deva-Latn-15919-2001.imp +68 -0
  182. data/maps/iso-nep-Deva-Latn-15919-2001.imp +75 -0
  183. data/maps/iso-ori-Orya-Latn-15919-2001.imp +188 -0
  184. data/maps/iso-pan-Guru-Latn-15919-2001.imp +217 -0
  185. data/maps/iso-pli-Beng-Latn-15919-2001.imp +66 -0
  186. data/maps/iso-pli-Deva-Latn-15919-2001.imp +68 -0
  187. data/maps/iso-pli-Sinh-Latn-15919-2001.imp +211 -0
  188. data/maps/iso-pli-Thai-Latn-15919-2001.imp +47 -0
  189. data/maps/iso-pra-Deva-Latn-15919-2001.imp +60 -0
  190. data/maps/iso-prs-Arab-Latn-233-3-1999.imp +352 -0
  191. data/maps/iso-rus-Cyrl-Latn-9-1995.imp +279 -0
  192. data/maps/iso-san-Deva-Latn-15919-2001.imp +215 -0
  193. data/maps/iso-tam-Taml-Latn-15919-2001.imp +153 -0
  194. data/maps/iso-tel-Telu-Latn-15919-2001.imp +214 -0
  195. data/maps/iso-tha-Thai-Latn-11940-1998.imp +114 -0
  196. data/maps/kp-kor-Hang-Latn-2002.imp +540 -0
  197. data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +29005 -0
  198. data/maps/masm-mon-Cyrl-Latn-5217-2012.imp +136 -0
  199. data/maps/masm-mon-Latn-Cyrl-5217-2012.imp +162 -0
  200. data/maps/mext-jpn-Hrkt-Latn-1954.imp +403 -0
  201. data/maps/moct-kor-Hang-Latn-2000.imp +475 -0
  202. data/maps/mofa-jpn-Hrkt-Latn-1989.imp +484 -0
  203. data/maps/mv-div-Thaa-Latn-1987.imp +144 -0
  204. data/maps/mvd-bel-Cyrl-Latn-2008.imp +224 -0
  205. data/maps/mvd-bel-Cyrl-Latn-2010.imp +64 -0
  206. data/maps/mvd-rus-Cyrl-Latn-2008.imp +110 -0
  207. data/maps/mvd-rus-Cyrl-Latn-2010.imp +40 -0
  208. data/maps/odni-ara-Arab-Latn-2004.imp +106 -0
  209. data/maps/odni-ara-Arab-Latn-2015.imp +281 -0
  210. data/maps/odni-aze-Cyrl-Latn-2015.imp +158 -0
  211. data/maps/odni-bel-Cyrl-Latn-2015.imp +138 -0
  212. data/maps/odni-bul-Cyrl-Latn-2005.imp +90 -0
  213. data/maps/odni-bul-Cyrl-Latn-2015.imp +103 -0
  214. data/maps/odni-che-Cyrl-Latn-2015.imp +165 -0
  215. data/maps/odni-fas-Arab-Latn-2004.imp +268 -0
  216. data/maps/odni-fas-Arab-Latn-2015.imp +398 -0
  217. data/maps/odni-hin-Deva-Latn-2004.imp +180 -0
  218. data/maps/odni-hin-Deva-Latn-2015.imp +256 -0
  219. data/maps/odni-kat-Geor-Latn-2015.imp +76 -0
  220. data/maps/odni-kaz-Cyrl-Latn-2015.imp +164 -0
  221. data/maps/odni-kir-Cyrl-Latn-2015.imp +149 -0
  222. data/maps/odni-kor-Hang-Latn-2015.imp +307 -0
  223. data/maps/odni-mkd-Cyrl-Latn-2005.imp +28 -0
  224. data/maps/odni-mkd-Cyrl-Latn-2015.imp +124 -0
  225. data/maps/odni-prs-Arab-Latn-2004.imp +120 -0
  226. data/maps/odni-prs-Arab-Latn-2015.imp +225 -0
  227. data/maps/odni-pus-Arab-Latn-2011.imp +327 -0
  228. data/maps/odni-rus-Cyrl-Latn-2015.imp +79 -0
  229. data/maps/odni-srp-Cyrl-Latn-2005.imp +35 -0
  230. data/maps/odni-srp-Cyrl-Latn-2015.imp +130 -0
  231. data/maps/odni-tat-Cyrl-Latn-2015.imp +157 -0
  232. data/maps/odni-tgk-Cyrl-Latn-2015.imp +161 -0
  233. data/maps/odni-tuk-Cyrl-Latn-2015.imp +159 -0
  234. data/maps/odni-uig-Cyrl-Latn-2015.imp +151 -0
  235. data/maps/odni-ukr-Cyrl-Latn-2015.imp +136 -0
  236. data/maps/odni-urd-Arab-Latn-2015.imp +220 -0
  237. data/maps/odni-uzb-Cyrl-Latn-2015.imp +165 -0
  238. data/maps/sac-zho-Hans-Latn-1979.imp +20940 -0
  239. data/maps/sasm-mon-Mong-Latn-general-1978.imp +294 -0
  240. data/maps/sasm-mon-Mong-Latn-phonetic-1978.imp +261 -0
  241. data/maps/ses-ara-Arab-Latn-1930.imp +225 -0
  242. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.imp +171 -0
  243. data/maps/ua-ukr-Cyrl-Latn-1996.imp +149 -0
  244. data/maps/ua-ukr-Cyrl-Latn-2007.imp +69 -0
  245. data/maps/ua-ukr-Cyrl-Latn-2010.imp +128 -0
  246. data/maps/un-amh-Ethi-Latn-2016.imp +483 -0
  247. data/maps/un-ara-Arab-Latn-1971.imp +137 -0
  248. data/maps/un-ara-Arab-Latn-1972.imp +155 -0
  249. data/maps/un-ara-Arab-Latn-2017.imp +375 -0
  250. data/maps/un-asm-Beng-Latn-1972.imp +188 -0
  251. data/maps/un-bel-Cyrl-Latn-2007.imp +78 -0
  252. data/maps/un-ben-Beng-Latn-2016.imp +516 -0
  253. data/maps/un-ell-Grek-Latn-1987-phonetic.imp +437 -0
  254. data/maps/un-ell-Grek-Latn-1987-tl.imp +27 -0
  255. data/maps/un-ell-Grek-Latn-1987-ts.imp +269 -0
  256. data/maps/un-guj-Gujr-Latn-1972.imp +196 -0
  257. data/maps/un-hin-Deva-Latn-2016.imp +356 -0
  258. data/maps/un-kan-Kana-Latn-2016.imp +214 -0
  259. data/maps/un-mal-Mlym-Latn-1972.imp +215 -0
  260. data/maps/un-mar-Deva-Latn-2016.imp +96 -0
  261. data/maps/un-mon-Mong-Latn-general-2013.imp +170 -0
  262. data/maps/un-mon-Mong-Latn-phonetic-2013.imp +170 -0
  263. data/maps/un-nep-Deva-Latn-1972.imp +295 -0
  264. data/maps/un-nep-Deva-Latn-2013.imp +62 -0
  265. data/maps/un-ori-Orya-Latn-1972.imp +208 -0
  266. data/maps/un-pan-Guru-Latn-1972.imp +321 -0
  267. data/maps/un-prs-Arab-Latn-1967.imp +214 -0
  268. data/maps/un-rus-Cyrl-Latn-1987.imp +96 -0
  269. data/maps/un-sin-Sinh-Latn-1972.imp +193 -0
  270. data/maps/un-tam-Taml-Latn-1972.imp +173 -0
  271. data/maps/un-tel-Telu-Latn-1972.imp +229 -0
  272. data/maps/un-ukr-Cyrl-Latn-1998.imp +58 -0
  273. data/maps/un-ukr-Cyrl-Latn-2012.imp +95 -0
  274. data/maps/un-urd-Arab-Latn-1972.imp +290 -0
  275. data/maps/var-amh-Ethi-Latn-eae-2003.imp +414 -0
  276. data/maps/var-gez-Ethi-Latn-eae-2003.imp +54 -0
  277. data/maps/var-hin-Deva-Latn-hunterian-1872.imp +212 -0
  278. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.imp +399 -0
  279. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.imp +382 -0
  280. data/maps/var-kor-Hang-Hang-jamo.imp +11196 -0
  281. data/maps/var-kor-Hang-Latn-mr-1939.imp +574 -0
  282. data/maps/var-kor-Kore-Hang-2013.imp +59764 -0
  283. data/maps/var-kor-Kore-Latn-mr-1939.imp +36 -0
  284. data/maps/var-mar-Deva-Latn-hunterian-1872.imp +39 -0
  285. data/maps/var-mon-Mong-Latn-1930.imp +101 -0
  286. data/maps/var-mon-Mong-Latn-lessing.imp +181 -0
  287. data/maps/var-mon-Mong-Latn-vpmc.imp +182 -0
  288. data/maps/var-pra-Deva-Latn-iast-1912.imp +36 -0
  289. data/maps/var-san-Deva-Latn-iast-1912.imp +147 -0
  290. data/maps/var-zho-Hani-Latn-wd-1979.imp +27549 -0
  291. metadata +335 -0
@@ -0,0 +1,356 @@
1
+ metadata {
2
+ authority_id: ungegn
3
+ id: 2016
4
+ language: iso-639-2:hin
5
+ source_script: Deva
6
+ destination_script: Latn
7
+ name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Hindi Romanization, 1972
8
+ url: https://www.eki.ee/wgrs/rom1_hi.pdf
9
+ creation_date: 1972
10
+ confirmation_date: 2016
11
+ description: |
12
+ The United Nations recommended system was approved in 1972 (II/11) and amended in 1977
13
+ (III/12), based on a report prepared by D. N. Sharma. The tables and their corrections were
14
+ published in volume II of the conference reports.
15
+
16
+ There is no evidence of the use of the system either in India or in international cartographic
17
+ products. It was stated in 1987 that the appropriate resolution had not been implemented in
18
+ India and the Hunterian system was still in use in large-scale mapping.
19
+
20
+ Hindi uses the alphasyllabic script Devanāgarī whereby each character represents a syllable
21
+ rather than one sound. Vowels and diphthongs are marked in two ways: as independent
22
+ characters (used syllable-initially) and in an abbreviated form, to denote vowels after
23
+ consonants. The romanization table is unambiguous but the user would have to recognize
24
+ many ligatures not given in the original table (only three are given). The system is mostly
25
+ reversible but there may exist some ambiguities in the romanization of vowels (independent
26
+ vs. abbreviated characters) and consonants
27
+
28
+ notes:
29
+ - |
30
+ It is recommended that the vowel अ (a) should always be romanized except when it ends a
31
+ name. If a name ends with a consonant, the consonant should carry a sub-macron. Such
32
+ cases, however, will be very rare. For example, कानपुर Kānapur (not Kānapura), जगत्
33
+ Jagat.
34
+ - |
35
+ If each letter of a digraph or any two parts of a trigraph has a distinct independent sound
36
+ then it should be indicated by a hyphen, thus d-h.
37
+
38
+ ######################################## Additional Note ############################################################
39
+ # It is recommended that the vowel अ (a) should always be romanized except when it ends a #
40
+ # name. This scheme is not yet able to detect names. From the language pattern and the examples, #
41
+ # we found that when a word ends with a consonant it should be transliterated without its vowel, #
42
+ # so this map applies that rule to every word: if a word ends with a consonant, the ending 'a' is removed. #
43
+ #####################################################################################################################
44
+ }
45
+
46
+ tests {
47
+ test "दिल्ली", "dillī"
48
+ test "भारत", "bhārat"
49
+ test "परिपक्क", "paripakk"
50
+ test "जगत्", "jagat"
51
+ test "संख्या", "saṁkhyā"
52
+ test "गंभीर मरीजों के मामले में भारत दूसरे नंबर पर", "gaṁbhīr marījoṁ ke māmale meṁ bhārat dūsare naṁbar par"
53
+ test "कोरोना अपडेट्स", "koronā apaḍeṭs"
54
+ test "सीडीसी चीफ का बयान अहम", "sīḍīsī chīph kā bayān aham"
55
+ test "गूगल प्ले स्टोर पर पेटीएम की वापसी", "gūgal ple sṭor par peṭīem kī vāpasī"
56
+ test "भारत में गैंबलिंग की इजाजत नहीं", "bhārat meṁ gaiṁbaliṁg kī ijājat nahīṁ"
57
+ test "कोरोना वैक्सीन मुद्दे पर घिरे राष्ट्रपति; जो बाइडेन बोले- मुझे और देश को वैज्ञानिकों पर भरोसा है, डोनाल्ड ट्रम्प पर नहीं", "koronā vaiksīn mudde par ghire rāṣhṭrapati; jo bāiḍen bole- mujhe aur desh ko vaijñānikoṁ par bharosā hai, ḍonālḍ ṭramp par nahīṁ"
58
+ test "गूगल की कार्रवाई पर पेटीएम ने कहा था कि ऐप को अस्थायी तौर पर प्ले-स्टोर से हटाया गया है, आपके पैसे सुरक्षित हैं", "gūgal kī kārravāī par peṭīem ne kahā thā ki aip ko asthāyī taur par ple-sṭor se haṭāyā gayā hai, āpake paise surakṣhit haiṁ"
59
+ }
60
+
61
+
62
+ aliases {
+ # deva_characters_1: character class built from escapes only, so spelled out here:
+ # dependent vowel signs U+093E-U+0945, U+0947-U+0949, U+094B, U+094C,
+ # the space U+0020, and the virama (halanta) U+094D.
+ # The RULES section of the stage uses it as the `after:` condition of the rules
+ # that emit a consonant without its inherent "a" (e.g. "क" -> "k" instead of "ka").
63
+ def_alias deva_characters_1, any("\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d")
64
+ }
65
+
66
+ stage {
67
+
68
+ # RULES
69
+ sub "क" + maybe("="), "k", after: deva_characters_1
70
+ sub "क", "k", after: boundary
71
+
72
+ sub "ख" + maybe("="), "kh", after: deva_characters_1
73
+ sub "ख", "kh", after: boundary
74
+
75
+ sub "ग" + maybe("="), "g", after: deva_characters_1
76
+ sub "ग", "g", after: boundary
77
+
78
+ sub "घ" + maybe("="), "gh", after: deva_characters_1
79
+ sub "घ", "gh", after: boundary
80
+
81
+ sub "ङ" + maybe("="), "ṅ", after: deva_characters_1
82
+ sub "ङ", "ṅ", after: boundary
83
+
84
+ sub "च" + maybe("="), "ch", after: deva_characters_1
85
+ sub "च", "ch", after: boundary
86
+
87
+ sub "छ" + maybe("="), "chh", after: deva_characters_1
88
+ sub "छ", "chh", after: boundary
89
+
90
+ sub "ज" + maybe("="), "j", after: deva_characters_1
91
+ sub "ज", "j", after: boundary
92
+
93
+ sub "झ" + maybe("="), "jh", after: deva_characters_1
94
+ sub "झ", "jh", after: boundary
95
+
96
+ sub "ञ" + maybe("="), "ñ", after: deva_characters_1
97
+ sub "ञ", "ñ", after: boundary
98
+
99
+ sub "ट" + maybe("="), "ṭ", after: deva_characters_1
100
+ sub "ट", "ṭ", after: boundary
101
+
102
+ sub "ठ" + maybe("="), "ṭh", after: deva_characters_1
103
+ sub "ठ", "ṭh", after: boundary
104
+
105
+ sub "ड" + maybe("="), "ḍ", after: deva_characters_1
106
+ sub "ड", "ḍ", after: boundary
107
+
108
+ sub "ढ" + maybe("="), "ḍh", after: deva_characters_1
109
+ sub "ढ", "ḍh", after: boundary
110
+
111
+ sub "ण" + maybe("="), "ṇ", after: deva_characters_1
112
+ sub "ण", "ṇ", after: boundary
113
+
114
+ sub "त" + maybe("="), "t", after: deva_characters_1
115
+ sub "त", "t", after: boundary
116
+
117
+ sub "थ" + maybe("="), "th", after: deva_characters_1
118
+ sub "थ", "th", after: boundary
119
+
120
+ sub "द" + maybe("="), "d", after: deva_characters_1
121
+ sub "द", "d", after: boundary
122
+
123
+ sub "ध" + maybe("="), "dh", after: deva_characters_1
124
+ sub "ध", "dh", after: boundary
125
+
126
+ sub "न" + maybe("="), "n", after: deva_characters_1
127
+ sub "न", "n", after: boundary
128
+
129
+ sub "प" + maybe("="), "p", after: deva_characters_1
130
+ sub "प", "p", after: boundary
131
+
132
+ sub "फ" + maybe("="), "ph", after: deva_characters_1
133
+ sub "फ", "ph", after: boundary
134
+
135
+ sub "ब" + maybe("="), "b", after: deva_characters_1
136
+ sub "ब", "b", after: boundary
137
+
138
+ sub "भ" + maybe("="), "bh", after: deva_characters_1
139
+ sub "भ", "bh", after: boundary
140
+
141
+ sub "म" + maybe("="), "m", after: deva_characters_1
142
+ sub "म", "m", after: boundary
143
+
144
+ sub "य" + maybe("="), "y", after: deva_characters_1
145
+ sub "य", "y", after: boundary
146
+
147
+ sub "र" + maybe("="), "r", after: deva_characters_1
148
+ sub "र", "r", after: boundary
149
+
150
+ sub "ल" + maybe("="), "l", after: deva_characters_1
151
+ sub "ल", "l", after: boundary
152
+
153
+ sub "व" + maybe("="), "v", after: deva_characters_1
154
+ sub "व", "v", after: boundary
155
+
156
+ sub "श" + maybe("="), "sh", after: deva_characters_1
157
+ sub "श", "sh", after: boundary
158
+
159
+ sub "ष" + maybe("="), "ṣh", after: deva_characters_1
160
+ sub "ष", "ṣh", after: boundary
161
+
162
+ sub "स" + maybe("="), "s", after: deva_characters_1
163
+ sub "स", "s", after: boundary
164
+
165
+ sub "क़" + maybe("="), "q", after: deva_characters_1
166
+ sub "क़", "q", after: boundary
167
+
168
+ sub "ख़" + maybe("="), "ḳh", after: deva_characters_1
169
+ sub "ख़", "ḳh", after: boundary
170
+
171
+ sub "ग़" + maybe("="), "ġ", after: deva_characters_1 # dotted variant: must yield "ġ" (not "g"), as in the "ġa"/"ġ" table entries
172
+ sub "ग़", "ġ", after: boundary # word-final ग़: same letter, inherent "a" dropped
173
+
174
+ sub "ज़" + maybe("="), "z", after: deva_characters_1
175
+ sub "ज़", "z", after: boundary
176
+
177
+ sub "ड़" + maybe("="), "ṙ", after: deva_characters_1
178
+ sub "ड़", "ṙ", after: boundary
179
+
180
+ sub "ढ़" + maybe("="), "ṙh", after: deva_characters_1
181
+ sub "ढ़", "ṙh", after: boundary
182
+
183
+ sub "फ़" + maybe("="), "f", after: deva_characters_1
184
+ sub "फ़", "f", after: boundary
185
+
186
+ sub "ह" + maybe("="), "h", after: deva_characters_1
187
+ sub "ह", "h", after: boundary
188
+
189
+
190
+ # CHARACTERS
191
+ parallel {
192
+
193
+ # I. Independent vowel characters
194
+ sub "अ", "a"
195
+ sub "आ", "ā"
196
+ sub "इ", "i"
197
+ sub "ई", "ī"
198
+ sub "उ", "u"
199
+ sub "ऊ", "ū"
200
+ sub "ऋ", "ṛ"
201
+ sub "ॠ", "ṝ"
202
+ sub "ऌ", "l̤"
203
+ sub "ए", "e"
204
+ sub "ऐ", "ai"
205
+ sub "ओ", "o"
206
+ sub "औ", "au"
207
+
208
+ # II. Abbreviated vowel characters
209
+
210
+ sub "ा", "ā" # का
211
+ sub "ॉ", "ā̆" # additional mark: कॉ (replacement must not carry a trailing space, or a blank is inserted mid-word)
212
+ sub "ि", "i" # कि i
213
+ sub "ी", "ī" # की
214
+ sub "ु", "u" # कु
215
+ sub "ू", "ū" # कू
216
+ sub "ृ", "ṛ" # कृ
217
+ sub "े", "e" # के
218
+ sub "ै", "ai" # कै
219
+ sub "ो", "o" # को
220
+ sub "ौ", "au" # कौ
221
+
222
+
223
+ # Consonants (see Note 1)
224
+
225
+ # Gutturals
226
+ sub "क", "ka"
227
+ sub "ख", "kha"
228
+ sub "ग", "ga"
229
+ sub "घ", "gha"
230
+ sub "ङ", "ṅa"
231
+
232
+ # Palatals
233
+ sub "च", "cha"
234
+ sub "छ", "chha"
235
+ sub "ज", "ja"
236
+ sub "झ", "jha"
237
+ sub "ञ", "ña"
238
+
239
+ # Cerebrals
240
+ sub "ट", "ṭa"
241
+ sub "ठ", "ṭha"
242
+ sub "ड", "ḍa"
243
+ sub "ढ", "ḍha"
244
+ sub "ण", "ṇa"
245
+
246
+ # Dentals
247
+ sub "त", "ta"
248
+ sub "थ", "tha"
249
+ sub "द", "da"
250
+ sub "ध", "dha"
251
+ sub "न", "na"
252
+
253
+ # Labials
254
+ sub "प", "pa"
255
+ sub "फ", "pha"
256
+ sub "ब", "ba"
257
+ sub "भ", "bha"
258
+ sub "म", "ma"
259
+
260
+ # Semivowels
261
+ sub "य", "ya"
262
+ sub "र", "ra"
263
+ sub "ल", "la"
264
+ sub "व", "va"
265
+
266
+ # Sibilants
267
+ sub "श", "sha"
268
+ sub "ष", "ṣha"
269
+ sub "स", "sa"
270
+
271
+ # Dotted variants
272
+ sub "क़", "qa"
273
+ sub "ख़", "ḳha"
274
+ sub "ग़", "ġa"
275
+ sub "ज़", "za"
276
+ sub "ड़", "ṙa"
277
+ sub "ढ़", "ṙha"
278
+ sub "फ़", "fa"
279
+
280
+
281
+ # Aspirate
282
+ sub "ह", "ha"
283
+
284
+ # Anusvāra
285
+ sub "ं", "ṁ"
286
+
287
+ # Anunāsika
288
+ sub "ँ", "m̐"
289
+
290
+ # halanta
291
+ sub "्", ""
292
+
293
+ # bisharga
294
+ sub "ः", "ḥ"
295
+
296
+ # V. Ligatures (to cover all ligatures representable in Unicode)
297
+ # Implementing pronunciation without a vowel: क् k.
298
+
299
+ # Gutturals
300
+ sub "क्", "k"
301
+ sub "ख्", "kh"
302
+ sub "ग्", "g"
303
+ sub "घ्", "gh"
304
+ sub "ङ्", "ṅ"
305
+
306
+ # Palatals
307
+ sub "च्", "ch"
308
+ sub "छ्", "chh"
309
+ sub "ज्", "j"
310
+ sub "झ्", "jh"
311
+ sub "ञ्", "ñ"
312
+
313
+ # Cerebrals
314
+ sub "ट्", "ṭ"
315
+ sub "ठ्", "ṭh"
316
+ sub "ड्", "ḍ"
317
+ sub "ढ्", "ḍh"
318
+ sub "ण्", "ṇ"
319
+
320
+ # Dentals
321
+ sub "त्", "t"
322
+ sub "थ्", "th"
323
+ sub "द्", "d"
324
+ sub "ध्", "dh"
325
+ sub "न्", "n"
326
+
327
+ # Labials
328
+ sub "प्", "p"
329
+ sub "फ्", "ph"
330
+ sub "ब्", "b"
331
+ sub "भ्", "bh"
332
+ sub "म्", "m"
333
+
334
+ # Semivowels
335
+ sub "य्", "y"
336
+ sub "र्", "r"
337
+ sub "ल्", "l"
338
+ sub "व्", "v"
339
+
340
+ # Sibilants
341
+ sub "श्", "sh"
342
+ sub "ष्", "ṣh"
343
+ sub "स्", "s"
344
+
345
+ # Dotted variants
346
+ sub "क़्", "q"
347
+ sub "ख़्", "ḳh"
348
+ sub "ग़्", "ġ"
349
+ sub "ज़्", "z"
350
+ sub "ड़्", "ṙ"
351
+ sub "ढ़्", "ṙh"
352
+ sub "फ़्", "f"
353
+ }
354
+ compose
355
+ }
356
+
@@ -0,0 +1,214 @@
1
+ metadata {
2
+ authority_id: ungegn
3
+ id: 2016
4
+ language: iso-639-2:kan
5
+ source_script: Kana
6
+ destination_script: Latn
7
+ name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Kannada Romanization, 1972
8
+ url: https://www.eki.ee/wgrs/rom1_kn.pdf
9
+ creation_date: 1972
10
+ confirmation_date: 2016
11
+ description: |
12
+ The United Nations recommended system was approved in 1972 (II/11) and amended in 1977
13
+ (III/12), based on a report prepared by D. N. Sharma. The tables and their corrections were
14
+ published in volume II of the conference reports.
15
+
16
+ There is no evidence of the use of the system either in India or in international cartographic
17
+ products.
18
+
19
+ Kannada uses an alphasyllabic script whereby each character represents a syllable rather than
20
+ one sound. Vowels and diphthongs are marked in two ways: as independent characters (used
21
+ syllable-initially) and in an abbreviated form, to denote vowels after consonants. The
22
+ romanization table is unambiguous. The system is mostly reversible but there may exist some
23
+ ambiguities in the romanization of vowels (independent vs. abbreviated characters) and
24
+ consonants (combinations with subscript consonants vs. character sequences).
25
+
26
+ notes:
27
+ - |
28
+ While most consonants have a diacritic in the upper right corner of the character (like ಕ),
29
+ some do not, e.g. ಖ kha, ಜ ja, ನ na, ಬ ba, ಲ la.
30
+ - |
31
+ Combinations with r as the first component are written by adding a special symbol after the
32
+ second consonant: ರ್ಗ rga.
33
+ }
34
+
35
+ tests {
36
+ test "ಕರ್ಣಾಟಕ", "karṇāṭaka"
37
+ test "ಬೆಂಗಳೂರು", "bĕṁgaḷūru"
38
+ test "ಮಹಾರಾಷ್ಟ್ರದ ಯಾವುದೇ ಪ್ರಕರಣದ ತನಿಖೆಗೆ ಇನ್ನು ಸಿಬಿಐ ಪಡೆಯಬೇಕು ಅನುಮತಿ", "mahārāṣhṭrada yāvude prakaraṇada tanikhĕgĕ innu sibiai paḍĕyabeku anumati"
39
+ test "ಹರಕು ಬಾಯಿ: ಈಶ್ವರಪ್ಪಗೆ ಶಾಸಕ ಯತ್ನಾಳ ತಿರುಗೇಟು", "haraku bāyi: īshvarappagĕ shāsaka yatnāḷa tirugeṭu"
40
+ test "ಹಾಥರಸ್‌ ಪ್ರಕರಣ: ೨೯ರಂದು ರಾಷ್ಟ್ರವ್ಯಾಪಿ ಪ್ರತಿಭಟನೆಗೆ ಮಹಿಳಾ ಸಂಘಟನೆಗಳ ಕರೆ", "hātharas prakaraṇa: 29raṁdu rāṣhṭravyāpi pratibhaṭanĕgĕ mahiḷā saṁghaṭanĕgaḷa karĕ"
41
+ test "ಪೊಲೀಸ್‌ ಮಕ್ಕಳ ಶಾಲೆ ಮುಚ್ಚುವ ಯತ್ನಕ್ಕೆ ಹೊರಟ್ಟಿ ತೀವ್ರ ವಿರೋಧ", "pŏlīs makkaḷa shālĕ muchchuva yatnakkĕ hŏraṭṭi tīvra virodha"
42
+ test "ಅಮೆರಿಕ ಅಧ್ಯಕ್ಷೀಯ ಚುನಾವಣೆ: ಟ್ರಂಪ್‌–ಬೈಡನ್‌ ಅಂತಿಮ ಮುಖಾಮುಖಿಗೆ ವೇದಿಕೆ ಸಿದ್ಧ", "amĕrika adhyakṣhīya chunāvaṇĕ: ṭraṁp–baiḍan aṁtima mukhāmukhigĕ vedikĕ siddha"
43
+ test "ಅಂಜನಾದ್ರಿ ಆಂಜನೇಯನ ದರ್ಶನ ಪಡೆದ ಪವರ್ ಸ್ಟಾರ್ ಪುನೀತ್ ರಾಜ್ ಕುಮಾರ್", "aṁjanādri āṁjaneyana darshana paḍĕda pavar sṭār punīt rāj kumār"
44
+ test "ಇನ್ನು ಹಿಂದೂ ದೇವಸ್ಥಾನದ ಧಾರ್ಮಿಕ ಕಾರ್ಯದಲ್ಲಿ ಭಾಗಿಯಾಗಿದ್ದಕ್ಕೆ ಮೋಯಿದ್ದೀನ್ ಬಾವಾಗೆ ಬೆದರಿಕೆ ಒಡ್ಡಲಾಗಿದೆ", "innu hiṁdū devasthānada dhārmika kāryadalli bhāgiyāgiddakkĕ moyiddīn bāvāgĕ bĕdarikĕ ŏḍḍalāgidĕ"
45
+ test "ಇದು ಮೋದಿ ದೇಶ - ದನ ತಿಂದು ಹೋದ್ರೆ ಹುಷಾರ್ : ದೇಗುಲಕ್ಕೆ ಹೋಗಿದ್ದ ಬಾವಾಗೆ ಬೆದರಿಕೆ", "idu modi desha - dana tiṁdu hodrĕ huṣhār : degulakkĕ hogidda bāvāgĕ bĕdarikĕ"
46
+ }
47
+
48
+ aliases {
+ # characters_set1: character class built from escapes only, so spelled out here:
+ # Kannada dependent vowel signs U+0CBE-U+0CC3, U+0CC6-U+0CC8, U+0CCA-U+0CCC,
+ # and the virama U+0CCD.
+ # The RULES section of the stage uses it as the `after:` condition of the rules
+ # that emit a consonant without its inherent "a" (e.g. "ಕ" -> "k" instead of "ka").
49
+ def_alias characters_set1, any("\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd")
50
+ }
51
+
52
+ stage {
53
+
54
+ # RULES
55
+ # to cover consonants followed by a vowel sign or virama (i.e. consonants without the inherent vowel)
56
+ sub "ಕ", "k", after: characters_set1
57
+ sub "ಖ", "kh", after: characters_set1
58
+ sub "ಗ", "g", after: characters_set1
59
+ sub "ಘ", "gh", after: characters_set1
60
+ sub "ಙ", "ṅ", after: characters_set1
61
+ sub "ಚ", "ch", after: characters_set1
62
+ sub "ಛ", "chh", after: characters_set1
63
+ sub "ಜ", "j", after: characters_set1
64
+ sub "ಝ", "jh", after: characters_set1
65
+ sub "ಞ", "ñ", after: characters_set1
66
+ sub "ಟ", "ṭ", after: characters_set1
67
+ sub "ಠ", "ṭh", after: characters_set1
68
+ sub "ಡ", "ḍ", after: characters_set1
69
+ sub "ಢ", "ḍh", after: characters_set1
70
+ sub "ಣ", "ṇ", after: characters_set1
71
+ sub "ತ", "t", after: characters_set1
72
+ sub "ಥ", "th", after: characters_set1
73
+ sub "ದ", "d", after: characters_set1
74
+ sub "ಧ", "dh", after: characters_set1
75
+ sub "ನ", "n", after: characters_set1
76
+ sub "ಪ", "p", after: characters_set1
77
+ sub "ಫ", "ph", after: characters_set1
78
+ sub "ಬ", "b", after: characters_set1
79
+ sub "ಭ", "bh", after: characters_set1
80
+ sub "ಮ", "m", after: characters_set1
81
+ sub "ಯ", "y", after: characters_set1
82
+ sub "ರ", "r", after: characters_set1
83
+ sub "ಲ", "l", after: characters_set1
84
+ sub "ಳ", "ḷ", after: characters_set1
85
+ sub "ವ", "v", after: characters_set1
86
+ sub "ಶ", "sh", after: characters_set1
87
+ sub "ಷ", "ṣh", after: characters_set1
88
+ sub "ಸ", "s", after: characters_set1
89
+ sub "ಹ", "h", after: characters_set1
90
+
91
+
92
+ # CHARACTERS
93
+ parallel {
94
+ sub "ಅ", "a"
95
+ sub "ಆ", "ā"
96
+ sub "ಇ", "i"
97
+ sub "ಈ", "ī"
98
+ sub "ಉ", "u"
99
+ sub "ಊ", "ū"
100
+ sub "ಋ", "ṛ"
101
+
102
+ sub "ಎ", "ĕ"
103
+ sub "ಏ", "e"
104
+ sub "ಐ", "ai"
105
+
106
+ sub "ಒ", "ŏ"
107
+ sub "ಓ", "o"
108
+ sub "ಔ", "au"
109
+
110
+ # Gutturals
111
+ sub "ಕ", "ka"
112
+ sub "ಖ", "kha"
113
+ sub "ಗ", "ga"
114
+ sub "ಘ", "gha"
115
+ sub "ಙ", "ṅa"
116
+
117
+ # Palatals
118
+ sub "ಚ", "cha"
119
+ sub "ಛ", "chha"
120
+ sub "ಜ", "ja"
121
+ sub "ಝ", "jha"
122
+ sub "ಞ", "ña"
123
+
124
+ # Cerebrals
125
+ sub "ಟ", "ṭa"
126
+ sub "ಠ", "ṭha"
127
+ sub "ಡ", "ḍa"
128
+ sub "ಢ", "ḍha"
129
+ sub "ಣ", "ṇa"
130
+
131
+ # Dentals
132
+ sub "ತ", "ta"
133
+ sub "ಥ", "tha"
134
+ sub "ದ", "da"
135
+ sub "ಧ", "dha"
136
+ sub "ನ", "na"
137
+
138
+ # Labials
139
+ sub "ಪ", "pa"
140
+ sub "ಫ", "pha"
141
+ sub "ಬ", "ba"
142
+ sub "ಭ", "bha"
143
+ sub "ಮ", "ma"
144
+
145
+ # Semivowels
146
+ sub "ಯ", "ya"
147
+ sub "ರ", "ra"
148
+ sub "ಲ", "la"
149
+ sub "ಳ", "ḷa"
150
+
151
+
152
+ sub "ವ", "va"
153
+
154
+ # Sibilants
155
+ sub "ಶ", "sha"
156
+ sub "ಷ", "ṣha"
157
+ sub "ಸ", "sa"
158
+
159
+
160
+ # Aspirate
161
+ sub "ಹ", "ha"
162
+
163
+
164
+ # Bisarga
165
+ sub "ಃ", "ḥ"
166
+
167
+ # Anusvāra
168
+ sub "ಂ", "ṁ"
169
+
170
+ sub "\u0cbc", "" #nukta
171
+
172
+ # Medials # Needed for connecting consonants
173
+ sub "ಾ", "ā"
174
+ sub "ಿ", "i"
175
+ sub "ೀ", "ī"
176
+ sub "ು", "u"
177
+ sub "ೂ", "ū"
178
+ sub "ೃ", "ṛ"
179
+
180
+
181
+ sub "ೆ", "ĕ"
182
+ sub "ೇ", "e"
183
+ sub "ೈ", "ai"
184
+
185
+
186
+ sub "ೊ", "ŏ"
187
+ sub "ೋ", "o"
188
+ sub "ೌ", "au"
189
+
190
+
191
+ sub "्", ""
192
+ sub "़", ""
193
+ sub "್", "" # virama (U+0CCD): marks a consonant pronounced without a vowel; emits nothing itself
194
+ sub "‍", "" # no need for zero with joiner
195
+ sub "‌", "" # no need for zero with non joiner
196
+
197
+
198
+
199
+ # Digits
200
+
201
+ sub "೦", "0"
202
+ sub "೧", "1"
203
+ sub "೨", "2"
204
+ sub "೩", "3"
205
+ sub "೪", "4"
206
+ sub "೫", "5"
207
+ sub "೬", "6"
208
+ sub "೭", "7"
209
+ sub "೮", "8"
210
+ sub "೯", "9"
211
+ }
212
+
213
+ compose
214
+ }