interscript 0.1.3 → 0.1.9

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (294) hide show
  1. checksums.yaml +4 -4
  2. data/README.adoc +10 -11
  3. data/aliases.json +1 -0
  4. data/lib/interscript.rb +62 -59
  5. data/lib/interscript/command.rb +3 -2
  6. data/lib/interscript/fs.rb +96 -0
  7. data/lib/interscript/mapping.rb +36 -17
  8. data/lib/interscript/opal.rb +196 -0
  9. data/lib/interscript/opal/entrypoint.rb +20 -0
  10. data/lib/interscript/opal/exports.rb +11 -0
  11. data/lib/interscript/opal/maps.js.erb +8 -0
  12. data/lib/interscript/version.rb +1 -1
  13. data/maps/acadsin-zho-Hani-Latn-2002.yaml +6 -2
  14. data/maps/alalc-amh-Ethi-Latn-1997.yaml +513 -0
  15. data/maps/alalc-amh-Ethi-Latn-2011.yaml +138 -0
  16. data/maps/alalc-ara-Arab-Latn-1997.yaml +1287 -0
  17. data/maps/alalc-asm-Deva-Latn-1997.yaml +259 -0
  18. data/maps/alalc-asm-Deva-Latn-2012.yaml +55 -0
  19. data/maps/alalc-aze-Arab-Latn-1997.yaml +376 -0
  20. data/maps/alalc-aze-Cyrl-Latn-1997.yaml +145 -0
  21. data/maps/{alalc-bel-cyrl-latn-1997.yaml → alalc-bel-Cyrl-Latn-1997.yaml} +7 -3
  22. data/maps/alalc-ben-Beng-Latn-1997.yaml +291 -0
  23. data/maps/alalc-ben-Beng-Latn-2017.yaml +1 -1
  24. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +5 -1
  25. data/maps/alalc-div-Thaa-Latn-1997.yaml +211 -0
  26. data/maps/alalc-ell-Grek-Latn-1997.yaml +7 -4
  27. data/maps/alalc-ell-Grek-Latn-2010.yaml +3 -5
  28. data/maps/alalc-guj-Gujr-Latn-1997.yaml +266 -0
  29. data/maps/alalc-guj-Gujr-Latn-2011.yaml +64 -0
  30. data/maps/alalc-hin-Deva-Latn-1997.yaml +303 -0
  31. data/maps/alalc-hin-Deva-Latn-2011.yaml +65 -0
  32. data/maps/alalc-kan-Kana-Latn-1997.yaml +274 -0
  33. data/maps/alalc-kan-Kana-Latn-2011.yaml +63 -0
  34. data/maps/alalc-kat-Geok-Latn-1997.yaml +2 -3
  35. data/maps/alalc-kat-Geor-Latn-1997.yaml +5 -1
  36. data/maps/alalc-kor-Hang-Latn-1997.yaml +6 -2
  37. data/maps/alalc-mal-Mlym-Latn-1997.yaml +303 -0
  38. data/maps/alalc-mal-Mlym-Latn-2012.yaml +73 -0
  39. data/maps/alalc-mar-Deva-Latn-1997.yaml +189 -0
  40. data/maps/alalc-mar-Deva-Latn-2011.yaml +45 -0
  41. data/maps/{alalc-mkd-cyrl-latn-1997.yaml → alalc-mkd-Cyrl-Latn-1997.yaml} +1 -1
  42. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +1 -1
  43. data/maps/alalc-mon-Cyrl-Latn-1997.yaml +220 -0
  44. data/maps/alalc-ori-Orya-Latn-1997.yaml +284 -0
  45. data/maps/alalc-ori-Orya-Latn-2011.yaml +67 -0
  46. data/maps/alalc-pan-Guru-Latn-1997.yaml +256 -0
  47. data/maps/alalc-pan-Guru-Latn-2011.yaml +78 -0
  48. data/maps/alalc-per-Arab-Latn-1997.yaml +375 -0
  49. data/maps/alalc-pli-Deva-Latn-2012.yaml +144 -0
  50. data/maps/alalc-pra-Deva-Latn-2012.yaml +47 -0
  51. data/maps/alalc-rus-Cyrl-Latn-1997.yaml +225 -0
  52. data/maps/alalc-rus-Cyrl-Latn-2012.yaml +162 -0
  53. data/maps/alalc-san-Deva-Latn-2012.yaml +241 -0
  54. data/maps/alalc-sin-Sinh-Latn-1997.yaml +292 -0
  55. data/maps/alalc-sin-Sinh-Latn-2011.yaml +71 -0
  56. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +5 -1
  57. data/maps/{alalc-srp-cyrl-latn-2013.yaml → alalc-srp-Cyrl-Latn-2013.yaml} +1 -1
  58. data/maps/alalc-tam-Taml-Latn-1997.yaml +62 -0
  59. data/maps/alalc-tam-Taml-Latn-2011.yaml +58 -0
  60. data/maps/alalc-tel-Telu-Latn-1997.yaml +284 -0
  61. data/maps/alalc-tel-Telu-Latn-2011.yaml +64 -0
  62. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +5 -1
  63. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +1 -1
  64. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +1 -1
  65. data/maps/az-aze-Cyrl-Latn-1939.yaml +105 -0
  66. data/maps/az-aze-Cyrl-Latn-1958.yaml +45 -0
  67. data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +1 -2
  68. data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +1 -1
  69. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +1 -3
  70. data/maps/bgn-kor-Hang-Latn-1943.yaml +8 -4
  71. data/maps/bgn-kor-Kore-Latn-1943.yaml +4 -4
  72. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +1 -1
  73. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +1 -1
  74. data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +532 -0
  75. data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +598 -0
  76. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +1 -1
  77. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +111 -104
  78. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +188 -0
  79. data/maps/bgnpcgn-bal-Arab-Latn-2008.yaml +329 -0
  80. data/maps/{bgnpcgn-bel-cyrl-latn-1979.yaml → bgnpcgn-bel-Cyrl-Latn-1979.yaml} +5 -1
  81. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +14 -10
  82. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +5 -1
  83. data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +184 -0
  84. data/maps/bgnpcgn-div-Thaa-Latn-1988.yaml +75 -0
  85. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +8 -5
  86. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +5 -2
  87. data/maps/bgnpcgn-far-Latn-Latn-1964.yaml +28 -0
  88. data/maps/{bgnpcgn-per-Arab-Latn-1956.yaml → bgnpcgn-fas-Arab-Latn-1956.yaml} +5 -2
  89. data/maps/bgnpcgn-isl-Latn-Latn-1964.yaml +37 -0
  90. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +1 -1
  91. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +5 -1
  92. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +1 -2
  93. data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.yaml +247 -0
  94. data/maps/bgnpcgn-kir-Cyrl-Latn-1979.yaml +218 -0
  95. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +18 -18
  96. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +3 -3
  97. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +3 -3
  98. data/maps/bgnpcgn-kur-Arab-Latn-2007.yaml +249 -0
  99. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +5 -1
  100. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +2 -2
  101. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +223 -0
  102. data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +230 -0
  103. data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +338 -0
  104. data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +673 -0
  105. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +459 -0
  106. data/maps/bgnpcgn-pus-Arab-Latn-1968.yaml +377 -0
  107. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +168 -0
  108. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +5 -1
  109. data/maps/bgnpcgn-srp-Cyrl-Latn-1962.yaml +73 -0
  110. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +5 -1
  111. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +220 -0
  112. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +240 -0
  113. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +5 -2
  114. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +3 -92
  115. data/maps/bgnpcgn-urd-Arab-Latn-2007.yaml +459 -0
  116. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +127 -0
  117. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +82 -0
  118. data/maps/{bgnpcgn-chn-Hans-Latn-1979.yaml → bgnpcgn-zho-Hans-Latn-1979.yaml} +1 -1
  119. data/maps/bis-asm-Beng-Latn-13194-1991.yaml +159 -0
  120. data/maps/bis-ben-Beng-Latn-13194-1991.yaml +156 -0
  121. data/maps/bis-dev-Deva-Latn-13194-1991.yaml +184 -0
  122. data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +181 -0
  123. data/maps/bis-kan-Kana-Latn-13194-1991.yaml +173 -0
  124. data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +176 -0
  125. data/maps/bis-ori-Orya-Latn-13194-1991.yaml +175 -0
  126. data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +175 -0
  127. data/maps/bis-tel-Telu-Latn-13194-1991.yaml +170 -0
  128. data/maps/bis-tml-Taml-Latn-13194-1991.yaml +155 -0
  129. data/maps/by-bel-Cyrl-Latn-1998.yaml +9 -5
  130. data/maps/by-bel-Cyrl-Latn-2007.yaml +4 -4
  131. data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +899 -0
  132. data/maps/din-hin-Deva-Latn-33904-2018.yaml +100 -0
  133. data/maps/din-kat-Geor-Latn-32707-2010.yaml +145 -0
  134. data/maps/din-mar-Deva-Latn-33904-2018.yaml +84 -0
  135. data/maps/din-nep-Deva-Latn-33904-2018.yaml +119 -0
  136. data/maps/din-pli-Deva-Latn-33904-2018.yaml +75 -0
  137. data/maps/din-pra-Deva-Latn-33904-2018.yaml +63 -0
  138. data/maps/din-san-Deva-Latn-33904-2018.yaml +338 -0
  139. data/maps/din-tam-Taml-Latn-33903-2016.yaml +213 -0
  140. data/maps/dos-nep-Deva-Latn-1997.yaml +47 -0
  141. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +7 -8
  142. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +6 -7
  143. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +2 -3
  144. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +2 -3
  145. data/maps/ggg-kat-Geor-Latn-2002.yaml +5 -2
  146. data/maps/{gki-bel-cyrl-latn-1992.yaml → gki-bel-Cyrl-Latn-1992.yaml} +2 -2
  147. data/maps/{gki-bel-cyrl-latn-2000.yaml → gki-bel-Cyrl-Latn-2000.yaml} +2 -2
  148. data/maps/{gost-rus-cyrl-latn-16876-71-1983.yaml → gost-rus-Cyrl-Latn-16876-71-1983.yaml} +8 -4
  149. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +157 -0
  150. data/maps/hk-yue-Hani-Latn-1888.yaml +1 -1
  151. data/maps/icao-bel-Cyrl-Latn-9303.yaml +1 -6
  152. data/maps/icao-bul-Cyrl-Latn-9303.yaml +1 -5
  153. data/maps/{icao-per-Arab-Latn-9303.yaml → icao-fas-Arab-Latn-9303.yaml} +1 -2
  154. data/maps/icao-heb-Hebr-Latn-9303.yaml +1 -1
  155. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +1 -1
  156. data/maps/icao-rus-Cyrl-Latn-9303.yaml +1 -2
  157. data/maps/icao-srp-Cyrl-Latn-9303.yaml +1 -1
  158. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +1 -2
  159. data/maps/iso-ara-Arab-Latn-233-1984.yaml +323 -0
  160. data/maps/iso-asm-Beng-Latn-15919-2001.yaml +75 -0
  161. data/maps/iso-ben-Beng-Latn-15919-2001.yaml +175 -0
  162. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +11 -8
  163. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +8 -5
  164. data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +220 -0
  165. data/maps/iso-hin-Deva-Latn-15919-2001.yaml +87 -0
  166. data/maps/iso-inc-Deva-Latn-15919-2001.yaml +61 -0
  167. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +10 -6
  168. data/maps/iso-kan-Kana-Latn-15919-2001.yaml +220 -0
  169. data/maps/iso-kat-Geor-Latn-9984-1996.yaml +145 -0
  170. data/maps/iso-kor-Hang-Latn-1996-method1.yaml +240 -0
  171. data/maps/iso-kor-Hang-Latn-1996-method2.yaml +226 -0
  172. data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +281 -0
  173. data/maps/iso-mar-Deva-Latn-15919-2001.yaml +75 -0
  174. data/maps/iso-nep-Deva-Latn-15919-2001.yaml +87 -0
  175. data/maps/iso-ori-Orya-Latn-15919-2001.yaml +193 -0
  176. data/maps/iso-pan-Guru-Latn-15919-2001.yaml +222 -0
  177. data/maps/iso-pli-Beng-Latn-15919-2001.yaml +73 -0
  178. data/maps/iso-pli-Deva-Latn-15919-2001.yaml +74 -0
  179. data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +219 -0
  180. data/maps/iso-pli-Thai-Latn-15919-2001.yaml +55 -0
  181. data/maps/iso-pra-Deva-Latn-15919-2001.yaml +59 -0
  182. data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +366 -0
  183. data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +3 -4
  184. data/maps/iso-san-Deva-Latn-15919-2001.yaml +220 -0
  185. data/maps/iso-tam-Taml-Latn-15919-2001.yaml +159 -0
  186. data/maps/iso-tel-Telu-Latn-15919-2001.yaml +220 -0
  187. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +2 -2
  188. data/maps/kp-kor-Hang-Latn-2002.yaml +29 -21
  189. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +3 -3
  190. data/maps/masm-mon-Cyrl-Latn-5217-2012.yaml +163 -0
  191. data/maps/masm-mon-Latn-Cyrl-5217-2012.yaml +200 -0
  192. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +1 -1
  193. data/maps/moct-kor-Hang-Latn-2000.yaml +6 -2
  194. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +1 -1
  195. data/maps/mv-div-Thaa-Latn-1987.yaml +200 -0
  196. data/maps/mvd-bel-Cyrl-Latn-2008.yaml +225 -0
  197. data/maps/mvd-bel-Cyrl-Latn-2010.yaml +63 -0
  198. data/maps/mvd-rus-Cyrl-Latn-2008.yaml +109 -0
  199. data/maps/mvd-rus-Cyrl-Latn-2010.yaml +37 -0
  200. data/maps/odni-ara-Arab-Latn-2004.yaml +137 -0
  201. data/maps/odni-ara-Arab-Latn-2015.yaml +315 -0
  202. data/maps/odni-aze-Cyrl-Latn-2015.yaml +144 -0
  203. data/maps/odni-bel-Cyrl-Latn-2015.yaml +148 -0
  204. data/maps/odni-bul-Cyrl-Latn-2005.yaml +90 -0
  205. data/maps/odni-bul-Cyrl-Latn-2015.yaml +96 -0
  206. data/maps/odni-che-Cyrl-Latn-2015.yaml +169 -0
  207. data/maps/odni-fas-Arab-Latn-2004.yaml +276 -0
  208. data/maps/odni-fas-Arab-Latn-2015.yaml +406 -0
  209. data/maps/odni-hin-Deva-Latn-2004.yaml +182 -0
  210. data/maps/odni-hin-Deva-Latn-2015.yaml +258 -0
  211. data/maps/odni-kat-Geor-Latn-2015.yaml +2 -3
  212. data/maps/odni-kaz-Cyrl-Latn-2015.yaml +148 -0
  213. data/maps/odni-kir-Cyrl-Latn-2015.yaml +136 -0
  214. data/maps/odni-kor-Hang-Latn-2015.yaml +375 -0
  215. data/maps/odni-mkd-Cyrl-Latn-2005.yaml +21 -0
  216. data/maps/odni-mkd-Cyrl-Latn-2015.yaml +122 -0
  217. data/maps/odni-prs-Arab-Latn-2004.yaml +123 -0
  218. data/maps/odni-prs-Arab-Latn-2015.yaml +228 -0
  219. data/maps/odni-rus-Cyrl-Latn-2015.yaml +77 -0
  220. data/maps/odni-srp-Cyrl-Latn-2005.yaml +36 -0
  221. data/maps/odni-srp-Cyrl-Latn-2015.yaml +129 -0
  222. data/maps/odni-tat-Cyrl-Latn-2015.yaml +142 -0
  223. data/maps/odni-tgk-Cyrl-Latn-2015.yaml +148 -0
  224. data/maps/odni-tuk-Cyrl-Latn-2015.yaml +170 -0
  225. data/maps/odni-uig-Cyrl-Latn-2015.yaml +138 -0
  226. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +6 -2
  227. data/maps/odni-urd-Arab-Latn-2015.yaml +221 -0
  228. data/maps/odni-uzb-Cyrl-Latn-2015.yaml +166 -0
  229. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +5 -5
  230. data/maps/royin-tha-Thai-Latn-1968.yaml +9 -5
  231. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +5 -5
  232. data/maps/royin-tha-Thai-Latn-1999.yaml +8 -4
  233. data/maps/sac-zho-Hans-Latn-1979.yaml +5 -1
  234. data/maps/sasm-mon-Mong-Latn-general-1978.yaml +389 -0
  235. data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +354 -0
  236. data/maps/ses-ara-Arab-Latn-1930.yaml +283 -0
  237. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +1 -1
  238. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +6 -2
  239. data/maps/ua-ukr-Cyrl-Latn-2007.yaml +75 -0
  240. data/maps/ua-ukr-Cyrl-Latn-2010.yaml +192 -0
  241. data/maps/un-amh-Ethi-Latn-2016.yaml +602 -0
  242. data/maps/un-ara-Arab-Latn-1971.yaml +139 -0
  243. data/maps/un-ara-Arab-Latn-1972.yaml +159 -0
  244. data/maps/un-ara-Arab-Latn-2017.yaml +420 -0
  245. data/maps/un-asm-Beng-Latn-1972.yaml +223 -0
  246. data/maps/un-bel-Cyrl-Latn-2007.yaml +4 -4
  247. data/maps/un-ben-Beng-Latn-2016.yaml +1 -1
  248. data/maps/{un-ell-Grek-Latn-phonetic-1987.yaml → un-ell-Grek-Latn-1987-phonetic.yaml} +44 -44
  249. data/maps/un-ell-Grek-Latn-1987-tl.yaml +3 -4
  250. data/maps/un-ell-Grek-Latn-1987-ts.yaml +3 -4
  251. data/maps/un-guj-Gujr-Latn-1972.yaml +229 -0
  252. data/maps/un-hin-Deva-Latn-2016.yaml +316 -0
  253. data/maps/un-kan-Kana-Latn-2016.yaml +254 -0
  254. data/maps/un-mal-Mlym-Latn-1972.yaml +251 -0
  255. data/maps/un-mar-Deva-Latn-2016.yaml +102 -0
  256. data/maps/un-mon-Mong-Latn-general-2013.yaml +264 -0
  257. data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +264 -0
  258. data/maps/un-nep-Deva-Latn-1972.yaml +269 -0
  259. data/maps/un-nep-Deva-Latn-2013.yaml +74 -0
  260. data/maps/un-ori-Orya-Latn-1972.yaml +247 -0
  261. data/maps/un-pan-Guru-Latn-1972.yaml +402 -0
  262. data/maps/un-prs-Arab-Latn-1967.yaml +236 -0
  263. data/maps/un-rus-Cyrl-Latn-1987.yaml +2 -2
  264. data/maps/un-tam-Taml-Latn-1972.yaml +194 -0
  265. data/maps/un-tel-Telu-Latn-1972.yaml +270 -0
  266. data/maps/un-ukr-Cyrl-Latn-1998.yaml +53 -0
  267. data/maps/un-ukr-Cyrl-Latn-2012.yaml +162 -0
  268. data/maps/un-urd-Arab-Latn-1972.yaml +405 -0
  269. data/maps/var-amh-Ethi-Latn-eae-2003.yaml +466 -0
  270. data/maps/var-gez-Ethi-Latn-eae-2003.yaml +76 -0
  271. data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +221 -0
  272. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +1 -1
  273. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +1 -1
  274. data/maps/{nil-kor-Hang-Hang-jamo.yaml → var-kor-Hang-Hang-jamo.yaml} +4 -4
  275. data/maps/var-kor-Hang-Latn-mr-1939.yaml +4 -4
  276. data/maps/var-kor-Kore-Hang-2013.yaml +2 -2
  277. data/maps/var-kor-Kore-Latn-mr-1939.yaml +2 -3
  278. data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +43 -0
  279. data/maps/var-mon-Mong-Latn-1930.yaml +102 -0
  280. data/maps/var-mon-Mong-Latn-lessing.yaml +272 -0
  281. data/maps/var-mon-Mong-Latn-vpmc.yaml +274 -0
  282. data/maps/var-pra-Deva-Latn-iast-1912.yaml +30 -0
  283. data/maps/var-san-Deva-Latn-iast-1912.yaml +149 -0
  284. data/maps/var-tha-Thai-Thai-phonemic.yaml +6 -6
  285. data/maps/var-tha-Thai-Zsym-ipa.yaml +13 -13
  286. data/maps/{var-zho-Hani-Latn-1979.yaml → var-zho-Hani-Latn-wd-1979.yaml} +13 -9
  287. data/spec/interscript/filenames_spec.rb +21 -0
  288. data/spec/interscript_spec.rb +16 -5
  289. metadata +275 -27
  290. data/bin/interscript +0 -41
  291. data/bin/rspec +0 -29
  292. data/bin/setup +0 -8
  293. data/maps/un-mon-Mong-Latn-2013.yaml +0 -93
  294. data/maps/un-ukr-cyrl-latn-1998.yaml +0 -30
@@ -0,0 +1,64 @@
1
+ ---
2
+ authority_id: alalc
3
+ id: 2011
4
+ language: iso-639-2:guj
5
+ source_script: Gujr
6
+ destination_script: Latn
7
+ name: Gujarati Romanization, 2011
8
+ alias:
9
+ ogc11122:
10
+ code: guj_Gujr2Latn_ALA_2011
11
+ description: Gujarati ALA-Library of Congress 2011 System
12
+ url: https://www.loc.gov/catdir/cpso/romanization/gujarati.pdf
13
+ creation_date: 2011
14
+ description: |
15
+ ALA-LC Romanization table for Gujarati
16
+
17
+ notes:
18
+
19
+ - Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
20
+ vowels following a consonant can be found in grammars; no distinction between the two is
21
+ made in transliteration.
22
+
23
+ - |
24
+ The vowel a is implicit after all consonants and consonant clusters and is supplied in
25
+ transliteration, with the following exceptions:
26
+ a) when another vowel is indicated by its appropriate sign and
27
+ b) when the absence of any vowel is indicated by the subscript symbol ( ્ ) called halanta or
28
+ virāma.
29
+
30
+ - |
31
+ Exception: Anusvāra is transliterated by:
32
+ a) ṅ before gutturals,
33
+ b) ñ before palatals,
34
+ c) ṇ before cerebrals,
35
+ d) n before dentals, and
36
+ e) m before labials.
37
+
38
+ - When doubled, avagraha is transliterated by two apostrophes ( ’’ ).
39
+
40
+ tests:
41
+ - source: "મોર્ગન અને રસેલ ફ્લોપ રહ્યા"
42
+ expected: "mȏrgana anȇ rasȇla phlȏpa rahyā"
43
+ - source: "રોયલ ચેલેન્જર્સ બેંગલોરના કેપ્ટન વિરાટ કોહલીએ કોલકાતા નાઈટ રાઈડર્સ સામે શારજાહ ખાતે ટોસ જીતીને બેટિંગ લીધી છે."
44
+ expected: "rȏyala cȇlȇnjarsa bȇṅgalȏranā kȇpṭana virāṭa kȏhalīȇ kȏlakātā nāīṭa rāīḍarsa sāmȇ śārajāha khātȇ ṭȏsa jītīnȇ bȇṭiṅga līdhī chȇ."
45
+ - source: "અમદાવાદમાં ભણી ચૂકેલા શ્રીકાંત દાતાર પ્રતિષ્ઠિત હાર્વર્ડ બિઝનેસ સ્કૂલના ડીન બન્યા"
46
+ expected: "amadāvādamāṃ bhaṇī cūkȇlā śrīkānta dātāra pratishṭhita hārvarḍa bijhanȇsa skūlanā ḍīna banyā"
47
+ - source: "ઓગસ્ટ મહિનામાં મેન્યુફેક્ચરિંગ સેક્ટરનું ઉત્પાદન ગગડ્યુ"
48
+ expected: "ȏgasṭa mahināmāṃ mȇnyuphȇkcariṅga sȇkṭaranuṃ utpādana gagaḍyu"
49
+ - source: "૯૦ વર્ષમાં બે કરોડમાંથી પોણાબે લાખ કરોડ થઈ ગઈ ટાટા ગ્રુપમાં મિસ્ત્રી પરિવારની શેર્સ વેલ્યુ, જૂના સંબંધો અંત ભણી, જાણો કોને શું મળશે, કોણ શું ગુમાવશે?"
50
+ expected: "90 varshamāṃ bȇ karȏḍamānthī pȏṇābȇ lākha karȏḍa thaī gaī ṭāṭā grupamāṃ mistrī parivāranī śȇrsa vȇlyu, jūnā sambandhȏ anta bhaṇī, jāṇȏ kȏnȇ śuṃ maḷaśȇ, kȏṇa śuṃ gumāvaśȇ?"
51
+ - source: "મુંબઈના એક સ્ટોક બ્રોકરે જણાવ્યું કે ટાટા પોતાના શેર બહાર જતા રોકવા માટે SP ગ્રુપ સાથે સમજૂતી કરી શકે છે."
52
+ expected: "mumbaīnā ȇka sṭȏka brȏkarȇ jaṇāvyuṃ kȇ ṭāṭā pȏtānā śȇra bahāra jatā rȏkavā māṭȇ SP grupa sāthȇ samajūtī karī śakȇ chȇ."
53
+ - source: "કોલકાતા નાઈટ રાઈડર્સનો ઓફ સ્પિનર સુનીલ નારાયણ વિવાદમાં ફસાઈ ગયો છે"
54
+ expected: "kȏlakātā nāīṭa rāīḍarsanȏ ȏpha spinara sunīla nārāyaṇa vivādamāṃ phasāī gayȏ chȇ"
55
+ - source: "ટાટા અને મિસ્ત્રી પરિવાર વચ્ચે શેર્સની આપ-લે થાય એ માટે કોઈ પારસી વ્યક્તિને મધ્યસ્થી બનાવી શકાય છે અને આ માટે રતન ટાટા પણ પ્રયત્નો કરી શકે છે"
56
+ expected: "ṭāṭā anȇ mistrī parivāra vaccȇ śȇrsanī āpa-lȇ thāya ȇ māṭȇ kȏī pārasī vyaktinȇ madhyasthī banāvī śakāya chȇ anȇ ā māṭȇ ratana ṭāṭā paṇa prayatnȏ karī śakȇ chȇ"
57
+ - source: "મેદાની અમ્પાયરોએ પંજાબ વિરુદ્ધની મેચમાં તેની બોલિંગ એક્શન બાબતે શંકા વ્યક્ત કરી હતી. ફરિયાદ પછી હવે નારાયણને વોર્નિંગ લિસ્ટમાં નાખી દેવાયો છે"
58
+ expected: "mȇdānī ampāyarȏȇ pañjāba viruddhanī mȇcamāṃ tȇnī bȏliṅga ȇkśana bābatȇ śaṅkā vyakta karī hatī. phariyāda pachī havȇ nārāyaṇanȇ vȏrniṅga lisṭamāṃ nākhī dȇvāyȏ chȇ"
59
+ - source: "મોદી સરકારના આત્મનિર્ભર ભારત અભિયાનને સફળતા, પાંચ મહિનામાં ચીન સાથેની વેપાર ખાધ અડધી થઈ ગઈ, ચાઈનિઝ સ્માર્ટફોનની હિસ્સેદારી પણ ઘટી"
60
+ expected: "mȏdī sarakāranā ātmanirbhara bhārata abhiyānanȇ saphaḷatā, pāñca mahināmāṃ cīna sāthȇnī vȇpāra khādha aḍadhī thaī gaī, cāīnijha smārṭaphȏnanī hissȇdārī paṇa ghaṭī"
61
+
62
+ map:
63
+
64
+ inherit: 'alalc-guj-Gujr-Latn-1997'
@@ -0,0 +1,303 @@
1
+ ---
2
+ authority_id: alalc
3
+ id: 1997
4
+ language: iso-639-2:hin
5
+ source_script: Deva
6
+ destination_script: Latn
7
+ name: Hindi Romanization, 1997
8
+ alias:
9
+ ogc11122:
10
+ code: hin_Deva2Latn_ALA_1997
11
+ description: Hindi ALA-Library of Congress 1997 System
12
+ url: http://catdir.loc.gov/catdir/cpso/romanization/hindi.pdf
13
+ creation_date: 1997
14
+ description: |
15
+ ALA-LC Romanization table for Hindi
16
+
17
+ notes:
18
+
19
+ - Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
20
+ vowels following a consonant can be found in grammars; no distinction between the two is
21
+ made in transliteration.
22
+
23
+ - |
24
+ The vowel a is implicit after all consonants and consonant clusters and is supplied in
25
+ transliteration, with the following exceptions:
26
+
27
+ a) when another vowel is indicated by its appropriate sign; and
28
+ b) when the absence of any vowel is indicated by the subscript sign ( ◌् ) called halanta or
29
+ virāma.
30
+
31
+ - |
32
+ Exception: Anusvāra is transliterated by:
33
+
34
+ a) ṅ before gutturals,
35
+ b) ñ before palatals,
36
+ c) ṇ before cerebrals,
37
+ d) n before dentals, and
38
+ e) m before labials.
39
+
40
+ - Anunāsika before guttural, palatal, cerebral, and dental occlusives is transliterated n̐. Before
41
+ labials, sibilants, semivowels, aspirates, vowels, and in final position it is transliterated m̐.
42
+
43
+ - When doubled, avagraha is transliterated by two apostrophes ( ’’ ).
44
+
45
+ tests:
46
+ - source: "हम"
47
+ expected: "hama"
48
+ - source: "मीन"
49
+ expected: "mīna"
50
+ - source: "औसत"
51
+ expected: "ăusata"
52
+ - source: "माँऽऽऽ!"
53
+ expected: "mān̐’’’!"
54
+ - source: "माँ"
55
+ expected: "mām̐"
56
+ - source: "गंभीर मरीजों के मामले में भारत दूसरे नंबर पर"
57
+ expected: "gaṃbhīr marījoṃ ke māmale meṃ bhārat dūsare naṃbar para"
58
+ - source: "कोरोना अपडेट्स"
59
+ expected: "koronā apaḍeṭsa"
60
+ - source: "सीडीसी चीफ का बयान अहम"
61
+ expected: "sīḍīsī cīph kā bayān ahama"
62
+ - source: "गूगल प्ले स्टोर पर पेटीएम की वापसी"
63
+ expected: "gūgal ple sṭor par peṭīem kī vāpasī"
64
+ - source: "भारत में गैंबलिंग की इजाजत नहीं"
65
+ expected: "bhārat meṃ gaiṃbaliṃg kī ijājat nahīṃ"
66
+ - source: "कोरोना वैक्सीन मुद्दे पर घिरे राष्ट्रपति; जो बाइडेन बोले- मुझे और देश को वैज्ञानिकों पर भरोसा है, डोनाल्ड ट्रम्प पर नहीं"
67
+ expected: "koronā vaiksīn mudde par ghire rāshṭrapati; jo bāiḍen bole- mujhe ăur deś ko vaijñānikoṃ par bharosā hai, ḍonālḍ ṭramp par nahīṃ"
68
+ - source: "गूगल की कार्रवाई पर पेटीएम ने कहा था कि ऐप को अस्थायी तौर पर प्ले-स्टोर से हटाया गया है, आपके पैसे सुरक्षित हैं"
69
+ expected: "gūgal kī kārravāī par peṭīem ne kahā thā ki aip ko asthāyī tăur par ple-sṭor se haṭāyā gayā hai, āpake paise surakshit haiṃ"
70
+ - source: "२५६८७५४४६४४६१६११"
71
+ expected: "2568754464461611"
72
+
73
+ map:
74
+
75
+ rules:
76
+ # note[2]
77
+ - pattern: (क=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
78
+ result: 'k'
79
+ - pattern: (क़=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
80
+ result: 'q'
81
+ - pattern: (ख=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
82
+ result: 'kh'
83
+ - pattern: (ख़=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
84
+ result: 'kh'
85
+ - pattern: (ग=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
86
+ result: 'g'
87
+ - pattern: (ग़=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
88
+ result: 'gh'
89
+ - pattern: (घ=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
90
+ result: 'gh'
91
+ - pattern: (ङ=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
92
+ result: 'ṅ'
93
+ - pattern: (च=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
94
+ result: 'c'
95
+ - pattern: (छ=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
96
+ result: 'ch'
97
+ - pattern: (ज=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
98
+ result: 'j'
99
+ - pattern: (ज़=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
100
+ result: 'j'
101
+ - pattern: (झ=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
102
+ result: 'jh'
103
+ - pattern: (ञ=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
104
+ result: 'ñ'
105
+ - pattern: (ट=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
106
+ result: 'ṭ'
107
+ - pattern: (ट़=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
108
+ result: 't̤'
109
+ - pattern: (ठ=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
110
+ result: 'ṭh'
111
+ - pattern: (ड=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
112
+ result: 'ḍ'
113
+ - pattern: (ड़=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
114
+ result: 'ṛ'
115
+ - pattern: (ड़=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
116
+ result: 'ṛ'
117
+ - pattern: (ढ=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
118
+ result: 'ḍh'
119
+ - pattern: (ढ़=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
120
+ result: 'ṛh'
121
+ - pattern: (ण=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
122
+ result: 'ṇ'
123
+ - pattern: (त=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
124
+ result: 't'
125
+ - pattern: (थ=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
126
+ result: 'th'
127
+ - pattern: (द=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
128
+ result: 'd'
129
+ - pattern: (ध=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
130
+ result: 'dh'
131
+ - pattern: (न=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
132
+ result: 'n'
133
+ - pattern: (प=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
134
+ result: 'p'
135
+ - pattern: (फ=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
136
+ result: 'ph'
137
+ - pattern: (फ़=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
138
+ result: 'ph'
139
+ - pattern: (ब=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
140
+ result: 'b'
141
+ - pattern: (भ=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
142
+ result: 'bh'
143
+ - pattern: (म=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
144
+ result: 'm'
145
+ - pattern: (य=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
146
+ result: 'y'
147
+ - pattern: (र=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
148
+ result: 'r'
149
+ - pattern: (ल=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
150
+ result: 'l'
151
+ - pattern: (व=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
152
+ result: 'v'
153
+ - pattern: (श=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
154
+ result: 'ś'
155
+ - pattern: (ष=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
156
+ result: 'sh'
157
+ - pattern: (स=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
158
+ result: 's'
159
+ - pattern: (स़=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
160
+ result: 's̤'
161
+ - pattern: (ह=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
162
+ result: 'h'
163
+ - pattern: (ह़=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
164
+ result: 'h'
165
+
166
+ # note[3]
167
+ - pattern: \u0902(?=[कक़खख़गग़घङ])
168
+ result: ṅ
169
+ - pattern: \u0902(?=[चछजज़झञ])
170
+ result: ñ
171
+ - pattern: \u0902(?=[टट़ठडड़ढढ़ण])
172
+ result: ṇ
173
+ - pattern: \u0902(?=[तथदधन])
174
+ result: n
175
+ # note[4]
176
+ - pattern: (?<=)\u0901(?=\b)
177
+ result: "m̐"
178
+
179
+ characters:
180
+
181
+ # I. Vowels and Diphthongs (see Note 1)
182
+
183
+ 'अ': 'a'
184
+ 'आ': 'ā'
185
+ 'इ': 'i'
186
+ 'ई': 'ī'
187
+ 'उ': 'u'
188
+ 'ऊ': 'ū'
189
+ 'ऋ': 'ṛ'
190
+ 'ॠ': 'ṝ'
191
+ 'ऌ': 'ḷ'
192
+ 'ॳ': 'ĕ'
193
+ 'ए': 'e'
194
+ 'ॲ': 'ê'
195
+ 'अै': 'ăi'
196
+ 'ऐ': 'ai'
197
+ 'ऒ': 'ŏ'
198
+ 'ओ': 'o'
199
+ 'ऑ': 'ô'
200
+ 'औ': 'ău'
201
+
202
+ # II. Consonants (see Note 2)
203
+ # Gutturals
204
+ 'क': 'ka'
205
+ 'क़': 'qa'
206
+ 'ख': 'kha'
207
+ 'ख़': 'kha'
208
+ 'ग': 'ga'
209
+ 'ग़': 'gha'
210
+ 'घ': 'gha'
211
+ 'ङ': 'ṅa'
212
+
213
+ # Palatals
214
+ 'च': 'ca'
215
+ 'छ': 'cha'
216
+ 'ज': 'ja'
217
+ 'ज़': 'ja'
218
+ 'झ': 'jha'
219
+ 'ञ': 'ña'
220
+
221
+ # Cerebrals
222
+ 'ट': 'ṭa'
223
+ 'ट़': 't̤a'
224
+ 'ठ': 'ṭha'
225
+ 'ड': 'ḍa'
226
+ 'ड़': 'ṛa'
227
+ 'ड़': 'ṛa'
228
+ 'ढ': 'ḍha'
229
+ 'ढ़': 'ṛha'
230
+ 'ण': 'ṇa'
231
+
232
+ # Dentals
233
+ 'त': 'ta'
234
+ 'थ': 'tha'
235
+ 'द': 'da'
236
+ 'ध': 'dha'
237
+ 'न': 'na'
238
+
239
+ # Labials
240
+ 'प': 'pa'
241
+ 'फ': 'pha'
242
+ 'फ़': 'pha'
243
+ 'ब': 'ba'
244
+ 'भ': 'bha'
245
+ 'म': 'ma'
246
+
247
+ # Semivowels
248
+ 'य': 'ya'
249
+ 'र': 'ra'
250
+ 'ल': 'la'
251
+ 'व': 'va'
252
+
253
+ # Sibilants
254
+ 'श': 'śa'
255
+ 'ष': 'sha'
256
+ 'स': 'sa'
257
+ 'स़': 's̤a'
258
+
259
+ # Aspirate
260
+ 'ह': 'ha'
261
+ 'ह़': 'ha'
262
+
263
+ # Anusvāra
264
+ 'ं': 'ṃ'
265
+
266
+ # Visarga
267
+ 'ः ': 'ḥ'
268
+
269
+ # Anunāsika
270
+ 'ँ': 'n̐' # ँ : n̐, m̐
271
+
272
+ # Avagraha
273
+ 'ऽ': '’' # (apostrophe)
274
+
275
+ # Medials # Needed for connecting consonants
276
+ 'ा': "ā"
277
+ 'ॉ': "ô"
278
+ 'ि': "i"
279
+ 'ी': "ī"
280
+ 'ु': "u"
281
+ 'ू': "ū"
282
+ 'ृ': "ṛ"
283
+ 'ॄ': "ṝ"
284
+ 'े': "e"
285
+ 'ॊ': "ŏ"
286
+ 'ौ': "ău"
287
+ 'ै': "ai"
288
+ 'ो': "o"
289
+ '्': ""
290
+ '़': ""
291
+
292
+ # digits
293
+
294
+ '०': '0'
295
+ '१': '1'
296
+ '२': '2'
297
+ '३': '3'
298
+ '४': '4'
299
+ '५': '5'
300
+ '६': '6'
301
+ '७': '7'
302
+ '८': '8'
303
+ '९': '9'
@@ -0,0 +1,65 @@
1
+ ---
2
+ authority_id: alalc
3
+ id: 2011
4
+ language: iso-639-2:hin
5
+ source_script: Deva
6
+ destination_script: Latn
7
+ name: Hindi Romanization, 2011
8
+ url: https://www.loc.gov/catdir/cpso/romanization/hindi.pdf
9
+ creation_date: 2011
10
+ description: |
11
+ ALA-LC Romanization table for Hindi
12
+
13
+ notes:
14
+
15
+ - Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
16
+ vowels following a consonant can be found in grammars; no distinction between the two is
17
+ made in transliteration.
18
+
19
+ - |
20
+ The vowel a is implicit after all consonants and consonant clusters and is supplied in
21
+ transliteration, with the following exceptions:
22
+
23
+ a) when another vowel is indicated by its appropriate sign; and
24
+ b) when the absence of any vowel is indicated by the subscript sign ( ◌् ) called halanta or
25
+ virāma.
26
+
27
+ - |
28
+ Exception: Anusvāra is transliterated by:
29
+
30
+ a) ṅ before gutturals,
31
+ b) ñ before palatals,
32
+ c) ṇ before cerebrals,
33
+ d) n before dentals, and
34
+ e) m before labials.
35
+
36
+ - Anunāsika before guttural, palatal, cerebral, and dental occlusives is transliterated n̐. Before
37
+ labials, sibilants, semivowels, aspirates, vowels, and in final position it is transliterated m̐.
38
+
39
+ - When doubled, avagraha is transliterated by two apostrophes ( ’’ ).
40
+
41
+ tests:
42
+ - source: "इस चुनौतीपूर्ण समय में 'वर्क फ्रॉम होम’ सामान्य बन चुका है"
43
+ expected: "is cunăutīpūrṇ samay meṃ 'vark phrôm homa’ sāmāny ban cukā hai"
44
+ - source: "दिल्ली में त्योहार पर खरीददारी करने निकले बड़ी संख्या में लोग, कई जगहों पर लगा भीषण जाम"
45
+ expected: "dillī meṃ tyohār par kharīdadārī karane nikale baṛī saṃkhyā meṃ loga, kaī jagahoṃ par lagā bhīshaṇ jāma"
46
+ - source: "सरकार ने पेंशन भोगियों को लाइफ सर्टिफिकेट जमा कराने के मामले में दी बड़ी राहत"
47
+ expected: "sarakār ne peṃśan bhogiyoṃ ko lāiph sarṭiphikeṭ jamā karāne ke māmale meṃ dī baṛī rāhata"
48
+ - source: "कांग्रेस ने माना उसके लचर प्रदर्शन ने डुबोई महागठबंधन की लुटिया, पार्टी में उठने लगी आत्ममंथन की आवाज"
49
+ expected: "kāṃgres ne mānā usake lacar pradarśan ne ḍuboī mahāgaṭhabandhan kī luṭiyā, pārṭī meṃ uṭhane lagī ātmamanthan kī āvāja"
50
+ - source: "डिजिटल पेमेंट सिस्टम ने छोटे-मध्यम कारोबारों का दिया साथ, कोरोना की परेशानियों को किया कम"
51
+ expected: "ḍijiṭal pemeṃṭ sisṭam ne choṭe-madhyam kārobāroṃ kā diyā sātha, koronā kī pareśāniyoṃ ko kiyā kama"
52
+ - source: "छोटे व्यापारियों को ढूंढें, उनसे खरीदें और उनका साथ दें"
53
+ expected: "choṭe vyāpāriyoṃ ko ḍhūṃḍheṃ, unase kharīdeṃ ăur unakā sāth deṃ"
54
+ - source: "भारत के साथ साझीदारी को महत्व देंगे बाइडन, ओबामा प्रशासन में रहीं वरिष्ठ अधिकारी एलिसा ने जताई उम्मीद"
55
+ expected: "bhārat ke sāth sājhīdārī ko mahatv deṃge bāiḍana, obāmā praśāsan meṃ rahīṃ varishṭh adhikārī elisā ne jatāī ummīda"
56
+ - source: "दो महीने से कोमा में था युवक, चिकन की चर्चा सुनते ही आया होश"
57
+ expected: "do mahīne se komā meṃ thā yuvaka, cikan kī carcā sunate hī āyā hośa"
58
+ - source: "कोरोना के टीके पर खुशखबरी, भारत पहुंची रूसी वैक्सीन की पहली खेप"
59
+ expected: "koronā ke ṭīke par khuśakhabarī, bhārat pahuṃcī rūsī vaiksīn kī pahalī khepa"
60
+ - source: "दिल्ली के गांधी नगर स्थित एक दुकान में लगी भीषण आग, दमकल की 20 गाड़ियां मौके पर"
61
+ expected: "dillī ke gāṃdhī nagar sthit ek dukān meṃ lagī bhīshaṇ āga, damakal kī 20 gāṛiyāṃ măuke para"
62
+
63
+ map:
64
+
65
+ inherit: "alalc-hin-Deva-Latn-1997"
@@ -0,0 +1,274 @@
1
+ ---
2
+ authority_id: alalc
3
+ id: 1997
4
+ language: iso-639-2:kan
5
+ source_script: Knda
6
+ destination_script: Latn
7
+ name: Kannada Romanization, 1997
8
+ url: http://catdir.loc.gov/catdir/cpso/romanization/kannada.pdf
9
+ creation_date: 1997
10
+ description: |
11
+ ALA-LC Romanization table for Kannada
12
+
13
+ notes:
14
+
15
+ - Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
16
+ vowels following a consonant can be found in grammars; no distinction between the two is
17
+ made in transliteration.
18
+
19
+ - |
20
+ The vowel a is implicit after all consonants and consonant clusters and is supplied in
21
+ transliteration, with the following exceptions:
22
+
23
+ a) when another vowel is indicated by its appropriate sign; and
24
+ b) when the absence of any vowel is indicated by the superscript sign (◌್).
25
+
26
+ - |
27
+ Exception: Anusvāra is transliterated by:
28
+
29
+ a) ṅ before gutturals,
30
+ b) ñ before palatals,
31
+ c) ṇ before cerebrals,
32
+ d) n before dentals, and
33
+ e) m before labials.
34
+
35
+
36
+ tests:
37
+ - source: "ಕರ್ಣಾಟಕ"
38
+ expected: "karṇāṭaka"
39
+ - source: "ಬೆಂಗಳೂರು"
40
+ expected: "beṅgaḷūru"
41
+ - source: "ಉಡುಪಿಯಲ್ಲಿ ಪ್ರಪ್ರಥಮ ಬಾರಿಗೆ ಪ್ರಾರಂಭವಾಗಿರುವ ದೇಶಿ ಉತ್ಪನ್ನಗಳ ಮಳಿಗೆ"
42
+ expected: "uḍupiyalli praprathama bārige prāraṃbhavāgiruva dēśi utpannagaḷa maḷige"
43
+ - source: "ದೇವರ ಹೆಸರು ಬಳಸಿ ಆನ್‌ಲೈನ್‌ ಬೆಟ್ಟಿಂಗ್‌!"
44
+ expected: "dēvara hesaru baḷasi ānlain beṭṭiṃg!"
45
+ - source: "ಚಿಕ್ಕಮಗಳೂರು : ಪುಷ್ಪ ಸಮರ್ಪಣೆ ವೇಳೆ ಮಗಳನ್ನ ನೆನೆದು ಕಣ್ಣೀರಿಟ್ಟ ಮೃತ ಪೇದೆ ತಾಯಿ"
46
+ expected: "cikkamagaḷūru : puṣpa samarpaṇe vēḷe magaḷanna nenedu kaṇṇīriṭṭa mṛta pēde tāyi"
47
+ - source: "ಸ್ವಾಮಿತ್ವ: ಹೊಸ ಯೋಜನೆಯಿಂದ ನಮಗೆ ಏನು ಲಾಭ ?"
48
+ expected: "svāmitva: hosa yōjaneyinda namage ēnu lābha ?"
49
+ - source: "ಮರಳು ಸಾಗಾಣಿಕೆ ವ್ಯವಹಾರ ಆಗಬಾರದು :ಅಧಿಕಾರಿಗಳಿಗೆ ಖಡಕ್ ಸೂಚನೆ ನೀಡಿದ ಜಿಲ್ಲಾಧಿಕಾರಿ"
50
+ expected: "maraḷu sāgāṇike vyavahāra āgabāradu :adhikārigaḷige khaḍak sūcane nīḍida jillādhikāri"
51
+ - source: "ಹಾವೇರಿ ಜಿಲ್ಲೆಯಲ್ಲಿ ೯೭ ಜನರಲ್ಲಿ ಕೋವಿಡ್ ಸೋಂಕು ಪತ್ತೆ ; 54 ಮಂದಿ ಗುಣಮುಖ"
52
+ expected: "hāvēri jilleyalli 97 janaralli kōviḍ sōṃku patte ; 54 maṃdi guṇamukha"
53
+ - source: "ಸಿಂದಗಿ ಐಸಿಐಸಿಐ ಬ್ಯಾಂಕ್ ಸೆಕ್ಯುರಿಟಿ ಗಾರ್ಡ್ ಹತ್ಯೆ ಪ್ರಕರಣ ಭೇದಿಸಿದ ಪೊಲೀಸರು"
54
+ expected: "sindagi aisiaisiai byāṃk sekyuriṭi gārḍ hatye prakaraṇa bhēdisida polīsaru"
55
+ - source: "ಬ್ಯಾಂಕರ್‌ಗಳೊಂದಿಗೆ ಡಿವಿ ಸಭೆ : ಆಧ್ಯತಾ ವಲಯ, ಸಾಲ ಯೋಜನೆ ತ್ವರಿತ ಮಂಜೂರಿಗೆ ಸೂಚನೆ"
56
+ expected: "byāṅkargaḷoṃdige ḍivi sabhe : ādhyatā valaya, sāla yōjane tvarita maṃjūrige sūcane"
57
+ - source: "ಪೊಲೀಸ್‌ ಇಲಾಖೆ ಸಮಗ್ರ ಅಭಿವೃದ್ಧಿ; ಡಿಜಿಪಿ ನೇತೃತ್ವದಲ್ಲಿ ಸಮಿತಿ ರಚನೆ: ಬೊಮ್ಮಾಯಿ"
58
+ expected: "polīs ilākhe samagra abhivṛddhi; ḍijipi nētṛtvadalli samiti racane: beūmmāyi"
59
+ - source: "ಕೆಟ್ಟಿರುವ ರಸ್ತೆಗಳ ದುರಸ್ತಿಗೆ ಸರಕಾರದ ಯೋಜನೆ"
60
+ expected: "keṭṭiruva rastegaḷa durastige sarakārada yōjane"
61
+
62
+ map:
63
+
64
+
65
+ rules:
66
+ # Rule II: emit the bare consonant (no implicit 'a') when a vowel sign or virāma follows
67
+ - pattern: ([ಕ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
68
+ result: 'k'
69
+ - pattern: ([ಖ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
70
+ result: 'kh'
71
+ - pattern: ([ಗ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
72
+ result: 'g'
73
+ - pattern: ([ಘ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
74
+ result: 'gh'
75
+ - pattern: ([ಙ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
76
+ result: 'ṅ'
77
+ - pattern: ([ಚ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
78
+ result: 'c'
79
+ - pattern: ([ಛ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
80
+ result: 'ch'
81
+ - pattern: ([ಜ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
82
+ result: 'j'
83
+ - pattern: ([ಝ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
84
+ result: 'jh'
85
+ - pattern: ([ಞ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
86
+ result: 'ñ'
87
+ - pattern: ([ಟ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
88
+ result: 'ṭ'
89
+ - pattern: ([ಠ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
90
+ result: 'ṭh'
91
+ - pattern: ([ಡ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
92
+ result: 'ḍ'
93
+ - pattern: ([ಢ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
94
+ result: 'ḍh'
95
+ - pattern: ([ಣ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
96
+ result: 'ṇ'
97
+ - pattern: ([ತ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
98
+ result: 't'
99
+ - pattern: ([ಥ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
100
+ result: 'th'
101
+ - pattern: ([ದ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
102
+ result: 'd'
103
+ - pattern: ([ಧ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
104
+ result: 'dh'
105
+ - pattern: ([ನ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
106
+ result: 'n'
107
+ - pattern: ([ಪ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
108
+ result: 'p'
109
+ - pattern: ([ಫ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
110
+ result: 'ph'
111
+ - pattern: ([ಬ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
112
+ result: 'b'
113
+ - pattern: ([ಭ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
114
+ result: 'bh'
115
+ - pattern: ([ಮ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
116
+ result: 'm'
117
+ - pattern: ([ಯ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
118
+ result: 'y'
119
+ - pattern: ([ರ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
120
+ result: 'r'
121
+ - pattern: ([ಱ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
122
+ result: 'ṟ'
123
+ - pattern: ([ಲ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
124
+ result: 'l'
125
+ - pattern: ([ಳ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
126
+ result: 'ḷ'
127
+ - pattern: ([ೞ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
128
+ result: 'l̤'
129
+ - pattern: ([ವ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
130
+ result: 'v'
131
+ - pattern: ([ಶ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
132
+ result: 'ś'
133
+ - pattern: ([ಷ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
134
+ result: 'ṣ'
135
+ - pattern: ([ಸ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
136
+ result: 's'
137
+ - pattern: ([ಹ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
138
+ result: 'h'
139
+
140
+ # rule[III]
141
+ - pattern: \u0C82(?=[ಕಖಗಘಙ])
142
+ result: ṅ
143
+ - pattern: \u0C82(?=[ಚಛಜಝಞ])
144
+ result: ñ
145
+ - pattern: \u0C82(?=[ಟಠಡಢಣ])
146
+ result: ṇ
147
+ - pattern: \u0C82(?=[ತಥದಧನ])
148
+ result: n
149
+
150
+ characters:
151
+ 'ಅ': 'a'
152
+ 'ಆ': 'ā'
153
+ 'ಇ': 'i'
154
+ 'ಈ': 'ī'
155
+ 'ಉ': 'u'
156
+ 'ಊ': 'ū'
157
+ 'ಋ': 'ṛ'
158
+ 'ೠ': 'ṝ'
159
+
160
+ 'ಌ': 'ḻ'
161
+
162
+ 'ಎ': 'e'
163
+ 'ಏ': 'ē'
164
+ 'ಐ': 'ai'
165
+
166
+ 'ಒ': 'o'
167
+ 'ಓ': 'ō'
168
+ 'ಔ': 'au'
169
+
170
+ # Gutturals
171
+ 'ಕ': 'ka'
172
+ 'ಖ': 'kha'
173
+ 'ಗ': 'ga'
174
+ 'ಘ': 'gha'
175
+ 'ಙ': 'ṅa'
176
+
177
+ # Palatals
178
+ 'ಚ': 'ca'
179
+ 'ಛ': 'cha'
180
+ 'ಜ': 'ja'
181
+ 'ಝ': 'jha'
182
+ 'ಞ': 'ña'
183
+
184
+ # Cerebrals
185
+ 'ಟ': 'ṭa'
186
+ 'ಠ': 'ṭha'
187
+ 'ಡ': 'ḍa'
188
+ 'ಢ': 'ḍha'
189
+ 'ಣ': 'ṇa'
190
+
191
+ # Dentals
192
+ 'ತ': 'ta'
193
+ 'ಥ': 'tha'
194
+ 'ದ': 'da'
195
+ 'ಧ': 'dha'
196
+ 'ನ': 'na'
197
+
198
+ # Labials
199
+ 'ಪ': 'pa'
200
+ 'ಫ': 'pha'
201
+ 'ಬ': 'ba'
202
+ 'ಭ': 'bha'
203
+ 'ಮ': 'ma'
204
+
205
+ # Semivowels
206
+ 'ಯ': 'ya'
207
+ 'ರ': 'ra'
208
+ 'ಱ': 'ṟa'
209
+ 'ಲ': 'la'
210
+ 'ಳ': 'ḷa'
211
+ 'ೞ': 'l̤a'
212
+
213
+
214
+ 'ವ': 'va'
215
+
216
+ # Sibilants
217
+ 'ಶ': 'śa'
218
+ 'ಷ': 'ṣa'
219
+ 'ಸ': 'sa'
220
+
221
+
222
+ # Aspirate
223
+ 'ಹ': 'ha'
224
+
225
+
226
+ # Bisarga
227
+ 'ಃ': 'ḥ'
228
+
229
+ # Anusvāra
230
+ 'ಂ': 'ṃ'
231
+
232
+ '\u0cbc': '' #nukta
233
+
234
+ # Medials # Needed for connecting consonants
235
+ 'ಾ': "ā"
236
+ 'ಿ': "i"
237
+ 'ೀ': "ī"
238
+ 'ು': "u"
239
+ 'ೂ': "ū"
240
+ 'ೃ': "ṛ"
241
+ 'ೄ': "ṝ"
242
+ '\u0CE2': 'ḻ' # KANNADA VOWEL SIGN VOCALIC L ( ೢ)
243
+
244
+
245
+ 'ೆ': "e"
246
+ 'ೇ': "ē"
247
+ 'ೈ': "ai"
248
+
249
+
250
+ 'ೊ': 'o'
251
+ 'ೋ': 'ō'
252
+ 'ೌ': 'au'
253
+
254
+
255
+ '्': ''
256
+ '़': ''
257
+ '್': '' # used for pronunciation without vowel
258
+ "‍": '' # no need for zero-width joiner
259
+ "‌": '' # no need for zero-width non-joiner
260
+
261
+
262
+
263
+ # Digits
264
+
265
+ '೦': '0'
266
+ '೧': '1'
267
+ '೨': '2'
268
+ '೩': '3'
269
+ '೪': '4'
270
+ '೫': '5'
271
+ '೬': '6'
272
+ '೭': '7'
273
+ '೮': '8'
274
+ '೯': '9'