interscript-maps 2.0.5

Sign up to get free protection for your applications and to get access to all the features.
Files changed (291) hide show
  1. checksums.yaml +7 -0
  2. data/README.adoc +28 -0
  3. data/interscript-maps.gemspec +28 -0
  4. data/interscript-maps.yaml +235 -0
  5. data/libs/posix.iml +11 -0
  6. data/libs/unicode.iml +13 -0
  7. data/libs/var-Cyrl.iml +7 -0
  8. data/libs/var-kor.iml +17 -0
  9. data/maps-staging/royin-tha-Thai-Latn-1939-generic.imp +98 -0
  10. data/maps-staging/royin-tha-Thai-Latn-1968.imp +156 -0
  11. data/maps-staging/royin-tha-Thai-Latn-1999-chained.imp +161 -0
  12. data/maps-staging/royin-tha-Thai-Latn-1999.imp +78 -0
  13. data/maps-staging/var-tha-Thai-Thai-phonemic.imp +53 -0
  14. data/maps-staging/var-tha-Thai-Zsym-ipa.imp +273 -0
  15. data/maps/acadsin-zho-Hani-Latn-2002.imp +27515 -0
  16. data/maps/alalc-amh-Ethi-Latn-1997.imp +392 -0
  17. data/maps/alalc-amh-Ethi-Latn-2011.imp +85 -0
  18. data/maps/alalc-ara-Arab-Latn-1997.imp +1171 -0
  19. data/maps/alalc-asm-Deva-Latn-1997.imp +214 -0
  20. data/maps/alalc-asm-Deva-Latn-2012.imp +53 -0
  21. data/maps/alalc-aze-Arab-Latn-1997.imp +321 -0
  22. data/maps/alalc-aze-Cyrl-Latn-1997.imp +101 -0
  23. data/maps/alalc-bel-Cyrl-Latn-1997.imp +118 -0
  24. data/maps/alalc-ben-Beng-Latn-1997.imp +225 -0
  25. data/maps/alalc-ben-Beng-Latn-2017.imp +135 -0
  26. data/maps/alalc-bul-Cyrl-Latn-1997.imp +110 -0
  27. data/maps/alalc-div-Thaa-Latn-1997.imp +171 -0
  28. data/maps/alalc-ell-Grek-Latn-1997.imp +381 -0
  29. data/maps/alalc-ell-Grek-Latn-2010.imp +382 -0
  30. data/maps/alalc-guj-Gujr-Latn-1997.imp +223 -0
  31. data/maps/alalc-guj-Gujr-Latn-2011.imp +57 -0
  32. data/maps/alalc-hin-Deva-Latn-1997.imp +248 -0
  33. data/maps/alalc-hin-Deva-Latn-2011.imp +63 -0
  34. data/maps/alalc-kan-Kana-Latn-1997.imp +233 -0
  35. data/maps/alalc-kan-Kana-Latn-2011.imp +58 -0
  36. data/maps/alalc-kat-Geok-Latn-1997.imp +109 -0
  37. data/maps/alalc-kat-Geor-Latn-1997.imp +104 -0
  38. data/maps/alalc-kor-Hang-Latn-1997.imp +68 -0
  39. data/maps/alalc-mal-Mlym-Latn-1997.imp +260 -0
  40. data/maps/alalc-mal-Mlym-Latn-2012.imp +65 -0
  41. data/maps/alalc-mar-Deva-Latn-1997.imp +178 -0
  42. data/maps/alalc-mar-Deva-Latn-2011.imp +51 -0
  43. data/maps/alalc-mkd-Cyrl-Latn-1997.imp +125 -0
  44. data/maps/alalc-mkd-Cyrl-Latn-2013.imp +113 -0
  45. data/maps/alalc-mon-Cyrl-Latn-1997.imp +161 -0
  46. data/maps/alalc-ori-Orya-Latn-1997.imp +234 -0
  47. data/maps/alalc-ori-Orya-Latn-2011.imp +59 -0
  48. data/maps/alalc-pan-Guru-Latn-1997.imp +241 -0
  49. data/maps/alalc-pan-Guru-Latn-2011.imp +71 -0
  50. data/maps/alalc-per-Arab-Latn-1997.imp +318 -0
  51. data/maps/alalc-pli-Deva-Latn-2012.imp +140 -0
  52. data/maps/alalc-pra-Deva-Latn-2012.imp +52 -0
  53. data/maps/alalc-rus-Cyrl-Latn-1997.imp +165 -0
  54. data/maps/alalc-rus-Cyrl-Latn-2012.imp +107 -0
  55. data/maps/alalc-san-Deva-Latn-2012.imp +207 -0
  56. data/maps/alalc-sin-Sinh-Latn-1997.imp +246 -0
  57. data/maps/alalc-sin-Sinh-Latn-2011.imp +63 -0
  58. data/maps/alalc-srp-Cyrl-Latn-1997.imp +124 -0
  59. data/maps/alalc-srp-Cyrl-Latn-2013.imp +115 -0
  60. data/maps/alalc-tam-Taml-Latn-1997.imp +52 -0
  61. data/maps/alalc-tam-Taml-Latn-2011.imp +49 -0
  62. data/maps/alalc-tel-Telu-Latn-1997.imp +237 -0
  63. data/maps/alalc-tel-Telu-Latn-2011.imp +58 -0
  64. data/maps/alalc-ukr-Cyrl-Latn-1997.imp +123 -0
  65. data/maps/alalc-ukr-Cyrl-Latn-2011.imp +32 -0
  66. data/maps/apcbg-bul-Cyrl-Latn-1995.imp +194 -0
  67. data/maps/az-aze-Cyrl-Latn-1939.imp +105 -0
  68. data/maps/az-aze-Cyrl-Latn-1958.imp +50 -0
  69. data/maps/bas-rus-Cyrl-Latn-2017-bss.imp +160 -0
  70. data/maps/bas-rus-Cyrl-Latn-2017-oss.imp +165 -0
  71. data/maps/bgn-jpn-Hrkt-Latn-1962.imp +288 -0
  72. data/maps/bgn-kor-Hang-Latn-1943.imp +31 -0
  73. data/maps/bgn-kor-Kore-Latn-1943.imp +33 -0
  74. data/maps/bgna-bul-Cyrl-Latn-2006.imp +119 -0
  75. data/maps/bgna-bul-Cyrl-Latn-2009.imp +119 -0
  76. data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +393 -0
  77. data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +472 -0
  78. data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +125 -0
  79. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +111 -0
  80. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.imp +169 -0
  81. data/maps/bgnpcgn-bal-Arab-Latn-2008.imp +296 -0
  82. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.imp +200 -0
  83. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +137 -0
  84. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +38 -0
  85. data/maps/bgnpcgn-che-Cyrl-Latn-2008.imp +176 -0
  86. data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +56 -0
  87. data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +90 -0
  88. data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +71 -0
  89. data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +443 -0
  90. data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +269 -0
  91. data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +41 -0
  92. data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +28 -0
  93. data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +111 -0
  94. data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +42 -0
  95. data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +32 -0
  96. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +191 -0
  97. data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +116 -0
  98. data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +43 -0
  99. data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +193 -0
  100. data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +170 -0
  101. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +177 -0
  102. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +40 -0
  103. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +41 -0
  104. data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +240 -0
  105. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +132 -0
  106. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +174 -0
  107. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +168 -0
  108. data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +208 -0
  109. data/maps/bgnpcgn-per-Arab-Latn-1958.imp +312 -0
  110. data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +552 -0
  111. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +445 -0
  112. data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +289 -0
  113. data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +165 -0
  114. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +133 -0
  115. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +195 -0
  116. data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +48 -0
  117. data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +55 -0
  118. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +146 -0
  119. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +185 -0
  120. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +188 -0
  121. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +136 -0
  122. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +88 -0
  123. data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +333 -0
  124. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +145 -0
  125. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +74 -0
  126. data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +7463 -0
  127. data/maps/bis-asm-Beng-Latn-13194-1991.imp +154 -0
  128. data/maps/bis-ben-Beng-Latn-13194-1991.imp +151 -0
  129. data/maps/bis-dev-Deva-Latn-13194-1991.imp +178 -0
  130. data/maps/bis-guj-Gujr-Latn-13194-1991.imp +172 -0
  131. data/maps/bis-kan-Kana-Latn-13194-1991.imp +166 -0
  132. data/maps/bis-mlm-Mlym-Latn-13194-1991.imp +170 -0
  133. data/maps/bis-ori-Orya-Latn-13194-1991.imp +168 -0
  134. data/maps/bis-pnj-Guru-Latn-13194-1991.imp +169 -0
  135. data/maps/bis-tel-Telu-Latn-13194-1991.imp +165 -0
  136. data/maps/bis-tml-Taml-Latn-13194-1991.imp +149 -0
  137. data/maps/by-bel-Cyrl-Latn-1998.imp +123 -0
  138. data/maps/by-bel-Cyrl-Latn-2007.imp +77 -0
  139. data/maps/din-grc-Grek-Latn-31634-2011-t1.imp +627 -0
  140. data/maps/din-hin-Deva-Latn-33904-2018.imp +101 -0
  141. data/maps/din-kat-Geor-Latn-32707-2010.imp +103 -0
  142. data/maps/din-mar-Deva-Latn-33904-2018.imp +83 -0
  143. data/maps/din-nep-Deva-Latn-33904-2018.imp +110 -0
  144. data/maps/din-pli-Deva-Latn-33904-2018.imp +72 -0
  145. data/maps/din-pra-Deva-Latn-33904-2018.imp +66 -0
  146. data/maps/din-san-Deva-Latn-33904-2018.imp +294 -0
  147. data/maps/din-tam-Taml-Latn-33903-2016.imp +187 -0
  148. data/maps/dos-nep-Deva-Latn-1997.imp +47 -0
  149. data/maps/elot-ell-Grek-Latn-743-1982-tl.imp +399 -0
  150. data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +397 -0
  151. data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +34 -0
  152. data/maps/elot-ell-Grek-Latn-743-2001-ts.imp +178 -0
  153. data/maps/ggg-kat-Geor-Latn-2002.imp +75 -0
  154. data/maps/gki-bel-Cyrl-Latn-1992.imp +44 -0
  155. data/maps/gki-bel-Cyrl-Latn-2000.imp +159 -0
  156. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +179 -0
  157. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.imp +132 -0
  158. data/maps/hk-yue-Hani-Latn-1888.imp +29201 -0
  159. data/maps/icao-bel-Cyrl-Latn-9303.imp +136 -0
  160. data/maps/icao-bul-Cyrl-Latn-9303.imp +127 -0
  161. data/maps/icao-fas-Arab-Latn-9303.imp +112 -0
  162. data/maps/icao-heb-Hebr-Latn-9303.imp +160 -0
  163. data/maps/icao-mkd-Cyrl-Latn-9303.imp +126 -0
  164. data/maps/icao-rus-Cyrl-Latn-9303.imp +126 -0
  165. data/maps/icao-srp-Cyrl-Latn-9303.imp +126 -0
  166. data/maps/icao-ukr-Cyrl-Latn-9303.imp +127 -0
  167. data/maps/iso-ara-Arab-Latn-233-1984.imp +301 -0
  168. data/maps/iso-asm-Beng-Latn-15919-2001.imp +73 -0
  169. data/maps/iso-ben-Beng-Latn-15919-2001.imp +171 -0
  170. data/maps/iso-ell-Grek-Latn-843-1997-t1.imp +365 -0
  171. data/maps/iso-ell-Grek-Latn-843-1997-t2.imp +43 -0
  172. data/maps/iso-guj-Gujr-Latn-15919-2001.imp +214 -0
  173. data/maps/iso-hin-Deva-Latn-15919-2001.imp +73 -0
  174. data/maps/iso-inc-Deva-Latn-15919-2001.imp +61 -0
  175. data/maps/iso-jpn-Hrkt-Latn-3602-1989.imp +59 -0
  176. data/maps/iso-kan-Kana-Latn-15919-2001.imp +212 -0
  177. data/maps/iso-kat-Geor-Latn-9984-1996.imp +103 -0
  178. data/maps/iso-kor-Hang-Latn-1996-method1.imp +140 -0
  179. data/maps/iso-kor-Hang-Latn-1996-method2.imp +132 -0
  180. data/maps/iso-mal-Mlym-Latn-15919-2001.imp +276 -0
  181. data/maps/iso-mar-Deva-Latn-15919-2001.imp +68 -0
  182. data/maps/iso-nep-Deva-Latn-15919-2001.imp +75 -0
  183. data/maps/iso-ori-Orya-Latn-15919-2001.imp +188 -0
  184. data/maps/iso-pan-Guru-Latn-15919-2001.imp +217 -0
  185. data/maps/iso-pli-Beng-Latn-15919-2001.imp +66 -0
  186. data/maps/iso-pli-Deva-Latn-15919-2001.imp +68 -0
  187. data/maps/iso-pli-Sinh-Latn-15919-2001.imp +211 -0
  188. data/maps/iso-pli-Thai-Latn-15919-2001.imp +47 -0
  189. data/maps/iso-pra-Deva-Latn-15919-2001.imp +60 -0
  190. data/maps/iso-prs-Arab-Latn-233-3-1999.imp +352 -0
  191. data/maps/iso-rus-Cyrl-Latn-9-1995.imp +279 -0
  192. data/maps/iso-san-Deva-Latn-15919-2001.imp +215 -0
  193. data/maps/iso-tam-Taml-Latn-15919-2001.imp +153 -0
  194. data/maps/iso-tel-Telu-Latn-15919-2001.imp +214 -0
  195. data/maps/iso-tha-Thai-Latn-11940-1998.imp +114 -0
  196. data/maps/kp-kor-Hang-Latn-2002.imp +540 -0
  197. data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +29005 -0
  198. data/maps/masm-mon-Cyrl-Latn-5217-2012.imp +136 -0
  199. data/maps/masm-mon-Latn-Cyrl-5217-2012.imp +162 -0
  200. data/maps/mext-jpn-Hrkt-Latn-1954.imp +403 -0
  201. data/maps/moct-kor-Hang-Latn-2000.imp +475 -0
  202. data/maps/mofa-jpn-Hrkt-Latn-1989.imp +484 -0
  203. data/maps/mv-div-Thaa-Latn-1987.imp +144 -0
  204. data/maps/mvd-bel-Cyrl-Latn-2008.imp +224 -0
  205. data/maps/mvd-bel-Cyrl-Latn-2010.imp +64 -0
  206. data/maps/mvd-rus-Cyrl-Latn-2008.imp +110 -0
  207. data/maps/mvd-rus-Cyrl-Latn-2010.imp +40 -0
  208. data/maps/odni-ara-Arab-Latn-2004.imp +106 -0
  209. data/maps/odni-ara-Arab-Latn-2015.imp +281 -0
  210. data/maps/odni-aze-Cyrl-Latn-2015.imp +158 -0
  211. data/maps/odni-bel-Cyrl-Latn-2015.imp +138 -0
  212. data/maps/odni-bul-Cyrl-Latn-2005.imp +90 -0
  213. data/maps/odni-bul-Cyrl-Latn-2015.imp +103 -0
  214. data/maps/odni-che-Cyrl-Latn-2015.imp +165 -0
  215. data/maps/odni-fas-Arab-Latn-2004.imp +268 -0
  216. data/maps/odni-fas-Arab-Latn-2015.imp +398 -0
  217. data/maps/odni-hin-Deva-Latn-2004.imp +180 -0
  218. data/maps/odni-hin-Deva-Latn-2015.imp +256 -0
  219. data/maps/odni-kat-Geor-Latn-2015.imp +76 -0
  220. data/maps/odni-kaz-Cyrl-Latn-2015.imp +164 -0
  221. data/maps/odni-kir-Cyrl-Latn-2015.imp +149 -0
  222. data/maps/odni-kor-Hang-Latn-2015.imp +307 -0
  223. data/maps/odni-mkd-Cyrl-Latn-2005.imp +28 -0
  224. data/maps/odni-mkd-Cyrl-Latn-2015.imp +124 -0
  225. data/maps/odni-prs-Arab-Latn-2004.imp +120 -0
  226. data/maps/odni-prs-Arab-Latn-2015.imp +225 -0
  227. data/maps/odni-pus-Arab-Latn-2011.imp +327 -0
  228. data/maps/odni-rus-Cyrl-Latn-2015.imp +79 -0
  229. data/maps/odni-srp-Cyrl-Latn-2005.imp +35 -0
  230. data/maps/odni-srp-Cyrl-Latn-2015.imp +130 -0
  231. data/maps/odni-tat-Cyrl-Latn-2015.imp +157 -0
  232. data/maps/odni-tgk-Cyrl-Latn-2015.imp +161 -0
  233. data/maps/odni-tuk-Cyrl-Latn-2015.imp +159 -0
  234. data/maps/odni-uig-Cyrl-Latn-2015.imp +151 -0
  235. data/maps/odni-ukr-Cyrl-Latn-2015.imp +136 -0
  236. data/maps/odni-urd-Arab-Latn-2015.imp +220 -0
  237. data/maps/odni-uzb-Cyrl-Latn-2015.imp +165 -0
  238. data/maps/sac-zho-Hans-Latn-1979.imp +20940 -0
  239. data/maps/sasm-mon-Mong-Latn-general-1978.imp +294 -0
  240. data/maps/sasm-mon-Mong-Latn-phonetic-1978.imp +261 -0
  241. data/maps/ses-ara-Arab-Latn-1930.imp +225 -0
  242. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.imp +171 -0
  243. data/maps/ua-ukr-Cyrl-Latn-1996.imp +149 -0
  244. data/maps/ua-ukr-Cyrl-Latn-2007.imp +69 -0
  245. data/maps/ua-ukr-Cyrl-Latn-2010.imp +128 -0
  246. data/maps/un-amh-Ethi-Latn-2016.imp +483 -0
  247. data/maps/un-ara-Arab-Latn-1971.imp +137 -0
  248. data/maps/un-ara-Arab-Latn-1972.imp +155 -0
  249. data/maps/un-ara-Arab-Latn-2017.imp +375 -0
  250. data/maps/un-asm-Beng-Latn-1972.imp +188 -0
  251. data/maps/un-bel-Cyrl-Latn-2007.imp +78 -0
  252. data/maps/un-ben-Beng-Latn-2016.imp +516 -0
  253. data/maps/un-ell-Grek-Latn-1987-phonetic.imp +437 -0
  254. data/maps/un-ell-Grek-Latn-1987-tl.imp +27 -0
  255. data/maps/un-ell-Grek-Latn-1987-ts.imp +269 -0
  256. data/maps/un-guj-Gujr-Latn-1972.imp +196 -0
  257. data/maps/un-hin-Deva-Latn-2016.imp +356 -0
  258. data/maps/un-kan-Kana-Latn-2016.imp +214 -0
  259. data/maps/un-mal-Mlym-Latn-1972.imp +215 -0
  260. data/maps/un-mar-Deva-Latn-2016.imp +96 -0
  261. data/maps/un-mon-Mong-Latn-general-2013.imp +170 -0
  262. data/maps/un-mon-Mong-Latn-phonetic-2013.imp +170 -0
  263. data/maps/un-nep-Deva-Latn-1972.imp +295 -0
  264. data/maps/un-nep-Deva-Latn-2013.imp +62 -0
  265. data/maps/un-ori-Orya-Latn-1972.imp +208 -0
  266. data/maps/un-pan-Guru-Latn-1972.imp +321 -0
  267. data/maps/un-prs-Arab-Latn-1967.imp +214 -0
  268. data/maps/un-rus-Cyrl-Latn-1987.imp +96 -0
  269. data/maps/un-sin-Sinh-Latn-1972.imp +193 -0
  270. data/maps/un-tam-Taml-Latn-1972.imp +173 -0
  271. data/maps/un-tel-Telu-Latn-1972.imp +229 -0
  272. data/maps/un-ukr-Cyrl-Latn-1998.imp +58 -0
  273. data/maps/un-ukr-Cyrl-Latn-2012.imp +95 -0
  274. data/maps/un-urd-Arab-Latn-1972.imp +290 -0
  275. data/maps/var-amh-Ethi-Latn-eae-2003.imp +414 -0
  276. data/maps/var-gez-Ethi-Latn-eae-2003.imp +54 -0
  277. data/maps/var-hin-Deva-Latn-hunterian-1872.imp +212 -0
  278. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.imp +399 -0
  279. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.imp +382 -0
  280. data/maps/var-kor-Hang-Hang-jamo.imp +11196 -0
  281. data/maps/var-kor-Hang-Latn-mr-1939.imp +574 -0
  282. data/maps/var-kor-Kore-Hang-2013.imp +59764 -0
  283. data/maps/var-kor-Kore-Latn-mr-1939.imp +36 -0
  284. data/maps/var-mar-Deva-Latn-hunterian-1872.imp +39 -0
  285. data/maps/var-mon-Mong-Latn-1930.imp +101 -0
  286. data/maps/var-mon-Mong-Latn-lessing.imp +181 -0
  287. data/maps/var-mon-Mong-Latn-vpmc.imp +182 -0
  288. data/maps/var-pra-Deva-Latn-iast-1912.imp +36 -0
  289. data/maps/var-san-Deva-Latn-iast-1912.imp +147 -0
  290. data/maps/var-zho-Hani-Latn-wd-1979.imp +27549 -0
  291. metadata +335 -0
@@ -0,0 +1,57 @@
1
+ metadata {
2
+ authority_id: alalc
3
+ id: 2011
4
+ language: iso-639-2:guj
5
+ source_script: Gujr
6
+ destination_script: Latn
7
+ name: Gujarati Romanization, 2011
8
+ url: https://www.loc.gov/catdir/cpso/romanization/gujarati.pdf
9
+ creation_date: 2011
10
+ description: |
11
+ ALA-LC Romanization table for Gujarati
12
+
13
+ notes:
14
+
15
+ - Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
16
+ vowels following a consonant can be found in grammars; no distinction between the two is
17
+ made in transliteration.
18
+
19
+ - |
20
+ The vowel a is implicit after all consonants and consonant clusters and is supplied in
21
+ transliteration, with the following exceptions:
22
+ a) when another vowel is indicated by its appropriate sign and
23
+ b) when the absence of any vowel is indicated by the subscript symbol ( ્ ) called halanta or
24
+ virāma.
25
+
26
+ - |
27
+ Exception: Anusvāra is transliterated by:
28
+ a) ṅ before gutturals,
29
+ b) ñ before palatals,
30
+ c) ṇ before cerebrals,
31
+ d) n before dentals, and
32
+ e) m before labials.
33
+
34
+ - When doubled, avagraha is transliterated by two apostrophes ( ’’ ).
35
+ }
36
+
37
+ tests {
38
+ test "મોર્ગન અને રસેલ ફ્લોપ રહ્યા", "mȏrgana anȇ rasȇla phlȏpa rahyā"
39
+ test "રોયલ ચેલેન્જર્સ બેંગલોરના કેપ્ટન વિરાટ કોહલીએ કોલકાતા નાઈટ રાઈડર્સ સામે શારજાહ ખાતે ટોસ જીતીને બેટિંગ લીધી છે.", "rȏyala cȇlȇnjarsa bȇṅgalȏranā kȇpṭana virāṭa kȏhalīȇ kȏlakātā nāīṭa rāīḍarsa sāmȇ śārajāha khātȇ ṭȏsa jītīnȇ bȇṭiṅga līdhī chȇ."
40
+ test "અમદાવાદમાં ભણી ચૂકેલા શ્રીકાંત દાતાર પ્રતિષ્ઠિત હાર્વર્ડ બિઝનેસ સ્કૂલના ડીન બન્યા", "amadāvādamāṃ bhaṇī cūkȇlā śrīkānta dātāra pratishṭhita hārvarḍa bijhanȇsa skūlanā ḍīna banyā"
41
+ test "ઓગસ્ટ મહિનામાં મેન્યુફેક્ચરિંગ સેક્ટરનું ઉત્પાદન ગગડ્યુ", "ȏgasṭa mahināmāṃ mȇnyuphȇkcariṅga sȇkṭaranuṃ utpādana gagaḍyu"
42
+ test "૯૦ વર્ષમાં બે કરોડમાંથી પોણાબે લાખ કરોડ થઈ ગઈ ટાટા ગ્રુપમાં મિસ્ત્રી પરિવારની શેર્સ વેલ્યુ, જૂના સંબંધો અંત ભણી, જાણો કોને શું મળશે, કોણ શું ગુમાવશે?", "90 varshamāṃ bȇ karȏḍamānthī pȏṇābȇ lākha karȏḍa thaī gaī ṭāṭā grupamāṃ mistrī parivāranī śȇrsa vȇlyu, jūnā sambandhȏ anta bhaṇī, jāṇȏ kȏnȇ śuṃ maḷaśȇ, kȏṇa śuṃ gumāvaśȇ?"
43
+ test "મુંબઈના એક સ્ટોક બ્રોકરે જણાવ્યું કે ટાટા પોતાના શેર બહાર જતા રોકવા માટે SP ગ્રુપ સાથે સમજૂતી કરી શકે છે.", "mumbaīnā ȇka sṭȏka brȏkarȇ jaṇāvyuṃ kȇ ṭāṭā pȏtānā śȇra bahāra jatā rȏkavā māṭȇ SP grupa sāthȇ samajūtī karī śakȇ chȇ."
44
+ test "કોલકાતા નાઈટ રાઈડર્સનો ઓફ સ્પિનર સુનીલ નારાયણ વિવાદમાં ફસાઈ ગયો છે", "kȏlakātā nāīṭa rāīḍarsanȏ ȏpha spinara sunīla nārāyaṇa vivādamāṃ phasāī gayȏ chȇ"
45
+ test "ટાટા અને મિસ્ત્રી પરિવાર વચ્ચે શેર્સની આપ-લે થાય એ માટે કોઈ પારસી વ્યક્તિને મધ્યસ્થી બનાવી શકાય છે અને આ માટે રતન ટાટા પણ પ્રયત્નો કરી શકે છે", "ṭāṭā anȇ mistrī parivāra vaccȇ śȇrsanī āpa-lȇ thāya ȇ māṭȇ kȏī pārasī vyaktinȇ madhyasthī banāvī śakāya chȇ anȇ ā māṭȇ ratana ṭāṭā paṇa prayatnȏ karī śakȇ chȇ"
46
+ test "મેદાની અમ્પાયરોએ પંજાબ વિરુદ્ધની મેચમાં તેની બોલિંગ એક્શન બાબતે શંકા વ્યક્ત કરી હતી. ફરિયાદ પછી હવે નારાયણને વોર્નિંગ લિસ્ટમાં નાખી દેવાયો છે", "mȇdānī ampāyarȏȇ pañjāba viruddhanī mȇcamāṃ tȇnī bȏliṅga ȇkśana bābatȇ śaṅkā vyakta karī hatī. phariyāda pachī havȇ nārāyaṇanȇ vȏrniṅga lisṭamāṃ nākhī dȇvāyȏ chȇ"
47
+ test "મોદી સરકારના આત્મનિર્ભર ભારત અભિયાનને સફળતા, પાંચ મહિનામાં ચીન સાથેની વેપાર ખાધ અડધી થઈ ગઈ, ચાઈનિઝ સ્માર્ટફોનની હિસ્સેદારી પણ ઘટી", "mȏdī sarakāranā ātmanirbhara bhārata abhiyānanȇ saphaḷatā, pāñca mahināmāṃ cīna sāthȇnī vȇpāra khādha aḍadhī thaī gaī, cāīnijha smārṭaphȏnanī hissȇdārī paṇa ghaṭī"
48
+ }
49
+
50
+ dependency "alalc-guj-Gujr-Latn-1997", as: gujrlatn
51
+
52
+ stage {
53
+
54
+ run map.gujrlatn.stage.main
55
+
56
+ }
57
+
@@ -0,0 +1,248 @@
1
+ metadata {
2
+ authority_id: alalc
3
+ id: 1997
4
+ language: iso-639-2:hin
5
+ source_script: Deva
6
+ destination_script: Latn
7
+ name: Hindi Romanization, 1997
8
+ url: http://catdir.loc.gov/catdir/cpso/romanization/hindi.pdf
9
+ creation_date: 1997
10
+ description: |
11
+ ALA-LC Romanization table for Hindi
12
+
13
+ notes:
14
+
15
+ - Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
16
+ vowels following a consonant can be found in grammars; no distinction between the two is
17
+ made in transliteration.
18
+
19
+ - |
20
+ The vowel a is implicit after all consonants and consonant clusters and is supplied in
21
+ transliteration, with the following exceptions:
22
+
23
+ a) when another vowel is indicated by its appropriate sign; and
24
+ b) when the absence of any vowel is indicated by the subscript sign ( ◌् ) called halanta or
25
+ virāma.
26
+
27
+ - |
28
+ Exception: Anusvāra is transliterated by:
29
+
30
+ a) ṅ before gutturals,
31
+ b) ñ before palatals,
32
+ c) ṇ before cerebrals,
33
+ d) n before dentals, and
34
+ e) m before labials.
35
+
36
+ - Anunāsika before guttural, palatal, cerebral, and dental occlusives is transliterated n̐. Before
37
+ labials, sibilants, semivowels, aspirates, vowels, and in final position it is transliterated m̐.
38
+
39
+ - When doubled, avagraha is transliterated by two apostrophes ( ’’ ).
40
+ }
41
+
42
+ tests {
43
+ test "हम", "hama"
44
+ test "मीन", "mīna"
45
+ test "औसत", "ăusata"
46
+ test "माँऽऽऽ!", "mān̐’’’!"
47
+ test "माँ", "mām̐"
48
+ test "गंभीर मरीजों के मामले में भारत दूसरे नंबर पर", "gaṃbhīr marījoṃ ke māmale meṃ bhārat dūsare naṃbar para"
49
+ test "कोरोना अपडेट्स", "koronā apaḍeṭsa"
50
+ test "सीडीसी चीफ का बयान अहम", "sīḍīsī cīph kā bayān ahama"
51
+ test "गूगल प्ले स्टोर पर पेटीएम की वापसी", "gūgal ple sṭor par peṭīem kī vāpasī"
52
+ test "भारत में गैंबलिंग की इजाजत नहीं", "bhārat meṃ gaiṃbaliṃg kī ijājat nahīṃ"
53
+ test "कोरोना वैक्सीन मुद्दे पर घिरे राष्ट्रपति; जो बाइडेन बोले- मुझे और देश को वैज्ञानिकों पर भरोसा है, डोनाल्ड ट्रम्प पर नहीं", "koronā vaiksīn mudde par ghire rāshṭrapati; jo bāiḍen bole- mujhe ăur deś ko vaijñānikoṃ par bharosā hai, ḍonālḍ ṭramp par nahīṃ"
54
+ test "गूगल की कार्रवाई पर पेटीएम ने कहा था कि ऐप को अस्थायी तौर पर प्ले-स्टोर से हटाया गया है, आपके पैसे सुरक्षित हैं", "gūgal kī kārravāī par peṭīem ne kahā thā ki aip ko asthāyī tăur par ple-sṭor se haṭāyā gayā hai, āpake paise surakshit haiṃ"
55
+ test "२५६८७५४४६४४६१६११", "2568754464461611"
56
+ }
57
+
58
+ aliases {
59
+ def_alias hin_cons_or_conscluster, any("\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d")
60
+ }
61
+
62
+ stage {
63
+
64
+ # RULES
65
+ # note[2]
66
+ sub capture("क" + maybe("=")), "k", after: hin_cons_or_conscluster
67
+ sub capture("क़" + maybe("=")), "q", after: hin_cons_or_conscluster
68
+ sub capture("ख" + maybe("=")), "kh", after: hin_cons_or_conscluster
69
+ sub capture("ख़" + maybe("=")), "kh", after: hin_cons_or_conscluster
70
+ sub capture("ग" + maybe("=")), "g", after: hin_cons_or_conscluster
71
+ sub capture("ग़" + maybe("=")), "gh", after: hin_cons_or_conscluster
72
+ sub capture("घ" + maybe("=")), "gh", after: hin_cons_or_conscluster
73
+ sub capture("ङ" + maybe("=")), "ṅ", after: hin_cons_or_conscluster
74
+ sub capture("च" + maybe("=")), "c", after: hin_cons_or_conscluster
75
+ sub capture("छ" + maybe("=")), "ch", after: hin_cons_or_conscluster
76
+ sub capture("ज" + maybe("=")), "j", after: hin_cons_or_conscluster
77
+ sub capture("ज़" + maybe("=")), "j", after: hin_cons_or_conscluster
78
+ sub capture("झ" + maybe("=")), "jh", after: hin_cons_or_conscluster
79
+ sub capture("ञ" + maybe("=")), "ñ", after: hin_cons_or_conscluster
80
+ sub capture("ट" + maybe("=")), "ṭ", after: hin_cons_or_conscluster
81
+ sub capture("ट़" + maybe("=")), "t̤", after: hin_cons_or_conscluster
82
+ sub capture("ठ" + maybe("=")), "ṭh", after: hin_cons_or_conscluster
83
+ sub capture("ड" + maybe("=")), "ḍ", after: hin_cons_or_conscluster
84
+ sub capture("ड़" + maybe("=")), "ṛ", after: hin_cons_or_conscluster
85
+ sub capture("ड़" + maybe("=")), "ṛ", after: hin_cons_or_conscluster
86
+ sub capture("ढ" + maybe("=")), "ḍh", after: hin_cons_or_conscluster
87
+ sub capture("ढ़" + maybe("=")), "ṛh", after: hin_cons_or_conscluster
88
+ sub capture("ण" + maybe("=")), "ṇ", after: hin_cons_or_conscluster
89
+ sub capture("त" + maybe("=")), "t", after: hin_cons_or_conscluster
90
+ sub capture("थ" + maybe("=")), "th", after: hin_cons_or_conscluster
91
+ sub capture("द" + maybe("=")), "d", after: hin_cons_or_conscluster
92
+ sub capture("ध" + maybe("=")), "dh", after: hin_cons_or_conscluster
93
+ sub capture("न" + maybe("=")), "n", after: hin_cons_or_conscluster
94
+ sub capture("प" + maybe("=")), "p", after: hin_cons_or_conscluster
95
+ sub capture("फ" + maybe("=")), "ph", after: hin_cons_or_conscluster
96
+ sub capture("फ़" + maybe("=")), "ph", after: hin_cons_or_conscluster
97
+ sub capture("ब" + maybe("=")), "b", after: hin_cons_or_conscluster
98
+ sub capture("भ" + maybe("=")), "bh", after: hin_cons_or_conscluster
99
+ sub capture("म" + maybe("=")), "m", after: hin_cons_or_conscluster
100
+ sub capture("य" + maybe("=")), "y", after: hin_cons_or_conscluster
101
+ sub capture("र" + maybe("=")), "r", after: hin_cons_or_conscluster
102
+ sub capture("ल" + maybe("=")), "l", after: hin_cons_or_conscluster
103
+ sub capture("व" + maybe("=")), "v", after: hin_cons_or_conscluster
104
+ sub capture("श" + maybe("=")), "ś", after: hin_cons_or_conscluster
105
+ sub capture("ष" + maybe("=")), "sh", after: hin_cons_or_conscluster
106
+ sub capture("स" + maybe("=")), "s", after: hin_cons_or_conscluster
107
+ sub capture("स़" + maybe("=")), "s̤", after: hin_cons_or_conscluster
108
+ sub capture("ह" + maybe("=")), "h", after: hin_cons_or_conscluster
109
+ sub capture("ह़" + maybe("=")), "h", after: hin_cons_or_conscluster
110
+
111
+ # note[3]
112
+ sub "\u0902", "ṅ", after: any("कक़खख़गग़घङ")
113
+ sub "\u0902", "ñ", after: any("चछजज़झञ")
114
+ sub "\u0902", "ṇ", after: any("टट़ठडड़ढढ़ण")
115
+ sub "\u0902", "n", after: any("तथदधन")
116
+ # note[4]
117
+ sub "\u0901", "m̐", after: boundary, before: ""
118
+
119
+
120
+ # CHARACTERS
121
+ parallel {
122
+
123
+ # I. Vowels and Diphthongs (see Note 1)
124
+
125
+ sub "अ", "a"
126
+ sub "आ", "ā"
127
+ sub "इ", "i"
128
+ sub "ई", "ī"
129
+ sub "उ", "u"
130
+ sub "ऊ", "ū"
131
+ sub "ऋ", "ṛ"
132
+ sub "ॠ", "ṝ"
133
+ sub "ऌ", "ḷ"
134
+ sub "ॳ", "ĕ"
135
+ sub "ए", "e"
136
+ sub "ॲ", "ê"
137
+ sub "अै", "ăi"
138
+ sub "ऐ", "ai"
139
+ sub "ऒ", "ŏ"
140
+ sub "ओ", "o"
141
+ sub "ऑ", "ô"
142
+ sub "औ", "ău"
143
+
144
+ # II. Consonants (see Note 2)
145
+ # Gutturals
146
+ sub "क", "ka"
147
+ sub "क़", "qa"
148
+ sub "ख", "kha"
149
+ sub "ख़", "kha"
150
+ sub "ग", "ga"
151
+ sub "ग़", "gha"
152
+ sub "घ", "gha"
153
+ sub "ङ", "ṅa"
154
+
155
+ # Palatals
156
+ sub "च", "ca"
157
+ sub "छ", "cha"
158
+ sub "ज", "ja"
159
+ sub "ज़", "ja"
160
+ sub "झ", "jha"
161
+ sub "ञ", "ña"
162
+
163
+ # Cerebrals
164
+ sub "ट", "ṭa"
165
+ sub "ट़", "t̤a"
166
+ sub "ठ", "ṭha"
167
+ sub "ड", "ḍa"
168
+ sub "ड़", "ṛa"
169
+ sub "ड़", "ṛa"
170
+ sub "ढ", "ḍha"
171
+ sub "ढ़", "ṛha"
172
+ sub "ण", "ṇa"
173
+
174
+ # Dentals
175
+ sub "त", "ta"
176
+ sub "थ", "tha"
177
+ sub "द", "da"
178
+ sub "ध", "dha"
179
+ sub "न", "na"
180
+
181
+ # Labials
182
+ sub "प", "pa"
183
+ sub "फ", "pha"
184
+ sub "फ़", "pha"
185
+ sub "ब", "ba"
186
+ sub "भ", "bha"
187
+ sub "म", "ma"
188
+
189
+ # Semivowels
190
+ sub "य", "ya"
191
+ sub "र", "ra"
192
+ sub "ल", "la"
193
+ sub "व", "va"
194
+
195
+ # Sibilants
196
+ sub "श", "śa"
197
+ sub "ष", "sha"
198
+ sub "स", "sa"
199
+ sub "स़", "s̤a"
200
+
201
+ # Aspirate
202
+ sub "ह", "ha"
203
+ sub "ह़", "ha"
204
+
205
+ # Anusvāra
206
+ sub "ं", "ṃ"
207
+
208
+ # Visarga
209
+ sub "ः ", "ḥ"
210
+
211
+ # Anunāsika
212
+ sub "ँ", "n̐" # ঁ : n̐, m̐
213
+
214
+ # Avagraha
215
+ sub "ऽ", "’" # (apostrophe)
216
+
217
+ # Medials # Needed for connecting consonants
218
+ sub "ा", "ā"
219
+ sub "ॉ", "ô"
220
+ sub "ि", "i"
221
+ sub "ी", "ī"
222
+ sub "ु", "u"
223
+ sub "ू", "ū"
224
+ sub "ृ", "ṛ"
225
+ sub "ॄ", "ṝ"
226
+ sub "े", "e"
227
+ sub "ॊ", "ŏ"
228
+ sub "ौ", "ău"
229
+ sub "ै", "ai"
230
+ sub "ो", "o"
231
+ sub "्", ""
232
+ sub "़", ""
233
+
234
+ # digits
235
+
236
+ sub "०", "0"
237
+ sub "१", "1"
238
+ sub "२", "2"
239
+ sub "३", "3"
240
+ sub "४", "4"
241
+ sub "५", "5"
242
+ sub "६", "6"
243
+ sub "७", "7"
244
+ sub "८", "8"
245
+ sub "९", "9"
246
+ }
247
+ compose
248
+ }
@@ -0,0 +1,63 @@
1
+ metadata {
2
+ authority_id: alalc
3
+ id: 2011
4
+ language: iso-639-2:hin
5
+ source_script: Deva
6
+ destination_script: Latn
7
+ name: Hindi Romanization, 2011
8
+ url: https://www.loc.gov/catdir/cpso/romanization/hindi.pdf
9
+ creation_date: 2011
10
+ description: |
11
+ ALA-LC Romanization table for Hindi
12
+
13
+ notes:
14
+
15
+ - Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
16
+ vowels following a consonant can be found in grammars; no distinction between the two is
17
+ made in transliteration.
18
+
19
+ - |
20
+ The vowel a is implicit after all consonants and consonant clusters and is supplied in
21
+ transliteration, with the following exceptions:
22
+
23
+ a) when another vowel is indicated by its appropriate sign; and
24
+ b) when the absence of any vowel is indicated by the subscript sign ( ◌् ) called halanta or
25
+ virāma.
26
+
27
+ - |
28
+ Exception: Anusvāra is transliterated by:
29
+
30
+ a) ṅ before gutturals,
31
+ b) ñ before palatals,
32
+ c) ṇ before cerebrals,
33
+ d) n before dentals, and
34
+ e) m before labials.
35
+
36
+ - Anunāsika before guttural, palatal, cerebral, and dental occlusives is transliterated n̐. Before
37
+ labials, sibilants, semivowels, aspirates, vowels, and in final position it is transliterated m̐.
38
+
39
+ - When doubled, avagraha is transliterated by two apostrophes ( ’’ ).
40
+ }
41
+
42
+ tests {
43
+ test "इस चुनौतीपूर्ण समय में 'वर्क फ्रॉम होम’ सामान्य बन चुका है", "is cunăutīpūrṇ samay meṃ 'vark phrôm homa’ sāmāny ban cukā hai"
44
+ test "दिल्ली में त्योहार पर खरीददारी करने निकले बड़ी संख्या में लोग, कई जगहों पर लगा भीषण जाम", "dillī meṃ tyohār par kharīdadārī karane nikale baṛī saṃkhyā meṃ loga, kaī jagahoṃ par lagā bhīshaṇ jāma"
45
+ test "सरकार ने पेंशन भोगियों को लाइफ सर्टिफिकेट जमा कराने के मामले में दी बड़ी राहत", "sarakār ne peṃśan bhogiyoṃ ko lāiph sarṭiphikeṭ jamā karāne ke māmale meṃ dī baṛī rāhata"
46
+ test "कांग्रेस ने माना उसके लचर प्रदर्शन ने डुबोई महागठबंधन की लुटिया, पार्टी में उठने लगी आत्ममंथन की आवाज", "kāṃgres ne mānā usake lacar pradarśan ne ḍuboī mahāgaṭhabandhan kī luṭiyā, pārṭī meṃ uṭhane lagī ātmamanthan kī āvāja"
47
+ test "डिजिटल पेमेंट सिस्टम ने छोटे-मध्यम कारोबारों का दिया साथ, कोरोना की परेशानियों को किया कम", "ḍijiṭal pemeṃṭ sisṭam ne choṭe-madhyam kārobāroṃ kā diyā sātha, koronā kī pareśāniyoṃ ko kiyā kama"
48
+ test "छोटे व्यापारियों को ढूंढें, उनसे खरीदें और उनका साथ दें", "choṭe vyāpāriyoṃ ko ḍhūṃḍheṃ, unase kharīdeṃ ăur unakā sāth deṃ"
49
+ test "भारत के साथ साझीदारी को महत्व देंगे बाइडन, ओबामा प्रशासन में रहीं वरिष्ठ अधिकारी एलिसा ने जताई उम्मीद", "bhārat ke sāth sājhīdārī ko mahatv deṃge bāiḍana, obāmā praśāsan meṃ rahīṃ varishṭh adhikārī elisā ne jatāī ummīda"
50
+ test "दो महीने से कोमा में था युवक, चिकन की चर्चा सुनते ही आया होश", "do mahīne se komā meṃ thā yuvaka, cikan kī carcā sunate hī āyā hośa"
51
+ test "कोरोना के टीके पर खुशखबरी, भारत पहुंची रूसी वैक्सीन की पहली खेप", "koronā ke ṭīke par khuśakhabarī, bhārat pahuṃcī rūsī vaiksīn kī pahalī khepa"
52
+ test "दिल्ली के गांधी नगर स्थित एक दुकान में लगी भीषण आग, दमकल की 20 गाड़ियां मौके पर", "dillī ke gāṃdhī nagar sthit ek dukān meṃ lagī bhīshaṇ āga, damakal kī 20 gāṛiyāṃ măuke para"
53
+ }
54
+
55
+
56
+ dependency "alalc-hin-Deva-Latn-1997", as: devalatn
57
+
58
+ stage {
59
+
60
+ run map.devalatn.stage.main
61
+
62
+ }
63
+
@@ -0,0 +1,233 @@
1
+ # Descriptive metadata for the ALA-LC 1997 Kannada-to-Latin map: identifiers, source URL, and the usage notes of the table.
+ # NOTE(review): `Kana` is the ISO 15924 code for Katakana; Kannada is `Knda`. The map's file name (alalc-kan-Kana-Latn-1997) uses the same code, so the two would have to be renamed together — confirm before changing.
+ metadata {
2
+ authority_id: alalc
3
+ id: 1997
4
+ language: iso-639-2:kan
5
+ source_script: Kana
6
+ destination_script: Latn
7
+ name: Kannada Romanization, 1997
8
+ url: http://catdir.loc.gov/catdir/cpso/romanization/kannada.pdf
9
+ creation_date: 1997
10
+ description: |
11
+ ALA-LC Romanization table for Kannada
12
+
13
+ notes:
14
+
15
+ - Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
16
+ vowels following a consonant can be found in grammars; no distinction between the two is
17
+ made in transliteration.
18
+
19
+ - |
20
+ The vowel a is implicit after all consonants and consonant clusters and is supplied in
21
+ transliteration, with the following exceptions:
22
+
23
+ a) when another vowel is indicated by its appropriate sign; and
24
+ b) when the absence of any vowel is indicated by the superscript sign (◌್).
25
+
26
+ - |
27
+ Exception: Anusvāra is transliterated by:
28
+
29
+ a) ṅ before gutturals,
30
+ b) ñ before palatals,
31
+ c) ṇ before cerebrals,
32
+ d) n before dentals, and
33
+ e) m before labials.
34
+ }
35
+
36
+ tests {
37
+ test "ಕರ್ಣಾಟಕ", "karṇāṭaka"
38
+ test "ಬೆಂಗಳೂರು", "beṅgaḷūru"
39
+ test "ಉಡುಪಿಯಲ್ಲಿ ಪ್ರಪ್ರಥಮ ಬಾರಿಗೆ ಪ್ರಾರಂಭವಾಗಿರುವ ದೇಶಿ ಉತ್ಪನ್ನಗಳ ಮಳಿಗೆ", "uḍupiyalli praprathama bārige prārambhavāgiruva dēśi utpannagaḷa maḷige"
40
+ test "ದೇವರ ಹೆಸರು ಬಳಸಿ ಆನ್‌ಲೈನ್‌ ಬೆಟ್ಟಿಂಗ್‌!", "dēvara hesaru baḷasi ānlain beṭṭiṅg!"
41
+ test "ಚಿಕ್ಕಮಗಳೂರು : ಪುಷ್ಪ ಸಮರ್ಪಣೆ ವೇಳೆ ಮಗಳನ್ನ ನೆನೆದು ಕಣ್ಣೀರಿಟ್ಟ ಮೃತ ಪೇದೆ ತಾಯಿ", "cikkamagaḷūru : puṣpa samarpaṇe vēḷe magaḷanna nenedu kaṇṇīriṭṭa mṛta pēde tāyi"
42
+ test "ಸ್ವಾಮಿತ್ವ: ಹೊಸ ಯೋಜನೆಯಿಂದ ನಮಗೆ ಏನು ಲಾಭ ?", "svāmitva: hosa yōjaneyinda namage ēnu lābha ?"
43
+ test "ಮರಳು ಸಾಗಾಣಿಕೆ ವ್ಯವಹಾರ ಆಗಬಾರದು :ಅಧಿಕಾರಿಗಳಿಗೆ ಖಡಕ್ ಸೂಚನೆ ನೀಡಿದ ಜಿಲ್ಲಾಧಿಕಾರಿ", "maraḷu sāgāṇike vyavahāra āgabāradu :adhikārigaḷige khaḍak sūcane nīḍida jillādhikāri"
44
+ test "ಹಾವೇರಿ ಜಿಲ್ಲೆಯಲ್ಲಿ ೯೭ ಜನರಲ್ಲಿ ಕೋವಿಡ್ ಸೋಂಕು ಪತ್ತೆ ; 54 ಮಂದಿ ಗುಣಮುಖ", "hāvēri jilleyalli 97 janaralli kōviḍ sōṅku patte ; 54 mandi guṇamukha"
45
+ test "ಸಿಂದಗಿ ಐಸಿಐಸಿಐ ಬ್ಯಾಂಕ್ ಸೆಕ್ಯುರಿಟಿ ಗಾರ್ಡ್ ಹತ್ಯೆ ಪ್ರಕರಣ ಭೇದಿಸಿದ ಪೊಲೀಸರು", "sindagi aisiaisiai byāṅk sekyuriṭi gārḍ hatye prakaraṇa bhēdisida polīsaru"
46
+ test "ಬ್ಯಾಂಕರ್‌ಗಳೊಂದಿಗೆ ಡಿವಿ ಸಭೆ : ಆಧ್ಯತಾ ವಲಯ, ಸಾಲ ಯೋಜನೆ ತ್ವರಿತ ಮಂಜೂರಿಗೆ ಸೂಚನೆ", "byāṅkargaḷondige ḍivi sabhe : ādhyatā valaya, sāla yōjane tvarita mañjūrige sūcane"
47
+ test "ಪೊಲೀಸ್‌ ಇಲಾಖೆ ಸಮಗ್ರ ಅಭಿವೃದ್ಧಿ; ಡಿಜಿಪಿ ನೇತೃತ್ವದಲ್ಲಿ ಸಮಿತಿ ರಚನೆ: ಬೊಮ್ಮಾಯಿ", "polīs ilākhe samagra abhivṛddhi; ḍijipi nētṛtvadalli samiti racane: bommāyi"
48
+ test "ಕೆಟ್ಟಿರುವ ರಸ್ತೆಗಳ ದುರಸ್ತಿಗೆ ಸರಕಾರದ ಯೋಜನೆ", "keṭṭiruva rastegaḷa durastige sarakārada yōjane"
49
+ }
50
+
51
+ # kana_chars_1: every dependent vowel sign handled by this map plus the virama (U+0CCD); a consonant directly followed by one of these carries no inherent "a".
+ aliases {
52
+ def_alias kana_chars_1, any("\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc4\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd\u0ce2")
53
+ }
54
+
55
+ stage {
56
+ # NORMALIZATION: rebuild two-part vowel signs that arrive canonically decomposed, e.g. U+0CC6 U+0CC2 must read as U+0CCA ("o"), not as "e" + "ū".
57
+ # This has to precede the character table below, which only lists the composed signs.
58
+ sub "\u0cc6\u0cc2", "\u0cca" # -> vowel sign o
59
+ sub "\u0cca\u0cd5", "\u0ccb" # -> vowel sign ō
60
+ sub "\u0cc6\u0cd5", "\u0cc7" # -> vowel sign ē
61
+ sub "\u0cc6\u0cd6", "\u0cc8" # -> vowel sign ai
62
+ sub "\u0cbf\u0cd5", "\u0cc0" # -> vowel sign ī
63
+
64
+ # RULES
65
+ # rule[III]: anusvāra takes the nasal of the following consonant's class. Runs before rule II, because rule II romanizes consonants and would hide them from these lookaheads.
66
+ sub "\u0C82", "ṅ", after: any("ಕಖಗಘಙ")
67
+ sub "\u0C82", "ñ", after: any("ಚಛಜಝಞ")
68
+ sub "\u0C82", "ṇ", after: any("ಟಠಡಢಣ")
69
+ sub "\u0C82", "n", after: any("ತಥದಧನ")
70
+ sub "\u0C82", "m", after: any("ಪಫಬಭಮ")
71
+
72
+ # rule II: a consonant directly followed by a vowel sign or virama is written without the inherent "a"
73
+ sub "ಕ", "k", after: kana_chars_1
74
+ sub "ಖ", "kh", after: kana_chars_1
75
+ sub "ಗ", "g", after: kana_chars_1
76
+ sub "ಘ", "gh", after: kana_chars_1
77
+ sub "ಙ", "ṅ", after: kana_chars_1
78
+ sub "ಚ", "c", after: kana_chars_1
79
+ sub "ಛ", "ch", after: kana_chars_1
80
+ sub "ಜ", "j", after: kana_chars_1
81
+ sub "ಝ", "jh", after: kana_chars_1
82
+ sub "ಞ", "ñ", after: kana_chars_1
83
+ sub "ಟ", "ṭ", after: kana_chars_1
84
+ sub "ಠ", "ṭh", after: kana_chars_1
85
+ sub "ಡ", "ḍ", after: kana_chars_1
86
+ sub "ಢ", "ḍh", after: kana_chars_1
87
+ sub "ಣ", "ṇ", after: kana_chars_1
88
+ sub "ತ", "t", after: kana_chars_1
89
+ sub "ಥ", "th", after: kana_chars_1
90
+ sub "ದ", "d", after: kana_chars_1
91
+ sub "ಧ", "dh", after: kana_chars_1
92
+ sub "ನ", "n", after: kana_chars_1
93
+ sub "ಪ", "p", after: kana_chars_1
94
+ sub "ಫ", "ph", after: kana_chars_1
95
+ sub "ಬ", "b", after: kana_chars_1
96
+ sub "ಭ", "bh", after: kana_chars_1
97
+ sub "ಮ", "m", after: kana_chars_1
98
+ sub "ಯ", "y", after: kana_chars_1
99
+ sub "ರ", "r", after: kana_chars_1
100
+ sub "ಱ", "ṟ", after: kana_chars_1
101
+ sub "ಲ", "l", after: kana_chars_1
102
+ sub "ಳ", "ḷ", after: kana_chars_1
103
+ sub "ೞ", "l̤", after: kana_chars_1
104
+ sub "ವ", "v", after: kana_chars_1
105
+ sub "ಶ", "ś", after: kana_chars_1
106
+ sub "ಷ", "ṣ", after: kana_chars_1
107
+ sub "ಸ", "s", after: kana_chars_1
108
+ sub "ಹ", "h", after: kana_chars_1
109
+
110
+ # CHARACTERS
111
+ parallel {
112
+ sub "ಅ", "a"
113
+ sub "ಆ", "ā"
114
+ sub "ಇ", "i"
115
+ sub "ಈ", "ī"
116
+ sub "ಉ", "u"
117
+ sub "ಊ", "ū"
118
+ sub "ಋ", "ṛ"
119
+ sub "ೠ", "ṝ"
120
+
121
+ sub "ಌ", "ḻ"
122
+
123
+ sub "ಎ", "e"
124
+ sub "ಏ", "ē"
125
+ sub "ಐ", "ai"
126
+
127
+ sub "ಒ", "o"
128
+ sub "ಓ", "ō"
129
+ sub "ಔ", "au"
130
+
131
+ # Gutturals
132
+ sub "ಕ", "ka"
133
+ sub "ಖ", "kha"
134
+ sub "ಗ", "ga"
135
+ sub "ಘ", "gha"
136
+ sub "ಙ", "ṅa"
137
+
138
+ # Palatals
139
+ sub "ಚ", "ca"
140
+ sub "ಛ", "cha"
141
+ sub "ಜ", "ja"
142
+ sub "ಝ", "jha"
143
+ sub "ಞ", "ña"
144
+
145
+ # Cerebrals
146
+ sub "ಟ", "ṭa"
147
+ sub "ಠ", "ṭha"
148
+ sub "ಡ", "ḍa"
149
+ sub "ಢ", "ḍha"
150
+ sub "ಣ", "ṇa"
151
+
152
+ # Dentals
153
+ sub "ತ", "ta"
154
+ sub "ಥ", "tha"
155
+ sub "ದ", "da"
156
+ sub "ಧ", "dha"
157
+ sub "ನ", "na"
158
+
159
+ # Labials
160
+ sub "ಪ", "pa"
161
+ sub "ಫ", "pha"
162
+ sub "ಬ", "ba"
163
+ sub "ಭ", "bha"
164
+ sub "ಮ", "ma"
165
+
166
+ # Semivowels
167
+ sub "ಯ", "ya"
168
+ sub "ರ", "ra"
169
+ sub "ಱ", "ṟa"
170
+ sub "ಲ", "la"
171
+ sub "ಳ", "ḷa"
172
+ sub "ೞ", "l̤a"
173
+
174
+ sub "ವ", "va"
175
+
176
+ # Sibilants
177
+ sub "ಶ", "śa"
178
+ sub "ಷ", "ṣa"
179
+ sub "ಸ", "sa"
180
+
181
+ # Aspirate
182
+ sub "ಹ", "ha"
183
+
184
+ # Visarga
185
+ sub "ಃ", "ḥ"
186
+
187
+ # Anusvāra (default; the class-nasal cases were already handled by rule[III] above)
188
+ sub "ಂ", "ṃ"
189
+
190
+ sub "\u0cbc", "" #nukta
191
+
192
+ # Medials (dependent vowel signs), needed after the bare consonants produced by rule II
193
+ sub "ಾ", "ā"
194
+ sub "ಿ", "i"
195
+ sub "ೀ", "ī"
196
+ sub "ು", "u"
197
+ sub "ೂ", "ū"
198
+ sub "ೃ", "ṛ"
199
+ sub "ೄ", "ṝ"
200
+ sub "\u0CE2", "ḻ" # KANNADA VOWEL SIGN VOCALIC L ( ೢ)
201
+
202
+ sub "ೆ", "e"
203
+ sub "ೇ", "ē"
204
+ sub "ೈ", "ai"
205
+
206
+ sub "ೊ", "o"
207
+ sub "ೋ", "ō"
208
+ sub "ೌ", "au"
209
+
210
+ sub "्", "" # NOTE(review): looks like the Devanagari virama rather than a Kannada sign — confirm it is needed
211
+ sub "़", "" # NOTE(review): looks like the Devanagari nukta rather than a Kannada sign — confirm it is needed
212
+ sub "್", "" # virama: marks a consonant pronounced without a vowel
213
+ sub "\u200d", "" # zero-width joiner is dropped
214
+ sub "\u200c", "" # zero-width non-joiner is dropped
215
+
216
+ # Digits
217
+
218
+ sub "೦", "0"
219
+ sub "೧", "1"
220
+ sub "೨", "2"
221
+ sub "೩", "3"
222
+ sub "೪", "4"
223
+ sub "೫", "5"
224
+ sub "೬", "6"
225
+ sub "೭", "7"
226
+ sub "೮", "8"
227
+ sub "೯", "9"
228
+ }
229
+
230
+ compose
231
+ }
233
+