interscript-maps 2.0.5

Sign up to get free protection for your applications and to get access to all the features.
Files changed (291) hide show
  1. checksums.yaml +7 -0
  2. data/README.adoc +28 -0
  3. data/interscript-maps.gemspec +28 -0
  4. data/interscript-maps.yaml +235 -0
  5. data/libs/posix.iml +11 -0
  6. data/libs/unicode.iml +13 -0
  7. data/libs/var-Cyrl.iml +7 -0
  8. data/libs/var-kor.iml +17 -0
  9. data/maps-staging/royin-tha-Thai-Latn-1939-generic.imp +98 -0
  10. data/maps-staging/royin-tha-Thai-Latn-1968.imp +156 -0
  11. data/maps-staging/royin-tha-Thai-Latn-1999-chained.imp +161 -0
  12. data/maps-staging/royin-tha-Thai-Latn-1999.imp +78 -0
  13. data/maps-staging/var-tha-Thai-Thai-phonemic.imp +53 -0
  14. data/maps-staging/var-tha-Thai-Zsym-ipa.imp +273 -0
  15. data/maps/acadsin-zho-Hani-Latn-2002.imp +27515 -0
  16. data/maps/alalc-amh-Ethi-Latn-1997.imp +392 -0
  17. data/maps/alalc-amh-Ethi-Latn-2011.imp +85 -0
  18. data/maps/alalc-ara-Arab-Latn-1997.imp +1171 -0
  19. data/maps/alalc-asm-Deva-Latn-1997.imp +214 -0
  20. data/maps/alalc-asm-Deva-Latn-2012.imp +53 -0
  21. data/maps/alalc-aze-Arab-Latn-1997.imp +321 -0
  22. data/maps/alalc-aze-Cyrl-Latn-1997.imp +101 -0
  23. data/maps/alalc-bel-Cyrl-Latn-1997.imp +118 -0
  24. data/maps/alalc-ben-Beng-Latn-1997.imp +225 -0
  25. data/maps/alalc-ben-Beng-Latn-2017.imp +135 -0
  26. data/maps/alalc-bul-Cyrl-Latn-1997.imp +110 -0
  27. data/maps/alalc-div-Thaa-Latn-1997.imp +171 -0
  28. data/maps/alalc-ell-Grek-Latn-1997.imp +381 -0
  29. data/maps/alalc-ell-Grek-Latn-2010.imp +382 -0
  30. data/maps/alalc-guj-Gujr-Latn-1997.imp +223 -0
  31. data/maps/alalc-guj-Gujr-Latn-2011.imp +57 -0
  32. data/maps/alalc-hin-Deva-Latn-1997.imp +248 -0
  33. data/maps/alalc-hin-Deva-Latn-2011.imp +63 -0
  34. data/maps/alalc-kan-Kana-Latn-1997.imp +233 -0
  35. data/maps/alalc-kan-Kana-Latn-2011.imp +58 -0
  36. data/maps/alalc-kat-Geok-Latn-1997.imp +109 -0
  37. data/maps/alalc-kat-Geor-Latn-1997.imp +104 -0
  38. data/maps/alalc-kor-Hang-Latn-1997.imp +68 -0
  39. data/maps/alalc-mal-Mlym-Latn-1997.imp +260 -0
  40. data/maps/alalc-mal-Mlym-Latn-2012.imp +65 -0
  41. data/maps/alalc-mar-Deva-Latn-1997.imp +178 -0
  42. data/maps/alalc-mar-Deva-Latn-2011.imp +51 -0
  43. data/maps/alalc-mkd-Cyrl-Latn-1997.imp +125 -0
  44. data/maps/alalc-mkd-Cyrl-Latn-2013.imp +113 -0
  45. data/maps/alalc-mon-Cyrl-Latn-1997.imp +161 -0
  46. data/maps/alalc-ori-Orya-Latn-1997.imp +234 -0
  47. data/maps/alalc-ori-Orya-Latn-2011.imp +59 -0
  48. data/maps/alalc-pan-Guru-Latn-1997.imp +241 -0
  49. data/maps/alalc-pan-Guru-Latn-2011.imp +71 -0
  50. data/maps/alalc-per-Arab-Latn-1997.imp +318 -0
  51. data/maps/alalc-pli-Deva-Latn-2012.imp +140 -0
  52. data/maps/alalc-pra-Deva-Latn-2012.imp +52 -0
  53. data/maps/alalc-rus-Cyrl-Latn-1997.imp +165 -0
  54. data/maps/alalc-rus-Cyrl-Latn-2012.imp +107 -0
  55. data/maps/alalc-san-Deva-Latn-2012.imp +207 -0
  56. data/maps/alalc-sin-Sinh-Latn-1997.imp +246 -0
  57. data/maps/alalc-sin-Sinh-Latn-2011.imp +63 -0
  58. data/maps/alalc-srp-Cyrl-Latn-1997.imp +124 -0
  59. data/maps/alalc-srp-Cyrl-Latn-2013.imp +115 -0
  60. data/maps/alalc-tam-Taml-Latn-1997.imp +52 -0
  61. data/maps/alalc-tam-Taml-Latn-2011.imp +49 -0
  62. data/maps/alalc-tel-Telu-Latn-1997.imp +237 -0
  63. data/maps/alalc-tel-Telu-Latn-2011.imp +58 -0
  64. data/maps/alalc-ukr-Cyrl-Latn-1997.imp +123 -0
  65. data/maps/alalc-ukr-Cyrl-Latn-2011.imp +32 -0
  66. data/maps/apcbg-bul-Cyrl-Latn-1995.imp +194 -0
  67. data/maps/az-aze-Cyrl-Latn-1939.imp +105 -0
  68. data/maps/az-aze-Cyrl-Latn-1958.imp +50 -0
  69. data/maps/bas-rus-Cyrl-Latn-2017-bss.imp +160 -0
  70. data/maps/bas-rus-Cyrl-Latn-2017-oss.imp +165 -0
  71. data/maps/bgn-jpn-Hrkt-Latn-1962.imp +288 -0
  72. data/maps/bgn-kor-Hang-Latn-1943.imp +31 -0
  73. data/maps/bgn-kor-Kore-Latn-1943.imp +33 -0
  74. data/maps/bgna-bul-Cyrl-Latn-2006.imp +119 -0
  75. data/maps/bgna-bul-Cyrl-Latn-2009.imp +119 -0
  76. data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +393 -0
  77. data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +472 -0
  78. data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +125 -0
  79. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +111 -0
  80. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.imp +169 -0
  81. data/maps/bgnpcgn-bal-Arab-Latn-2008.imp +296 -0
  82. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.imp +200 -0
  83. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +137 -0
  84. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +38 -0
  85. data/maps/bgnpcgn-che-Cyrl-Latn-2008.imp +176 -0
  86. data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +56 -0
  87. data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +90 -0
  88. data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +71 -0
  89. data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +443 -0
  90. data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +269 -0
  91. data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +41 -0
  92. data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +28 -0
  93. data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +111 -0
  94. data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +42 -0
  95. data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +32 -0
  96. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +191 -0
  97. data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +116 -0
  98. data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +43 -0
  99. data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +193 -0
  100. data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +170 -0
  101. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +177 -0
  102. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +40 -0
  103. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +41 -0
  104. data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +240 -0
  105. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +132 -0
  106. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +174 -0
  107. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +168 -0
  108. data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +208 -0
  109. data/maps/bgnpcgn-per-Arab-Latn-1958.imp +312 -0
  110. data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +552 -0
  111. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +445 -0
  112. data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +289 -0
  113. data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +165 -0
  114. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +133 -0
  115. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +195 -0
  116. data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +48 -0
  117. data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +55 -0
  118. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +146 -0
  119. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +185 -0
  120. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +188 -0
  121. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +136 -0
  122. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +88 -0
  123. data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +333 -0
  124. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +145 -0
  125. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +74 -0
  126. data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +7463 -0
  127. data/maps/bis-asm-Beng-Latn-13194-1991.imp +154 -0
  128. data/maps/bis-ben-Beng-Latn-13194-1991.imp +151 -0
  129. data/maps/bis-dev-Deva-Latn-13194-1991.imp +178 -0
  130. data/maps/bis-guj-Gujr-Latn-13194-1991.imp +172 -0
  131. data/maps/bis-kan-Kana-Latn-13194-1991.imp +166 -0
  132. data/maps/bis-mlm-Mlym-Latn-13194-1991.imp +170 -0
  133. data/maps/bis-ori-Orya-Latn-13194-1991.imp +168 -0
  134. data/maps/bis-pnj-Guru-Latn-13194-1991.imp +169 -0
  135. data/maps/bis-tel-Telu-Latn-13194-1991.imp +165 -0
  136. data/maps/bis-tml-Taml-Latn-13194-1991.imp +149 -0
  137. data/maps/by-bel-Cyrl-Latn-1998.imp +123 -0
  138. data/maps/by-bel-Cyrl-Latn-2007.imp +77 -0
  139. data/maps/din-grc-Grek-Latn-31634-2011-t1.imp +627 -0
  140. data/maps/din-hin-Deva-Latn-33904-2018.imp +101 -0
  141. data/maps/din-kat-Geor-Latn-32707-2010.imp +103 -0
  142. data/maps/din-mar-Deva-Latn-33904-2018.imp +83 -0
  143. data/maps/din-nep-Deva-Latn-33904-2018.imp +110 -0
  144. data/maps/din-pli-Deva-Latn-33904-2018.imp +72 -0
  145. data/maps/din-pra-Deva-Latn-33904-2018.imp +66 -0
  146. data/maps/din-san-Deva-Latn-33904-2018.imp +294 -0
  147. data/maps/din-tam-Taml-Latn-33903-2016.imp +187 -0
  148. data/maps/dos-nep-Deva-Latn-1997.imp +47 -0
  149. data/maps/elot-ell-Grek-Latn-743-1982-tl.imp +399 -0
  150. data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +397 -0
  151. data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +34 -0
  152. data/maps/elot-ell-Grek-Latn-743-2001-ts.imp +178 -0
  153. data/maps/ggg-kat-Geor-Latn-2002.imp +75 -0
  154. data/maps/gki-bel-Cyrl-Latn-1992.imp +44 -0
  155. data/maps/gki-bel-Cyrl-Latn-2000.imp +159 -0
  156. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +179 -0
  157. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.imp +132 -0
  158. data/maps/hk-yue-Hani-Latn-1888.imp +29201 -0
  159. data/maps/icao-bel-Cyrl-Latn-9303.imp +136 -0
  160. data/maps/icao-bul-Cyrl-Latn-9303.imp +127 -0
  161. data/maps/icao-fas-Arab-Latn-9303.imp +112 -0
  162. data/maps/icao-heb-Hebr-Latn-9303.imp +160 -0
  163. data/maps/icao-mkd-Cyrl-Latn-9303.imp +126 -0
  164. data/maps/icao-rus-Cyrl-Latn-9303.imp +126 -0
  165. data/maps/icao-srp-Cyrl-Latn-9303.imp +126 -0
  166. data/maps/icao-ukr-Cyrl-Latn-9303.imp +127 -0
  167. data/maps/iso-ara-Arab-Latn-233-1984.imp +301 -0
  168. data/maps/iso-asm-Beng-Latn-15919-2001.imp +73 -0
  169. data/maps/iso-ben-Beng-Latn-15919-2001.imp +171 -0
  170. data/maps/iso-ell-Grek-Latn-843-1997-t1.imp +365 -0
  171. data/maps/iso-ell-Grek-Latn-843-1997-t2.imp +43 -0
  172. data/maps/iso-guj-Gujr-Latn-15919-2001.imp +214 -0
  173. data/maps/iso-hin-Deva-Latn-15919-2001.imp +73 -0
  174. data/maps/iso-inc-Deva-Latn-15919-2001.imp +61 -0
  175. data/maps/iso-jpn-Hrkt-Latn-3602-1989.imp +59 -0
  176. data/maps/iso-kan-Kana-Latn-15919-2001.imp +212 -0
  177. data/maps/iso-kat-Geor-Latn-9984-1996.imp +103 -0
  178. data/maps/iso-kor-Hang-Latn-1996-method1.imp +140 -0
  179. data/maps/iso-kor-Hang-Latn-1996-method2.imp +132 -0
  180. data/maps/iso-mal-Mlym-Latn-15919-2001.imp +276 -0
  181. data/maps/iso-mar-Deva-Latn-15919-2001.imp +68 -0
  182. data/maps/iso-nep-Deva-Latn-15919-2001.imp +75 -0
  183. data/maps/iso-ori-Orya-Latn-15919-2001.imp +188 -0
  184. data/maps/iso-pan-Guru-Latn-15919-2001.imp +217 -0
  185. data/maps/iso-pli-Beng-Latn-15919-2001.imp +66 -0
  186. data/maps/iso-pli-Deva-Latn-15919-2001.imp +68 -0
  187. data/maps/iso-pli-Sinh-Latn-15919-2001.imp +211 -0
  188. data/maps/iso-pli-Thai-Latn-15919-2001.imp +47 -0
  189. data/maps/iso-pra-Deva-Latn-15919-2001.imp +60 -0
  190. data/maps/iso-prs-Arab-Latn-233-3-1999.imp +352 -0
  191. data/maps/iso-rus-Cyrl-Latn-9-1995.imp +279 -0
  192. data/maps/iso-san-Deva-Latn-15919-2001.imp +215 -0
  193. data/maps/iso-tam-Taml-Latn-15919-2001.imp +153 -0
  194. data/maps/iso-tel-Telu-Latn-15919-2001.imp +214 -0
  195. data/maps/iso-tha-Thai-Latn-11940-1998.imp +114 -0
  196. data/maps/kp-kor-Hang-Latn-2002.imp +540 -0
  197. data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +29005 -0
  198. data/maps/masm-mon-Cyrl-Latn-5217-2012.imp +136 -0
  199. data/maps/masm-mon-Latn-Cyrl-5217-2012.imp +162 -0
  200. data/maps/mext-jpn-Hrkt-Latn-1954.imp +403 -0
  201. data/maps/moct-kor-Hang-Latn-2000.imp +475 -0
  202. data/maps/mofa-jpn-Hrkt-Latn-1989.imp +484 -0
  203. data/maps/mv-div-Thaa-Latn-1987.imp +144 -0
  204. data/maps/mvd-bel-Cyrl-Latn-2008.imp +224 -0
  205. data/maps/mvd-bel-Cyrl-Latn-2010.imp +64 -0
  206. data/maps/mvd-rus-Cyrl-Latn-2008.imp +110 -0
  207. data/maps/mvd-rus-Cyrl-Latn-2010.imp +40 -0
  208. data/maps/odni-ara-Arab-Latn-2004.imp +106 -0
  209. data/maps/odni-ara-Arab-Latn-2015.imp +281 -0
  210. data/maps/odni-aze-Cyrl-Latn-2015.imp +158 -0
  211. data/maps/odni-bel-Cyrl-Latn-2015.imp +138 -0
  212. data/maps/odni-bul-Cyrl-Latn-2005.imp +90 -0
  213. data/maps/odni-bul-Cyrl-Latn-2015.imp +103 -0
  214. data/maps/odni-che-Cyrl-Latn-2015.imp +165 -0
  215. data/maps/odni-fas-Arab-Latn-2004.imp +268 -0
  216. data/maps/odni-fas-Arab-Latn-2015.imp +398 -0
  217. data/maps/odni-hin-Deva-Latn-2004.imp +180 -0
  218. data/maps/odni-hin-Deva-Latn-2015.imp +256 -0
  219. data/maps/odni-kat-Geor-Latn-2015.imp +76 -0
  220. data/maps/odni-kaz-Cyrl-Latn-2015.imp +164 -0
  221. data/maps/odni-kir-Cyrl-Latn-2015.imp +149 -0
  222. data/maps/odni-kor-Hang-Latn-2015.imp +307 -0
  223. data/maps/odni-mkd-Cyrl-Latn-2005.imp +28 -0
  224. data/maps/odni-mkd-Cyrl-Latn-2015.imp +124 -0
  225. data/maps/odni-prs-Arab-Latn-2004.imp +120 -0
  226. data/maps/odni-prs-Arab-Latn-2015.imp +225 -0
  227. data/maps/odni-pus-Arab-Latn-2011.imp +327 -0
  228. data/maps/odni-rus-Cyrl-Latn-2015.imp +79 -0
  229. data/maps/odni-srp-Cyrl-Latn-2005.imp +35 -0
  230. data/maps/odni-srp-Cyrl-Latn-2015.imp +130 -0
  231. data/maps/odni-tat-Cyrl-Latn-2015.imp +157 -0
  232. data/maps/odni-tgk-Cyrl-Latn-2015.imp +161 -0
  233. data/maps/odni-tuk-Cyrl-Latn-2015.imp +159 -0
  234. data/maps/odni-uig-Cyrl-Latn-2015.imp +151 -0
  235. data/maps/odni-ukr-Cyrl-Latn-2015.imp +136 -0
  236. data/maps/odni-urd-Arab-Latn-2015.imp +220 -0
  237. data/maps/odni-uzb-Cyrl-Latn-2015.imp +165 -0
  238. data/maps/sac-zho-Hans-Latn-1979.imp +20940 -0
  239. data/maps/sasm-mon-Mong-Latn-general-1978.imp +294 -0
  240. data/maps/sasm-mon-Mong-Latn-phonetic-1978.imp +261 -0
  241. data/maps/ses-ara-Arab-Latn-1930.imp +225 -0
  242. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.imp +171 -0
  243. data/maps/ua-ukr-Cyrl-Latn-1996.imp +149 -0
  244. data/maps/ua-ukr-Cyrl-Latn-2007.imp +69 -0
  245. data/maps/ua-ukr-Cyrl-Latn-2010.imp +128 -0
  246. data/maps/un-amh-Ethi-Latn-2016.imp +483 -0
  247. data/maps/un-ara-Arab-Latn-1971.imp +137 -0
  248. data/maps/un-ara-Arab-Latn-1972.imp +155 -0
  249. data/maps/un-ara-Arab-Latn-2017.imp +375 -0
  250. data/maps/un-asm-Beng-Latn-1972.imp +188 -0
  251. data/maps/un-bel-Cyrl-Latn-2007.imp +78 -0
  252. data/maps/un-ben-Beng-Latn-2016.imp +516 -0
  253. data/maps/un-ell-Grek-Latn-1987-phonetic.imp +437 -0
  254. data/maps/un-ell-Grek-Latn-1987-tl.imp +27 -0
  255. data/maps/un-ell-Grek-Latn-1987-ts.imp +269 -0
  256. data/maps/un-guj-Gujr-Latn-1972.imp +196 -0
  257. data/maps/un-hin-Deva-Latn-2016.imp +356 -0
  258. data/maps/un-kan-Kana-Latn-2016.imp +214 -0
  259. data/maps/un-mal-Mlym-Latn-1972.imp +215 -0
  260. data/maps/un-mar-Deva-Latn-2016.imp +96 -0
  261. data/maps/un-mon-Mong-Latn-general-2013.imp +170 -0
  262. data/maps/un-mon-Mong-Latn-phonetic-2013.imp +170 -0
  263. data/maps/un-nep-Deva-Latn-1972.imp +295 -0
  264. data/maps/un-nep-Deva-Latn-2013.imp +62 -0
  265. data/maps/un-ori-Orya-Latn-1972.imp +208 -0
  266. data/maps/un-pan-Guru-Latn-1972.imp +321 -0
  267. data/maps/un-prs-Arab-Latn-1967.imp +214 -0
  268. data/maps/un-rus-Cyrl-Latn-1987.imp +96 -0
  269. data/maps/un-sin-Sinh-Latn-1972.imp +193 -0
  270. data/maps/un-tam-Taml-Latn-1972.imp +173 -0
  271. data/maps/un-tel-Telu-Latn-1972.imp +229 -0
  272. data/maps/un-ukr-Cyrl-Latn-1998.imp +58 -0
  273. data/maps/un-ukr-Cyrl-Latn-2012.imp +95 -0
  274. data/maps/un-urd-Arab-Latn-1972.imp +290 -0
  275. data/maps/var-amh-Ethi-Latn-eae-2003.imp +414 -0
  276. data/maps/var-gez-Ethi-Latn-eae-2003.imp +54 -0
  277. data/maps/var-hin-Deva-Latn-hunterian-1872.imp +212 -0
  278. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.imp +399 -0
  279. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.imp +382 -0
  280. data/maps/var-kor-Hang-Hang-jamo.imp +11196 -0
  281. data/maps/var-kor-Hang-Latn-mr-1939.imp +574 -0
  282. data/maps/var-kor-Kore-Hang-2013.imp +59764 -0
  283. data/maps/var-kor-Kore-Latn-mr-1939.imp +36 -0
  284. data/maps/var-mar-Deva-Latn-hunterian-1872.imp +39 -0
  285. data/maps/var-mon-Mong-Latn-1930.imp +101 -0
  286. data/maps/var-mon-Mong-Latn-lessing.imp +181 -0
  287. data/maps/var-mon-Mong-Latn-vpmc.imp +182 -0
  288. data/maps/var-pra-Deva-Latn-iast-1912.imp +36 -0
  289. data/maps/var-san-Deva-Latn-iast-1912.imp +147 -0
  290. data/maps/var-zho-Hani-Latn-wd-1979.imp +27549 -0
  291. metadata +335 -0
@@ -0,0 +1,63 @@
1
+ metadata {
2
+ authority_id: alalc
3
+ id: 2011
4
+ language: iso-639-2:sin
5
+ source_script: Sinh
6
+ destination_script: Latn
7
+ name: Sinhalese Romanization, 2011
8
+ url: https://www.loc.gov/catdir/cpso/romanization/sinhales.pdf
9
+ creation_date: 2011
10
+ description: |
11
+ ALA-LC Romanization table for Sinhalese
12
+
13
+
14
+ notes:
15
+
16
+ - Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
17
+ vowels following a consonant can be found in grammars; no distinction between the two is
18
+ made in transliteration.
19
+
20
+ - |
21
+ The vowel a is implicit after all consonants and consonant clusters and is supplied in
22
+ transliteration, with the following exceptions:
23
+
24
+ a) when another vowel is indicated by its appropriate sign; and
25
+ b) when the absence of any vowel is indicated by the sign ් called virāma.
26
+
27
+ - |
28
+ Exceptions: Anusvāra is transliterated by:
29
+
30
+ a) ṅ before gutturals,
31
+ b) ñ before palatals,
32
+ c) ṇ before cerebrals,
33
+ d) n before dentals, and
34
+ e) m before labials.
35
+
36
+ - |
37
+ Exceptions:
38
+ a) when saññaka represents a nasal, it is romanized according to the rule for anusvāra.
39
+ b) when saññaka is combined with an aspirated consonant, the combination is romanized as a non-aspirated, followed by an aspirated consonant.
40
+ }
41
+
42
+ tests {
43
+ test "හිටපු අග්‍රාමාත්‍ය රනිල් වික්‍රමසිංහ අප්‍රේල් 21 ප්‍රහාරය සම්බන්ධයෙන් විමර්ශනය කරන ජනාධිපති පරීක්ෂණ කොමිසම හමුවේ දෙවෙනි දිනටත් සාක්ෂි ලබාදීමට පැමිණෙයි", "hiṭapu agrāmātya ranil vikramasiṃha aprēl 21 prahāraya sambanandhayen vimarśanaya karana janādhipati parīkṣaṇa komisama hamuvē deveni dinaṭat sākṣi labādīmaṭa pămiṇeyi"
44
+ test "පෑලියගොඩ මත්ස්‍ය තොග වෙළෙදපොළට පිවිසෙන පිවිසුම් මාර්ගය පුළුල් කර සංවර්ධනයට පියවර - මහාමාර්ග අමාත්‍ය ජොන්ස්ටන් ප්‍රනාන්දු", "pâliyagoḍa matsya toga veḷedapoḷaṭa pivisena pivisum māraṅgaya puḷul kara saṃvarandhanayaṭa piyavara - mahāmāraṅga amātya jonsaṇṭan pranānandu"
45
+ test "මව්බිමටත් රට වැසියන්ටත් ආශිර්වාද කරමින් වි⁣ශේෂ ආගමික වැඩසටහන් මාලාවක්", "mavbimaṭat raṭa văsiyanaṇṭat āśirvāda karamin vi⁣śēṣa āgamika văḍasaṭahan mālāvak"
46
+ test "මිනුවන්ගොඩ කොරෝනා පොකුරින් තවත් ආසාදිතයින් 49 දෙනකු හඳුනා ගෙන", "minuvanaṅgoḍa korōnā pokurin tavat āsāditayin 49 denaku handunā gena"
47
+ test "ඉරණවිල වෙරළේ නාඳුනන ධීවර යාත‍්‍රා දෙකක්", "iraṇavila veraḷē nāndunana dhīvara yātarā dekak"
48
+ test "මඩකලපුව මංගලාරාමේ හාමුදුරුවන්ට මරණ තර්ජන - ආරක්ෂාවත් අඩුකරලා", "maḍakalapuva maṃgalārāmē hāmuduruvanaṇṭa maraṇa tarañjana - ārakṣāvat aḍukaralā"
49
+ test "හොරට කහ කුඩු හැදූ දෙදෙනෙක් බඩුත් එක්ක දැලේ", "horaṭa kaha kuḍu hădū dedenek baḍut ekaṅka dălē"
50
+ test "ඉංගිරියේ ජලභීතිකාව වැළඳුනු නරියෙකු තෙදිනක මෙහෙයුමකින් අල්ලා ගනී", "iṃgiriyē jalabhītikāva văḷandunu nariyeku tedinaka meheyumakin allā ganī"
51
+ test "බෞද්ධ දර්ශනයට අනුව අපි උපයන ධනය බුද්ධිමත් ලෙස විසර්ජනය කරන්නේ කෙසේ ද?", "baudandha darśanayaṭa anuva api upayana dhanaya budandhimat lesa visarañjanaya karanannē kesē da?"
52
+ test "ඉන්දීය ජාතිකයන් සමග එක්වන මන්නාරමේ ධීවරයන්ට අනතුරු අගවයි", "inandīya jātikayan samaga ekvana manannāramē dhīvarayanaṇṭa anaturu agavayi"
53
+ test "තේ නැවත වගාවට පෙර පස පුනරුත්ථාපනයට කෙටි මග", "tē năvata vagāvaṭa pera pasa punarutanthāpanayaṭa keṭi maga"
54
+ }
55
+
56
+ dependency "alalc-sin-Sinh-Latn-1997", as: sinhlatn
57
+
58
+ stage {
59
+
60
+ run map.sinhlatn.stage.main
61
+
62
+ }
63
+
@@ -0,0 +1,124 @@
1
+ metadata {
2
+ authority_id: alalc
3
+ id: 1997
4
+ language: iso-639-2:srp
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: Serbian and Macedonian Romanization, ALA-LC 1997 System
8
+ url: http://catdir.loc.gov/catdir/cpso/romanization/serbian.pdf
9
+ creation_date: 1997
10
+ description: ALA-LC Romanization table for Serbian and Macedonian.
11
+
12
+ notes:
13
+ - Special characters in romanization
14
+ Đ - D with crossbar (upper case). USMARC hexadecimal code A3.
15
+ đ - d with crossbar (lower case). USMARC hexadecimal code B3.
16
+
17
+ - Character modifiers in romanization
18
+ ´ - acute. USMARC hexadecimal code E2.
19
+ ˇ - hachek. USMARC hexadecimal code E9.
20
+ }
21
+
22
+ tests {
23
+ test "Општина Ердут", "Opština Erdut"
24
+ test "Општина Двор", "Opština Dvor"
25
+ test "ЛУЃЕ луѓе", "LUǴE luǵe"
26
+ test "ЅВЕЗДА ѕвезда Ѕвезда", "DZVEZDA dzvezda Dzvezda"
27
+ test "ЌАРУВАЊЕ ќарување", "ḰARUVANJE ḱaruvanje"
28
+ }
29
+
30
+ dependency "posix", import: true
31
+
32
+ stage {
33
+
34
+
35
+ # CHARACTERS
36
+ parallel {
37
+ sub "А", "A"
38
+ sub "Б", "B"
39
+ sub "В", "V"
40
+ sub "Г", "G"
41
+ sub "Ѓ", "Ǵ" # Ǵ
42
+ sub "Д", "D"
43
+ sub "Ђ", "Đ" # Đ
44
+ sub "Е", "E"
45
+ sub "Ж", "Ž" # Ž
46
+ sub "З", "Z"
47
+ sub "Ѕ", "Dz"
48
+ sub "И", "I"
49
+ sub "Ј", "J"
50
+ sub "К", "K"
51
+ sub "Ќ", "Ḱ" # Ḱ
52
+ sub "Л", "L"
53
+ sub "Љ", "Lj"
54
+ sub "М", "M"
55
+ sub "Н", "N"
56
+ sub "Њ", "Nj"
57
+ sub "О", "O"
58
+ sub "П", "P"
59
+ sub "Р", "R"
60
+ sub "С", "S"
61
+ sub "Т", "T"
62
+ sub "Ћ", "Ć" # Ć
63
+ sub "У", "U"
64
+ sub "Ф", "F"
65
+ sub "Х", "H"
66
+ sub "Ц", "C"
67
+ sub "Ч", "Č" # Č
68
+ sub "Џ", "Dž" # Dž
69
+ sub "Ш", "Š" # Š
70
+ sub "а", "a"
71
+ sub "б", "b"
72
+ sub "в", "v"
73
+ sub "г", "g"
74
+ sub "ѓ", "ǵ" # ǵ
75
+ sub "д", "d"
76
+ sub "ђ", "đ" # đ
77
+ sub "е", "e"
78
+ sub "ж", "ž" # ž
79
+ sub "з", "z"
80
+ sub "ѕ", "dz"
81
+ sub "и", "i"
82
+ sub "ј", "j"
83
+ sub "к", "k"
84
+ sub "ќ", "ḱ" # ḱ
85
+ sub "л", "l"
86
+ sub "љ", "lj"
87
+ sub "м", "m"
88
+ sub "н", "n"
89
+ sub "њ", "nj"
90
+ sub "о", "o"
91
+ sub "п", "p"
92
+ sub "р", "r"
93
+ sub "с", "s"
94
+ sub "т", "t"
95
+ sub "ћ", "ć" # ć
96
+ sub "у", "u"
97
+ sub "ф", "f"
98
+ sub "х", "h"
99
+ sub "ц", "c"
100
+ sub "ч", "č" # č
101
+ sub "џ", "dž" # dž
102
+ sub "ш", "š" # š
103
+ }
104
+ # POSTRULES
105
+ # rewritten by hand to work properly
106
+ # DZ
107
+ sub capture(maybe(upper)) + "Dz" + capture(upper), ref(1) + "DZ" + ref(2)
108
+ sub capture(upper) + "Dz" + capture(maybe(upper)), ref(1) + "DZ" + ref(2)
109
+
110
+ #LJ
111
+ sub capture(upper) + "Lj" + capture(maybe(upper)), ref(1) + "LJ" + ref(2)
112
+ sub capture(maybe(upper)) + "Lj" + capture(upper), ref(1) + "LJ" + ref(2)
113
+
114
+ #NJ
115
+ sub capture(upper) + "Nj" + capture(maybe(upper)), ref(1) + "NJ" + ref(2)
116
+ sub capture(maybe(upper)) + "Nj" + capture(upper), ref(1) + "NJ" + ref(2)
117
+
118
+ #DŽ
119
+ sub capture(upper) + "Dž" + capture(maybe(upper)), ref(1) + "DŽ" + ref(2)
120
+ sub capture(maybe(upper)) + "Dž" + capture(upper), ref(1) + "DŽ" + ref(2)
121
+
122
+ compose
123
+ }
124
+
@@ -0,0 +1,115 @@
1
+ metadata {
2
+ authority_id: alalc
3
+ id: 2013
4
+ language: iso-639-2:srp
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: ROMANIZATION OF SERBIAN, ALA-LC 2013 System
8
+ url: https://www.loc.gov/catdir/cpso/romanization/serbian.pdf
9
+ creation_date: 2013
10
+ description: |
11
+ Serbian uses the Cyrillic and Roman alphabets. When the Roman alphabet is used it is the same as Croatian.
12
+ }
13
+
14
+ tests {
15
+ test "Шупља Стена", "Šuplja Stena"
16
+ test "Чукарица", "Čukarica"
17
+ test "Црна Трава", "Crna Trava"
18
+ test "Херцег Нови", "Herceg Novi"
19
+ test "Улцињ", "Ulcinj"
20
+ test "Ужице", "Užice"
21
+ test "Тресаначка Река", "Tresanačka Reka"
22
+ test "Сјеница", "Sjenica"
23
+ test "Рожаје", "Rožaje"
24
+ test "Пљевља", "Pljevlja"
25
+ test "Оџаци", "Odžaci"
26
+ test "Никшић", "Nikšić"
27
+ test "Медвеђа", "Medveđa"
28
+ test "Лозница", "Loznica"
29
+ test "Књажевац", "Knjaževac"
30
+ test "Зрењанин", "Zrenjanin"
31
+ test "Житорађа", "Žitorađa"
32
+ test "Ервеник", "Ervenik"
33
+ test "Доње Љупче", "Donje Ljupče"
34
+ test "Гусиње", "Gusinje"
35
+ test "ГУСИЊЕ", "GUSINJE"
36
+ test "Врњачка Бања", "Vrnjačka Banja"
37
+ test "Бијело Поље", "Bijelo Polje"
38
+ test "Алибунар", "Alibunar"
39
+ }
40
+
41
+ aliases {
42
+ def_alias srp_multichar, any(["Lj", "Nj", "Dž"])
43
+ def_alias srp_latupper, any("A".."Z")
44
+ }
45
+
46
+ stage {
47
+ # CHARACTERS
48
+ parallel {
49
+ sub "А", "A"
50
+ sub "Б", "B"
51
+ sub "В", "V"
52
+ sub "Г", "G"
53
+ sub "Д", "D"
54
+ sub "Ђ", "Đ" # Đ
55
+ sub "Е", "E"
56
+ sub "Ж", "Ž" # Ž
57
+ sub "З", "Z"
58
+ sub "И", "I"
59
+ sub "Ј", "J"
60
+ sub "К", "K"
61
+ sub "Л", "L"
62
+ sub "Љ", "Lj"
63
+ sub "М", "M"
64
+ sub "Н", "N"
65
+ sub "Њ", "Nj"
66
+ sub "О", "O"
67
+ sub "П", "P"
68
+ sub "Р", "R"
69
+ sub "С", "S"
70
+ sub "Т", "T"
71
+ sub "Ћ", "Ć" # Ć
72
+ sub "У", "U"
73
+ sub "Ф", "F"
74
+ sub "Х", "H"
75
+ sub "Ц", "C"
76
+ sub "Ч", "Č" # Č
77
+ sub "Џ", "Dž" # Dž
78
+ sub "Ш", "Š" # Š
79
+ sub "а", "a"
80
+ sub "б", "b"
81
+ sub "в", "v"
82
+ sub "г", "g"
83
+ sub "д", "d"
84
+ sub "ђ", "đ" # đ
85
+ sub "е", "e"
86
+ sub "ж", "ž" # ž
87
+ sub "з", "z"
88
+ sub "и", "i"
89
+ sub "ј", "j"
90
+ sub "к", "k"
91
+ sub "л", "l"
92
+ sub "љ", "lj"
93
+ sub "м", "m"
94
+ sub "н", "n"
95
+ sub "њ", "nj"
96
+ sub "о", "o"
97
+ sub "п", "p"
98
+ sub "р", "r"
99
+ sub "с", "s"
100
+ sub "т", "t"
101
+ sub "ћ", "ć" # ć
102
+ sub "у", "u"
103
+ sub "ф", "f"
104
+ sub "х", "h"
105
+ sub "ц", "c"
106
+ sub "ч", "č" # č
107
+ sub "џ", "dž" # dž
108
+ sub "ш", "š" # š
109
+ }
110
+
111
+ # POSTRULES
112
+ sub srp_multichar, upcase, before: srp_latupper
113
+ sub srp_multichar, upcase, after: srp_latupper
114
+ compose
115
+ }
@@ -0,0 +1,52 @@
1
+ metadata {
2
+ authority_id: alalc
3
+ id: 1997
4
+ language: iso-639-2:tam
5
+ source_script: Taml
6
+ destination_script: Latn
7
+ name: Tamil Romanization, 1997
8
+ url: http://catdir.loc.gov/catdir/cpso/romanization/tamil.pdf
9
+ creation_date: 1997
10
+ description: |
11
+ ALA-LC Romanization table for Tamil
12
+
13
+ notes:
14
+
15
+ - Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
16
+ vowels following a consonant can be found in grammars; no distinction between the two is
17
+ made in transliteration.
18
+
19
+ - |
20
+ The vowel a is implicit after all consonants and consonant clusters and is supplied in
21
+ transliteration, with the following exceptions:
22
+
23
+ a) when another vowel is indicated by its appropriate sign; and
24
+ b) when the absence of any vowel is indicated by the superscript dot ( ் ) called puḷḷi.
25
+
26
+ - This letter has the same form as the vowel sign for ā appearing after a consonant. Where ambiguity arises, it is written.
27
+ }
28
+
29
+ tests {
30
+ test "அழிந்து போன நகரத்தில் , தொலைந்து போன நான்", "aḻintu pōṉa nakarattil , tolaintu pōṉa nāṉ"
31
+ test "முதன் முதலாக - மை ஃபர்ஸ்ட் சோலோ ட்ராவல்", "mutaṉ mutalāka - mai ḵaparsṭ cōlō ṭrāval"
32
+ test "வாழ்க்கையில் அவன் போன முதல் சோலோ டிரிப் அது தான்.", "vāḻkkaiyil avaṉ pōṉa mutal cōlō ṭirip atu tāṉ."
33
+ test "ஸ்கூல் ப்ரெண்ட் கார்த்திக் வீட்டுக்கு போய்ட்டு", "skūl preṇṭ kārttik vīṭṭukku pōyṭṭu"
34
+ test "நாசா வெளியிட்ட வெடிக்கும் நட்சத்திரத்தின் வீடியோ", "nācā veḷiyiṭṭa veṭikkum naṭcattirattiṉ vīṭiyō"
35
+ test "நாசா வெளியிட்ட வெடிக்கும் நட்சத்திரத்தின் வீடியோ", "nācā veḷiyiṭṭa veṭikkum naṭcattirattiṉ vīṭiyō"
36
+ test "டார்பிடோவை ஏவ உதவும் சூப்பர்சானிக் ஏவுகணையான ஸ்மார்ட் சோதனை வெற்றி", "ṭārpiṭōvai ēva utavum cūpparcāṉik ēvukaṇaiyāṉa smārṭ cōtaṉai veṟṟi"
37
+ test "இந்த ஆண்டு மருத்துவத்துக்கான நோபல் பரிசு பெறுபவர்களின் பெயர்கள் அறிவிப்பு", "inta āṇṭu maruttuvattukkāṉa nōpal paricu peṟupavarkaḷiṉ peyarkaḷ aṟivippu"
38
+ test "மல்லையா விவகாரம்: பிரிட்டன் அரசின் நடவடிக்கைகள் தங்களுக்கு தெரியவில்லை - மத்திய அரசு தகவல்", "mallaiyā vivakāram: piriṭṭaṉ araciṉ naṭavaṭikkaikaḷ taṅkaḷukku teriyavillai - mattiya aracu takaval"
39
+ test "ஆலோசனைக்குப் பிறகு தேனியில் இருந்து சென்னை புறப்பட்டார் துணை முதலமைச்சர் பன்னீர்செல்வம்", "ālōcaṉaikkup piṟaku tēṉiyil iruntu ceṉṉai puṟappaṭṭār tuṇai mutalamaiccar paṉṉīrcelvam"
40
+ test "இன்று தான் பேரன் பிறந்தநாள் முடிந்து ஃப்ரீ ஆகி இருக்கிறேன்", "iṉṟu tāṉ pēraṉ piṟantanāḷ muṭintu ḵaprī āki irukkiṟēṉ"
41
+ }
42
+
43
+ dependency "din-tam-Taml-Latn-33903-2016", as: tamllatn
44
+
45
+ stage {
46
+ # CHARACTERS
47
+ parallel {
48
+ sub "ஃ", "ḵa"
49
+ }
50
+
51
+ run map.tamllatn.stage.main
52
+ }
@@ -0,0 +1,49 @@
1
+ metadata {
2
+ authority_id: alalc
3
+ id: 2011
4
+ language: iso-639-2:tam
5
+ source_script: Taml
6
+ destination_script: Latn
7
+ name: Tamil Romanization, 2011
8
+ url: https://www.loc.gov/catdir/cpso/romanization/tamil.pdf
9
+ creation_date: 2011
10
+ description: |
11
+ ALA-LC Romanization table for Tamil
12
+
13
+ notes:
14
+
15
+ - Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
16
+ vowels following a consonant can be found in grammars; no distinction between the two is
17
+ made in transliteration.
18
+
19
+ - |
20
+ The vowel a is implicit after all consonants and consonant clusters and is supplied in
21
+ transliteration, with the following exceptions:
22
+
23
+ a) when another vowel is indicated by its appropriate sign; and
24
+ b) when the absence of any vowel is indicated by the superscript dot ( ் ) called puḷḷi.
25
+
26
+ - This letter has the same form as the vowel sign for ā appearing after a consonant. Where ambiguity arises, it is written.
27
+ }
28
+
29
+ tests {
30
+ test "மலையாள நடிகர் சங்கத்திலிருந்து நடிகை பார்வதி திடீர் விலகல்.", "malaiyāḷa naṭikar caṅkattiliruntu naṭikai pārvati tiṭīr vilakal."
31
+ test "சச்சின் டெண்டுல்கரை அலுவலக உதவியாளராக நியமிப்பீர்களா?", "cacciṉ ṭeṇṭulkarai aluvalaka utaviyāḷarāka niyamippīrkaḷā?"
32
+ test "அமீரகத்தில் தொலைநோக்கி இல்லாமல் நாளை பார்க்கலாம்", "amīrakattil tolainōkki illāmal nāḷai pārkkalām"
33
+ test "லடாக் யூனியன் பிரதேசம் இந்தியா சட்டவிரோதமாக நிறுவிய ஒரு பகுதி- சீனா மீண்டும் பிடிவாதம்", "laṭāk yūṉiyaṉ piratēcam intiyā caṭṭavirōtamāka niṟuviya oru pakuti- cīṉā mīṇṭum piṭivātam"
34
+ test "பாலியல் குற்றங்களில் ஈடுபடுவோருக்கு மரண தண்டனை புதிய சட்டம்", "pāliyal kuṟṟaṅkaḷil īṭupaṭuvōrukku maraṇa taṇṭaṉai putiya caṭṭam"
35
+ test "புதுடெல்லி", "putuṭelli"
36
+ test "அப்படி விளம்பரத்தில என்ன இருக்கு...?", "appaṭi viḷamparattila eṉṉa irukku...?"
37
+ test "பூமிக்கும், செவ்வாய் கிரகத்துக்கும் இடையிலான அதிகபட்ச தூரம் ௪௦ கோடியே ௧௩ லட்சம் கி.மீ தொலைவு ஆகும்.", "pūmikkum, cevvāy kirakattukkum iṭaiyilāṉa atikapaṭca tūram 40 kōṭiyē 13 laṭcam ki.mī tolaivu ākum."
38
+ test "அமீரகத்தில் செவ்வாய் கிரகம் குறித்த ஆய்வில் ஈடுபடுவோர் மற்றும் வானியல் நிபுணர்களுக்கு இது ஒரு நல்ல வாய்ப்பாக அமையும்.", "amīrakattil cevvāy kirakam kuṟitta āyvil īṭupaṭuvōr maṟṟum vāṉiyal nipuṇarkaḷukku itu oru nalla vāyppāka amaiyum."
39
+ test "நள்ளிரவு நேரமாக இருந்தால் நமது தலைக்கு மேலே காணலாம். காலை நேரத்தில் மேற்கு மற்றும் தென்மேற்கு திசையில் செவ்வாய் கிரகத்தை பார்க்கலாம்.", "naḷḷiravu nēramāka iruntāl namatu talaikku mēlē kāṇalām. kālai nērattil mēṟku maṟṟum teṉmēṟku ticaiyil cevvāy kirakattai pārkkalām."
40
+ test "வெறும் கண்ணால் பார்க்கும்போது புள்ளியாக ஆரஞ்சு நிறத்தில் பிரகாசமாக தெரியும்.", "veṟum kaṇṇāl pārkkumpōtu puḷḷiyāka ārañcu niṟattil pirakācamāka teriyum."
41
+ }
42
+
43
+ dependency "alalc-tam-Taml-Latn-1997", as: tamllatn
44
+
45
+ stage {
46
+
47
+ run map.tamllatn.stage.main
48
+
49
+ }
@@ -0,0 +1,237 @@
1
+ metadata {
2
+ authority_id: alalc
3
+ id: 1997
4
+ language: iso-639-2:tel
5
+ source_script: Telu
6
+ destination_script: Latn
7
+ name: Telugu Romanization, 1997
8
+ url: http://catdir.loc.gov/catdir/cpso/romanization/telugu.pdf
9
+ creation_date: 1997
10
+ description: |
11
+ ALA-LC Romanization table for Telugu
12
+
13
+ notes:
14
+
15
+ - |
16
+ Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
17
+ vowels following a consonant can be found in grammars; no distinction between the two is
18
+ made in transliteration.
19
+ - |
20
+ The vowel a is implicit after all consonants and consonant clusters and is supplied in
21
+ transliteration, with the following exceptions:
22
+ a) when another vowel is indicated by its appropriate sign; and
23
+ b) when the absence of any vowel is indicated by the superscript sign ( ్ ) called valapalagilaka.
24
+ - |
25
+ Exception: Sunna is transliterated by:
26
+ a) ṅ before gutturals,
27
+ b) ñ before palatals,
28
+ c) ṇ before cerebrals,
29
+ d) n before dentals, and
30
+ e) m before labials.
31
+ - |
32
+ Ardhasunna before guttural, palatal, cerebral, and dental occlusives is transliterated n̐.
33
+ Before labials, sibilants, semivowels, the aspirate, vowels, and in final position it is
34
+ transliterated m̐.
35
+ }
36
+
37
+ tests { # expected values: the virama suppresses the inherent a, the vowel sign ో is ō, and sunna assimilates to the following consonant (notes 2 and 3 of the metadata)
38
+ test "తమిళనాడు", "tamiḷanāḍu"
39
+ test "తంటికొండ ఘటన: ఆగని మృత్యుఘోష", "taṇṭikoṇḍa ghaṭana: āgani mṛtyughōṣa"
40
+ test "మళ్లీ వివాదం: అమితాబ్‌పై కేసు", "maḷlī vivādaṃ: amitābpai kēsu"
41
+ test "‘వరద సాయం పేరుతో వైట్ కాలర్ దోపిడీ’", "‘varada sāyaṃ pērutō vaiṭ kālar dōpiḍī’"
42
+ test "రెండో విడత జీఎస్టీ పరిహారం", "reṇḍō viḍata jīesṭī parihāraṃ"
43
+ test "నితీష్‌ కుమార్‌ అధ్యాయం ముగిసినట్లేనా?!", "nitīṣ kumār adhyāyaṃ mugisinaṭlēnā?!"
44
+ test "వారిపై జీవితాంతం నిషేధం విధించండి!", "vāripai jīvitāntaṃ niṣēdhaṃ vidhiñcaṇḍi!"
45
+ test "మరో లాక్‌డౌన్‌ వల్ల అన్నీ అనర్థాలే!", "marō lākḍaun valla annī anarthālē!"
46
+ test "జెసిండా మరో సంచలనం", "jesiṇḍā marō sañcalanaṃ"
47
+ test "స్వీయ నిర్బంధంలోకి డబ్ల్యూహెచ్‌ఓ డైరెక్టర్‌", "svīya nirbandhaṃlōki ḍablyūhecō ḍairekṭar"
48
+ test "కరోనాపై యుద్ధంలో సమిధలు", "karōnāpai yuddhaṃlō samidhalu"
49
+ test "అమెరికా ఎన్నికలు: ‘పెద్దన్న’ ఎవరో?!", "amerikā ennikalu: ‘peddanna’ evarō?!"
50
+ test "౪౬౨౬౯", "46269"
51
+ }
52
+ # telu_chars_1: the dependent vowel signs plus the virama U+0C4D; a consonant directly followed by one of these is written without its inherent a
53
+ aliases {
54
+ def_alias telu_chars_1, any("\u0c3e\u0c3f\u0c40\u0c41\u0c42\u0c43\u0c46\u0c47\u0c48\u0c4a\u0c4b\u0c4c\u0c4d")
55
+ }
56
+
57
+ stage {
58
+ # Order matters: rules III and IV look ahead for a Telugu consonant, so they must run before rule II rewrites consonants to Latin
59
+ # RULES
60
+ # rule III: sunna becomes the nasal of the class of the consonant that follows it
61
+ sub "\u0C02", "ṅ", after: any("కఖగఘఙ")
62
+ sub "\u0C02", "ñ", after: any("చౘఛజౙఝఞ")
63
+ sub "\u0C02", "ṇ", after: any("టఠడఢణ")
64
+ sub "\u0C02", "n", after: any("తథదధన")
65
+ sub "\u0C02", "m", after: any("పఫబభమ")
66
+
67
+ # rule IV: ardhasunna before guttural, palatal, cerebral, and dental consonants
68
+ sub "\u0C01", "n̐", after: any("కఖగఘఙచౘఛజౙఝఞటఠడఢణతథదధన")
69
+
70
+ # rule II: a consonant followed by a vowel sign or the virama (telu_chars_1) is written without the inherent a
71
+ sub "క", "k", after: telu_chars_1
72
+ sub "ఖ", "kh", after: telu_chars_1
73
+ sub "గ", "g", after: telu_chars_1
74
+ sub "ఘ", "gh", after: telu_chars_1
75
+ sub "ఙ", "ṅ", after: telu_chars_1
76
+ sub "చ", "c", after: telu_chars_1
77
+ sub "ౘ", "ĉ", after: telu_chars_1
78
+ sub "ఛ", "ch", after: telu_chars_1
79
+ sub "జ", "j", after: telu_chars_1
80
+ sub "ౙ", "ĵ", after: telu_chars_1
81
+ sub "ఝ", "jh", after: telu_chars_1
82
+ sub "ఞ", "ñ", after: telu_chars_1
83
+ sub "ట", "ṭ", after: telu_chars_1
84
+ sub "ఠ", "ṭh", after: telu_chars_1
85
+ sub "డ", "ḍ", after: telu_chars_1
86
+ sub "ఢ", "ḍh", after: telu_chars_1
87
+ sub "ణ", "ṇ", after: telu_chars_1
88
+ sub "త", "t", after: telu_chars_1
89
+ sub "థ", "th", after: telu_chars_1
90
+ sub "ద", "d", after: telu_chars_1
91
+ sub "ధ", "dh", after: telu_chars_1
92
+ sub "న", "n", after: telu_chars_1
93
+ sub "ప", "p", after: telu_chars_1
94
+ sub "ఫ", "ph", after: telu_chars_1
95
+ sub "బ", "b", after: telu_chars_1
96
+ sub "భ", "bh", after: telu_chars_1
97
+ sub "మ", "m", after: telu_chars_1
98
+ sub "య", "y", after: telu_chars_1
99
+ sub "ర", "r", after: telu_chars_1
100
+ sub "ఱ", "ṛ", after: telu_chars_1
101
+ sub "ల", "l", after: telu_chars_1
102
+ sub "ళ", "ḷ", after: telu_chars_1
103
+ sub "వ", "v", after: telu_chars_1
104
+ sub "శ", "ś", after: telu_chars_1
105
+ sub "ష", "ṣ", after: telu_chars_1
106
+ sub "స", "s", after: telu_chars_1
107
+ sub "హ", "h", after: telu_chars_1
108
+
109
+
110
+ # CHARACTERS: everything still in Telugu script at this point is mapped one-to-one; bare consonants carry the inherent a
111
+ parallel {
112
+
113
+ sub "అ", "a"
114
+ sub "ఆ", "ā"
115
+ sub "ఇ", "i"
116
+ sub "ఈ", "ī"
117
+ sub "ఉ", "u"
118
+ sub "ఊ", "ū"
119
+ sub "ఋ", "ṛ"
120
+ sub "ౠ", "ṝ"
121
+ sub "ఌ", "ḻ"
122
+ sub "ఎ", "e"
123
+ sub "ఏ", "ē"
124
+ sub "ఐ", "ai"
125
+ sub "ఒ", "o"
126
+ sub "ఓ", "ō"
127
+ sub "ఔ", "au"
128
+
129
+ # Gutturals
130
+ sub "క", "ka"
131
+ sub "ఖ", "kha"
132
+ sub "గ", "ga"
133
+ sub "ఘ", "gha"
134
+ sub "ఙ", "ṅa"
135
+
136
+ # Palatals
137
+ sub "చ", "ca"
138
+ sub "ౘ", "ĉa"
139
+ sub "ఛ", "cha"
140
+ sub "జ", "ja"
141
+ sub "ౙ", "ĵa"
142
+ sub "ఝ", "jha"
143
+ sub "ఞ", "ña"
144
+
145
+ # Cerebrals
146
+ sub "ట", "ṭa"
147
+ sub "ఠ", "ṭha"
148
+ sub "డ", "ḍa"
149
+ sub "ఢ", "ḍha"
150
+ sub "ణ", "ṇa"
151
+
152
+ # Dentals
153
+ sub "త", "ta"
154
+ sub "థ", "tha"
155
+ sub "ద", "da"
156
+ sub "ధ", "dha"
157
+ sub "న", "na"
158
+
159
+ # Labials
160
+ sub "ప", "pa"
161
+ sub "ఫ", "pha"
162
+ sub "బ", "ba"
163
+ sub "భ", "bha"
164
+ sub "మ", "ma"
165
+
166
+ # Semivowels
167
+ sub "య", "ya"
168
+ sub "ర", "ra"
169
+ sub "ఱ", "ṛa" # NOTE(review): same Latin letter as the vowel ఋ above; confirm against the ALA-LC table
170
+ sub "ల", "la"
171
+ sub "ళ", "ḷa"
172
+ sub "వ", "va"
173
+
174
+ # Sibilants
175
+ sub "శ", "śa"
176
+ sub "ష", "ṣa"
177
+ sub "స", "sa"
178
+
179
+
180
+
181
+ # Aspirate
182
+ sub "హ", "ha"
183
+
184
+
185
+
186
+ # Chandrabindu (ardhasunna); the n̐ cases were already handled by rule IV
187
+ sub "ঁ", "m̐" # NOTE(review): this looks like the Bengali sign, not a Telugu one; presumably carried over from another map
188
+ sub "ఁ", "m̐"
189
+
190
+ # Bisarga
191
+ sub "ః", "ḥ"
192
+
193
+ # Anusvāra (sunna) that was not assimilated by rule III
194
+ sub "ం", "ṃ"
195
+
196
+ # Medials: dependent vowel signs; the consonant before them was already written bare by rule II
197
+
198
+ sub "ా", "ā"
199
+ sub "ి", "i"
200
+ sub "ీ", "ī"
201
+ sub "ు", "u"
202
+ sub "ూ", "ū"
203
+ sub "ృ", "ṛ"
204
+ sub "ె", "e"
205
+ sub "ే", "ē"
206
+ sub "ై", "ai"
207
+ sub "ొ", "o"
208
+ sub "ో", "ō"
209
+ sub "ౌ", "au"
210
+ sub "\u09CD", "" # NOTE(review): U+09CD is in the Bengali block; presumably carried over from another map
211
+
212
+
213
+ sub "\u0c4d", "" # virama (halanta): the preceding consonant was already written bare by rule II, so the sign itself is dropped
214
+ sub "ౕ\t", "" # NOTE(review): the pattern is the sign followed by a tab character; confirm the tab is intended
215
+ sub "ౖ\t", "" # NOTE(review): same as above, sign followed by a tab
216
+ sub "्", "" # NOTE(review): looks like a Devanagari sign; presumably carried over from another map
217
+ sub "़", "" # NOTE(review): looks like a Devanagari sign; presumably carried over from another map
218
+ sub "\u200D", "" # zero-width joiner, written as an escape so the invisible character cannot be lost in editing
219
+ sub "\u200C", "" # zero-width non-joiner, written as an escape for the same reason
220
+
221
+ # numbers
222
+
223
+ sub "౦", "0"
224
+ sub "౧", "1"
225
+ sub "౨", "2"
226
+ sub "౩", "3"
227
+ sub "౪", "4"
228
+ sub "౫", "5"
229
+ sub "౬", "6"
230
+ sub "౭", "7"
231
+ sub "౮", "8"
232
+ sub "౯", "9"
233
+ }
234
+
235
+ compose
236
+ }
237
+