interscript-maps 2.0.5

Sign up to get free protection for your applications and to get access to all the features.
Files changed (291) hide show
  1. checksums.yaml +7 -0
  2. data/README.adoc +28 -0
  3. data/interscript-maps.gemspec +28 -0
  4. data/interscript-maps.yaml +235 -0
  5. data/libs/posix.iml +11 -0
  6. data/libs/unicode.iml +13 -0
  7. data/libs/var-Cyrl.iml +7 -0
  8. data/libs/var-kor.iml +17 -0
  9. data/maps-staging/royin-tha-Thai-Latn-1939-generic.imp +98 -0
  10. data/maps-staging/royin-tha-Thai-Latn-1968.imp +156 -0
  11. data/maps-staging/royin-tha-Thai-Latn-1999-chained.imp +161 -0
  12. data/maps-staging/royin-tha-Thai-Latn-1999.imp +78 -0
  13. data/maps-staging/var-tha-Thai-Thai-phonemic.imp +53 -0
  14. data/maps-staging/var-tha-Thai-Zsym-ipa.imp +273 -0
  15. data/maps/acadsin-zho-Hani-Latn-2002.imp +27515 -0
  16. data/maps/alalc-amh-Ethi-Latn-1997.imp +392 -0
  17. data/maps/alalc-amh-Ethi-Latn-2011.imp +85 -0
  18. data/maps/alalc-ara-Arab-Latn-1997.imp +1171 -0
  19. data/maps/alalc-asm-Deva-Latn-1997.imp +214 -0
  20. data/maps/alalc-asm-Deva-Latn-2012.imp +53 -0
  21. data/maps/alalc-aze-Arab-Latn-1997.imp +321 -0
  22. data/maps/alalc-aze-Cyrl-Latn-1997.imp +101 -0
  23. data/maps/alalc-bel-Cyrl-Latn-1997.imp +118 -0
  24. data/maps/alalc-ben-Beng-Latn-1997.imp +225 -0
  25. data/maps/alalc-ben-Beng-Latn-2017.imp +135 -0
  26. data/maps/alalc-bul-Cyrl-Latn-1997.imp +110 -0
  27. data/maps/alalc-div-Thaa-Latn-1997.imp +171 -0
  28. data/maps/alalc-ell-Grek-Latn-1997.imp +381 -0
  29. data/maps/alalc-ell-Grek-Latn-2010.imp +382 -0
  30. data/maps/alalc-guj-Gujr-Latn-1997.imp +223 -0
  31. data/maps/alalc-guj-Gujr-Latn-2011.imp +57 -0
  32. data/maps/alalc-hin-Deva-Latn-1997.imp +248 -0
  33. data/maps/alalc-hin-Deva-Latn-2011.imp +63 -0
  34. data/maps/alalc-kan-Kana-Latn-1997.imp +233 -0
  35. data/maps/alalc-kan-Kana-Latn-2011.imp +58 -0
  36. data/maps/alalc-kat-Geok-Latn-1997.imp +109 -0
  37. data/maps/alalc-kat-Geor-Latn-1997.imp +104 -0
  38. data/maps/alalc-kor-Hang-Latn-1997.imp +68 -0
  39. data/maps/alalc-mal-Mlym-Latn-1997.imp +260 -0
  40. data/maps/alalc-mal-Mlym-Latn-2012.imp +65 -0
  41. data/maps/alalc-mar-Deva-Latn-1997.imp +178 -0
  42. data/maps/alalc-mar-Deva-Latn-2011.imp +51 -0
  43. data/maps/alalc-mkd-Cyrl-Latn-1997.imp +125 -0
  44. data/maps/alalc-mkd-Cyrl-Latn-2013.imp +113 -0
  45. data/maps/alalc-mon-Cyrl-Latn-1997.imp +161 -0
  46. data/maps/alalc-ori-Orya-Latn-1997.imp +234 -0
  47. data/maps/alalc-ori-Orya-Latn-2011.imp +59 -0
  48. data/maps/alalc-pan-Guru-Latn-1997.imp +241 -0
  49. data/maps/alalc-pan-Guru-Latn-2011.imp +71 -0
  50. data/maps/alalc-per-Arab-Latn-1997.imp +318 -0
  51. data/maps/alalc-pli-Deva-Latn-2012.imp +140 -0
  52. data/maps/alalc-pra-Deva-Latn-2012.imp +52 -0
  53. data/maps/alalc-rus-Cyrl-Latn-1997.imp +165 -0
  54. data/maps/alalc-rus-Cyrl-Latn-2012.imp +107 -0
  55. data/maps/alalc-san-Deva-Latn-2012.imp +207 -0
  56. data/maps/alalc-sin-Sinh-Latn-1997.imp +246 -0
  57. data/maps/alalc-sin-Sinh-Latn-2011.imp +63 -0
  58. data/maps/alalc-srp-Cyrl-Latn-1997.imp +124 -0
  59. data/maps/alalc-srp-Cyrl-Latn-2013.imp +115 -0
  60. data/maps/alalc-tam-Taml-Latn-1997.imp +52 -0
  61. data/maps/alalc-tam-Taml-Latn-2011.imp +49 -0
  62. data/maps/alalc-tel-Telu-Latn-1997.imp +237 -0
  63. data/maps/alalc-tel-Telu-Latn-2011.imp +58 -0
  64. data/maps/alalc-ukr-Cyrl-Latn-1997.imp +123 -0
  65. data/maps/alalc-ukr-Cyrl-Latn-2011.imp +32 -0
  66. data/maps/apcbg-bul-Cyrl-Latn-1995.imp +194 -0
  67. data/maps/az-aze-Cyrl-Latn-1939.imp +105 -0
  68. data/maps/az-aze-Cyrl-Latn-1958.imp +50 -0
  69. data/maps/bas-rus-Cyrl-Latn-2017-bss.imp +160 -0
  70. data/maps/bas-rus-Cyrl-Latn-2017-oss.imp +165 -0
  71. data/maps/bgn-jpn-Hrkt-Latn-1962.imp +288 -0
  72. data/maps/bgn-kor-Hang-Latn-1943.imp +31 -0
  73. data/maps/bgn-kor-Kore-Latn-1943.imp +33 -0
  74. data/maps/bgna-bul-Cyrl-Latn-2006.imp +119 -0
  75. data/maps/bgna-bul-Cyrl-Latn-2009.imp +119 -0
  76. data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +393 -0
  77. data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +472 -0
  78. data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +125 -0
  79. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +111 -0
  80. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.imp +169 -0
  81. data/maps/bgnpcgn-bal-Arab-Latn-2008.imp +296 -0
  82. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.imp +200 -0
  83. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +137 -0
  84. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +38 -0
  85. data/maps/bgnpcgn-che-Cyrl-Latn-2008.imp +176 -0
  86. data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +56 -0
  87. data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +90 -0
  88. data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +71 -0
  89. data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +443 -0
  90. data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +269 -0
  91. data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +41 -0
  92. data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +28 -0
  93. data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +111 -0
  94. data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +42 -0
  95. data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +32 -0
  96. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +191 -0
  97. data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +116 -0
  98. data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +43 -0
  99. data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +193 -0
  100. data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +170 -0
  101. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +177 -0
  102. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +40 -0
  103. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +41 -0
  104. data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +240 -0
  105. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +132 -0
  106. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +174 -0
  107. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +168 -0
  108. data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +208 -0
  109. data/maps/bgnpcgn-per-Arab-Latn-1958.imp +312 -0
  110. data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +552 -0
  111. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +445 -0
  112. data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +289 -0
  113. data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +165 -0
  114. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +133 -0
  115. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +195 -0
  116. data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +48 -0
  117. data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +55 -0
  118. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +146 -0
  119. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +185 -0
  120. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +188 -0
  121. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +136 -0
  122. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +88 -0
  123. data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +333 -0
  124. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +145 -0
  125. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +74 -0
  126. data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +7463 -0
  127. data/maps/bis-asm-Beng-Latn-13194-1991.imp +154 -0
  128. data/maps/bis-ben-Beng-Latn-13194-1991.imp +151 -0
  129. data/maps/bis-dev-Deva-Latn-13194-1991.imp +178 -0
  130. data/maps/bis-guj-Gujr-Latn-13194-1991.imp +172 -0
  131. data/maps/bis-kan-Kana-Latn-13194-1991.imp +166 -0
  132. data/maps/bis-mlm-Mlym-Latn-13194-1991.imp +170 -0
  133. data/maps/bis-ori-Orya-Latn-13194-1991.imp +168 -0
  134. data/maps/bis-pnj-Guru-Latn-13194-1991.imp +169 -0
  135. data/maps/bis-tel-Telu-Latn-13194-1991.imp +165 -0
  136. data/maps/bis-tml-Taml-Latn-13194-1991.imp +149 -0
  137. data/maps/by-bel-Cyrl-Latn-1998.imp +123 -0
  138. data/maps/by-bel-Cyrl-Latn-2007.imp +77 -0
  139. data/maps/din-grc-Grek-Latn-31634-2011-t1.imp +627 -0
  140. data/maps/din-hin-Deva-Latn-33904-2018.imp +101 -0
  141. data/maps/din-kat-Geor-Latn-32707-2010.imp +103 -0
  142. data/maps/din-mar-Deva-Latn-33904-2018.imp +83 -0
  143. data/maps/din-nep-Deva-Latn-33904-2018.imp +110 -0
  144. data/maps/din-pli-Deva-Latn-33904-2018.imp +72 -0
  145. data/maps/din-pra-Deva-Latn-33904-2018.imp +66 -0
  146. data/maps/din-san-Deva-Latn-33904-2018.imp +294 -0
  147. data/maps/din-tam-Taml-Latn-33903-2016.imp +187 -0
  148. data/maps/dos-nep-Deva-Latn-1997.imp +47 -0
  149. data/maps/elot-ell-Grek-Latn-743-1982-tl.imp +399 -0
  150. data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +397 -0
  151. data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +34 -0
  152. data/maps/elot-ell-Grek-Latn-743-2001-ts.imp +178 -0
  153. data/maps/ggg-kat-Geor-Latn-2002.imp +75 -0
  154. data/maps/gki-bel-Cyrl-Latn-1992.imp +44 -0
  155. data/maps/gki-bel-Cyrl-Latn-2000.imp +159 -0
  156. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +179 -0
  157. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.imp +132 -0
  158. data/maps/hk-yue-Hani-Latn-1888.imp +29201 -0
  159. data/maps/icao-bel-Cyrl-Latn-9303.imp +136 -0
  160. data/maps/icao-bul-Cyrl-Latn-9303.imp +127 -0
  161. data/maps/icao-fas-Arab-Latn-9303.imp +112 -0
  162. data/maps/icao-heb-Hebr-Latn-9303.imp +160 -0
  163. data/maps/icao-mkd-Cyrl-Latn-9303.imp +126 -0
  164. data/maps/icao-rus-Cyrl-Latn-9303.imp +126 -0
  165. data/maps/icao-srp-Cyrl-Latn-9303.imp +126 -0
  166. data/maps/icao-ukr-Cyrl-Latn-9303.imp +127 -0
  167. data/maps/iso-ara-Arab-Latn-233-1984.imp +301 -0
  168. data/maps/iso-asm-Beng-Latn-15919-2001.imp +73 -0
  169. data/maps/iso-ben-Beng-Latn-15919-2001.imp +171 -0
  170. data/maps/iso-ell-Grek-Latn-843-1997-t1.imp +365 -0
  171. data/maps/iso-ell-Grek-Latn-843-1997-t2.imp +43 -0
  172. data/maps/iso-guj-Gujr-Latn-15919-2001.imp +214 -0
  173. data/maps/iso-hin-Deva-Latn-15919-2001.imp +73 -0
  174. data/maps/iso-inc-Deva-Latn-15919-2001.imp +61 -0
  175. data/maps/iso-jpn-Hrkt-Latn-3602-1989.imp +59 -0
  176. data/maps/iso-kan-Kana-Latn-15919-2001.imp +212 -0
  177. data/maps/iso-kat-Geor-Latn-9984-1996.imp +103 -0
  178. data/maps/iso-kor-Hang-Latn-1996-method1.imp +140 -0
  179. data/maps/iso-kor-Hang-Latn-1996-method2.imp +132 -0
  180. data/maps/iso-mal-Mlym-Latn-15919-2001.imp +276 -0
  181. data/maps/iso-mar-Deva-Latn-15919-2001.imp +68 -0
  182. data/maps/iso-nep-Deva-Latn-15919-2001.imp +75 -0
  183. data/maps/iso-ori-Orya-Latn-15919-2001.imp +188 -0
  184. data/maps/iso-pan-Guru-Latn-15919-2001.imp +217 -0
  185. data/maps/iso-pli-Beng-Latn-15919-2001.imp +66 -0
  186. data/maps/iso-pli-Deva-Latn-15919-2001.imp +68 -0
  187. data/maps/iso-pli-Sinh-Latn-15919-2001.imp +211 -0
  188. data/maps/iso-pli-Thai-Latn-15919-2001.imp +47 -0
  189. data/maps/iso-pra-Deva-Latn-15919-2001.imp +60 -0
  190. data/maps/iso-prs-Arab-Latn-233-3-1999.imp +352 -0
  191. data/maps/iso-rus-Cyrl-Latn-9-1995.imp +279 -0
  192. data/maps/iso-san-Deva-Latn-15919-2001.imp +215 -0
  193. data/maps/iso-tam-Taml-Latn-15919-2001.imp +153 -0
  194. data/maps/iso-tel-Telu-Latn-15919-2001.imp +214 -0
  195. data/maps/iso-tha-Thai-Latn-11940-1998.imp +114 -0
  196. data/maps/kp-kor-Hang-Latn-2002.imp +540 -0
  197. data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +29005 -0
  198. data/maps/masm-mon-Cyrl-Latn-5217-2012.imp +136 -0
  199. data/maps/masm-mon-Latn-Cyrl-5217-2012.imp +162 -0
  200. data/maps/mext-jpn-Hrkt-Latn-1954.imp +403 -0
  201. data/maps/moct-kor-Hang-Latn-2000.imp +475 -0
  202. data/maps/mofa-jpn-Hrkt-Latn-1989.imp +484 -0
  203. data/maps/mv-div-Thaa-Latn-1987.imp +144 -0
  204. data/maps/mvd-bel-Cyrl-Latn-2008.imp +224 -0
  205. data/maps/mvd-bel-Cyrl-Latn-2010.imp +64 -0
  206. data/maps/mvd-rus-Cyrl-Latn-2008.imp +110 -0
  207. data/maps/mvd-rus-Cyrl-Latn-2010.imp +40 -0
  208. data/maps/odni-ara-Arab-Latn-2004.imp +106 -0
  209. data/maps/odni-ara-Arab-Latn-2015.imp +281 -0
  210. data/maps/odni-aze-Cyrl-Latn-2015.imp +158 -0
  211. data/maps/odni-bel-Cyrl-Latn-2015.imp +138 -0
  212. data/maps/odni-bul-Cyrl-Latn-2005.imp +90 -0
  213. data/maps/odni-bul-Cyrl-Latn-2015.imp +103 -0
  214. data/maps/odni-che-Cyrl-Latn-2015.imp +165 -0
  215. data/maps/odni-fas-Arab-Latn-2004.imp +268 -0
  216. data/maps/odni-fas-Arab-Latn-2015.imp +398 -0
  217. data/maps/odni-hin-Deva-Latn-2004.imp +180 -0
  218. data/maps/odni-hin-Deva-Latn-2015.imp +256 -0
  219. data/maps/odni-kat-Geor-Latn-2015.imp +76 -0
  220. data/maps/odni-kaz-Cyrl-Latn-2015.imp +164 -0
  221. data/maps/odni-kir-Cyrl-Latn-2015.imp +149 -0
  222. data/maps/odni-kor-Hang-Latn-2015.imp +307 -0
  223. data/maps/odni-mkd-Cyrl-Latn-2005.imp +28 -0
  224. data/maps/odni-mkd-Cyrl-Latn-2015.imp +124 -0
  225. data/maps/odni-prs-Arab-Latn-2004.imp +120 -0
  226. data/maps/odni-prs-Arab-Latn-2015.imp +225 -0
  227. data/maps/odni-pus-Arab-Latn-2011.imp +327 -0
  228. data/maps/odni-rus-Cyrl-Latn-2015.imp +79 -0
  229. data/maps/odni-srp-Cyrl-Latn-2005.imp +35 -0
  230. data/maps/odni-srp-Cyrl-Latn-2015.imp +130 -0
  231. data/maps/odni-tat-Cyrl-Latn-2015.imp +157 -0
  232. data/maps/odni-tgk-Cyrl-Latn-2015.imp +161 -0
  233. data/maps/odni-tuk-Cyrl-Latn-2015.imp +159 -0
  234. data/maps/odni-uig-Cyrl-Latn-2015.imp +151 -0
  235. data/maps/odni-ukr-Cyrl-Latn-2015.imp +136 -0
  236. data/maps/odni-urd-Arab-Latn-2015.imp +220 -0
  237. data/maps/odni-uzb-Cyrl-Latn-2015.imp +165 -0
  238. data/maps/sac-zho-Hans-Latn-1979.imp +20940 -0
  239. data/maps/sasm-mon-Mong-Latn-general-1978.imp +294 -0
  240. data/maps/sasm-mon-Mong-Latn-phonetic-1978.imp +261 -0
  241. data/maps/ses-ara-Arab-Latn-1930.imp +225 -0
  242. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.imp +171 -0
  243. data/maps/ua-ukr-Cyrl-Latn-1996.imp +149 -0
  244. data/maps/ua-ukr-Cyrl-Latn-2007.imp +69 -0
  245. data/maps/ua-ukr-Cyrl-Latn-2010.imp +128 -0
  246. data/maps/un-amh-Ethi-Latn-2016.imp +483 -0
  247. data/maps/un-ara-Arab-Latn-1971.imp +137 -0
  248. data/maps/un-ara-Arab-Latn-1972.imp +155 -0
  249. data/maps/un-ara-Arab-Latn-2017.imp +375 -0
  250. data/maps/un-asm-Beng-Latn-1972.imp +188 -0
  251. data/maps/un-bel-Cyrl-Latn-2007.imp +78 -0
  252. data/maps/un-ben-Beng-Latn-2016.imp +516 -0
  253. data/maps/un-ell-Grek-Latn-1987-phonetic.imp +437 -0
  254. data/maps/un-ell-Grek-Latn-1987-tl.imp +27 -0
  255. data/maps/un-ell-Grek-Latn-1987-ts.imp +269 -0
  256. data/maps/un-guj-Gujr-Latn-1972.imp +196 -0
  257. data/maps/un-hin-Deva-Latn-2016.imp +356 -0
  258. data/maps/un-kan-Kana-Latn-2016.imp +214 -0
  259. data/maps/un-mal-Mlym-Latn-1972.imp +215 -0
  260. data/maps/un-mar-Deva-Latn-2016.imp +96 -0
  261. data/maps/un-mon-Mong-Latn-general-2013.imp +170 -0
  262. data/maps/un-mon-Mong-Latn-phonetic-2013.imp +170 -0
  263. data/maps/un-nep-Deva-Latn-1972.imp +295 -0
  264. data/maps/un-nep-Deva-Latn-2013.imp +62 -0
  265. data/maps/un-ori-Orya-Latn-1972.imp +208 -0
  266. data/maps/un-pan-Guru-Latn-1972.imp +321 -0
  267. data/maps/un-prs-Arab-Latn-1967.imp +214 -0
  268. data/maps/un-rus-Cyrl-Latn-1987.imp +96 -0
  269. data/maps/un-sin-Sinh-Latn-1972.imp +193 -0
  270. data/maps/un-tam-Taml-Latn-1972.imp +173 -0
  271. data/maps/un-tel-Telu-Latn-1972.imp +229 -0
  272. data/maps/un-ukr-Cyrl-Latn-1998.imp +58 -0
  273. data/maps/un-ukr-Cyrl-Latn-2012.imp +95 -0
  274. data/maps/un-urd-Arab-Latn-1972.imp +290 -0
  275. data/maps/var-amh-Ethi-Latn-eae-2003.imp +414 -0
  276. data/maps/var-gez-Ethi-Latn-eae-2003.imp +54 -0
  277. data/maps/var-hin-Deva-Latn-hunterian-1872.imp +212 -0
  278. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.imp +399 -0
  279. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.imp +382 -0
  280. data/maps/var-kor-Hang-Hang-jamo.imp +11196 -0
  281. data/maps/var-kor-Hang-Latn-mr-1939.imp +574 -0
  282. data/maps/var-kor-Kore-Hang-2013.imp +59764 -0
  283. data/maps/var-kor-Kore-Latn-mr-1939.imp +36 -0
  284. data/maps/var-mar-Deva-Latn-hunterian-1872.imp +39 -0
  285. data/maps/var-mon-Mong-Latn-1930.imp +101 -0
  286. data/maps/var-mon-Mong-Latn-lessing.imp +181 -0
  287. data/maps/var-mon-Mong-Latn-vpmc.imp +182 -0
  288. data/maps/var-pra-Deva-Latn-iast-1912.imp +36 -0
  289. data/maps/var-san-Deva-Latn-iast-1912.imp +147 -0
  290. data/maps/var-zho-Hani-Latn-wd-1979.imp +27549 -0
  291. metadata +335 -0
@@ -0,0 +1,140 @@
1
+ metadata {
2
+ authority_id: iso
3
+ id: 1996-method1
4
+ language: iso-639-2:kor
5
+ source_script: Hang
6
+ destination_script: Latn
7
+ name: ISO/TR 11941:1996 Information and documentation — Transliteration of Korean script into Latin characters
8
+ url: https://www.iso.org/standard/20564.html
9
+ creation_date: 1996
10
+ adoption_date: ""
11
+ description: |
12
+ Establishes a system for the transliteration of the characters of Korean script into Latin characters.
13
+ Intended to provide a means for international communication of written documents.
14
+
15
+ notes: []
16
+ }
17
+
18
+ tests {
19
+ # Tests from https://www.eki.ee/wgrs/rom2_ko.pdf
20
+ test "꽃이", "kkoch'i" # Bad OCR
21
+ test "강에", "kang'e"
22
+ test "앉아라", "anc'ara"
23
+ test "아까", "a'kka"
24
+ test "흰떡", "hyin'tteok"
25
+ test "유쾌하다", "yu'khwaehata"
26
+
27
+ # Tests from https://github.com/interscript/interscript/files/5249245/ISO-TR-11941-1996.pdf
28
+ test "애기", "aeki"
29
+ test "방", "pang"
30
+ test "아이", "a'i"
31
+ test "고양이", "ko'yang'i"
32
+ test "굽이", "kup'i"
33
+ test "밖에", "pakk'e"
34
+ test "박게", "pakke"
35
+ test "바께", "pa'kke"
36
+ test "간게", "kanke"
37
+ test "안자라", "ancara"
38
+ test "오빠", "o'ppa"
39
+ test "어찌", "eo'cci"
40
+ test "아씨", "a'ssi"
41
+ test "애타다", "ae'thata"
42
+ test "아프다", "a'pheuta"
43
+ test "기차다", "ki'chata"
44
+ test "동녘에", "tongnyeokh'e"
45
+ test "같이", "kath'i"
46
+ test "앞에", "aph'e"
47
+ test "꽃에", "kkoch'e"
48
+ }
49
+
50
+ dependency "var-kor", import: true
51
+ dependency "var-kor-Hang-Hang-jamo", as: hangjamo
52
+
53
+ stage {
54
+ run map.hangjamo.stage.main
55
+
56
+ # Marks A, B, C
57
+ sub "ᄋ", "", not_before: jamo # Word initially
58
+ sub "ᄋ", "'" # See notes 2, 3 and 4.
59
+ sub "ᆼ", "ng" # At the end of a syllable.
60
+
61
+ # Note 4: add apostrophe before 5 double consonants at initial position
62
+ # unless start of the word
63
+ sub none, "'", before: jamo, after: double_cons_jamo
64
+ # Note 4: (only method 1) same but with 4 aspirated
65
+ sub none, "'", before: jamo, after: aspirated_cons_jamo
66
+
67
+ # These rules may be executed in parallel for performance gains
68
+ parallel {
69
+ # Consonants differing between method1 and method2
70
+ sub any("ᄀᆨ"), "k"
71
+ sub any("ᄏᆿ"), "kh"
72
+ sub any("ᄁᆩ"), "kk"
73
+ sub any("ᄃᆮ"), "t"
74
+ sub any("ᄐᇀ"), "th"
75
+ sub any("ᄄퟍ"), "tt"
76
+ sub any("ᄇᆸ"), "p"
77
+ sub any("ᄑᇁ"), "ph"
78
+ sub any("ᄈퟦ"), "pp"
79
+ sub any("ᄌᆽ"), "c"
80
+ sub any("ᄎᆾ"), "ch"
81
+ sub any("ᄍퟹ"), "cc"
82
+ # End
83
+
84
+ # Composite differing consonants (cons. https://en.wikipedia.org/wiki/ISO/TR_11941 )
85
+ sub "ᆪ", "ks"
86
+ sub "ꥤ", "rk" # D. R at the beginning of a syllable
87
+ sub "ᆰ", "lk"
88
+ sub "ᆴ", "lth"
89
+ sub "ꥩ", "rp" # D. R at the beginning of a syllable
90
+ sub "ᆲ", "lp"
91
+ sub "ᆵ", "lph"
92
+ sub any("ᅜᆬ"), "nc"
93
+ sub any("ᄡᆹ"), "ps"
94
+ # End
95
+
96
+ # Other consonants
97
+ sub any("ᄉᆺ"), "s"
98
+ sub any("ᄊᆻ"), "ss"
99
+ sub any("ᄒᇂ"), "h"
100
+ sub any("ᄂᆫ"), "n"
101
+ sub "ᄅ", "r" # D. R at the beginning of a syllable.
102
+ sub "ᆯ", "l"
103
+ sub any("ᄆᆷ"), "m"
104
+ # End
105
+
106
+ # Other composite consonants (cons. https://en.wikipedia.org/wiki/ISO/TR_11941 )
107
+ sub "ꥬ", "rs" # D. R at the beginning of a syllable
108
+ sub "ᆳ", "ls"
109
+ sub "ꥨ", "rm" # D. R at the beginning of a syllable
110
+ sub "ᆱ", "lm"
111
+ sub "ᄚ", "rh" # D. R at the beginning of a syllable
112
+ sub "ᆶ", "lh"
113
+ sub any("ᅝᆭ"), "nh"
114
+ # End
115
+
116
+ # Vowels
117
+ sub "ᅡ", "a"
118
+ sub "ᅥ", "eo"
119
+ sub "ᅩ", "o"
120
+ sub "ᅮ", "u"
121
+ sub "ᅳ", "eu"
122
+ sub "ᅵ", "i"
123
+ sub "ᅢ", "ae"
124
+ sub "ᅦ", "e"
125
+ sub "ᅬ", "oe"
126
+ sub "ᅣ", "ya"
127
+ sub "ᅧ", "yeo"
128
+ sub "ᅭ", "yo"
129
+ sub "ᅲ", "yu"
130
+ sub "ᅤ", "yae"
131
+ sub "ᅨ", "ye"
132
+ sub "ᅪ", "wa"
133
+ sub "ᅯ", "weo"
134
+ sub "ᅱ", "wi"
135
+ sub "ᅫ", "wae"
136
+ sub "ᅰ", "we"
137
+ sub "ᅴ", "yi"
138
+ # End
139
+ }
140
+ }
@@ -0,0 +1,132 @@
1
+ metadata {
2
+ authority_id: iso
3
+ id: 1996-method2
4
+ language: iso-639-2:kor
5
+ source_script: Hang
6
+ destination_script: Latn
7
+ name: "ISO/TR 11941:1996 Information and documentation — Transliteration of Korean script into Latin characters"
8
+ url: https://www.iso.org/standard/20564.html
9
+ creation_date: 1996
10
+ adoption_date:
11
+ description: Establishes a system for the transliteration of the characters of Korean script into Latin characters. Intended to provide a means for international communication of written documents.
12
+
13
+ notes: ""
14
+ }
15
+
16
+ tests {
17
+ # Tests from https://www.eki.ee/wgrs/rom2_ko.pdf
18
+ test "꽃이", "ggoc'i" # Bad OCR
19
+ test "강에", "gang'e"
20
+ test "앉아라", "anj'ara"
21
+ test "아까", "a'gga"
22
+ test "흰떡", "hyin'ddeog"
23
+ #- source: "유쾌하다" not present in method2
24
+ # expected: "yu'khwaehata"
25
+ # Tests from https://github.com/interscript/interscript/files/5249245/ISO-TR-11941-1996.pdf
26
+ test "애기", "aegi"
27
+ test "방", "bang"
28
+ test "아이", "a'i"
29
+ test "고양이", "go'yang'i"
30
+ test "굽이", "gub'i"
31
+ test "밖에", "bagg'e"
32
+ test "박게", "bagge"
33
+ test "바께", "ba'gge"
34
+ test "간게", "gange"
35
+ test "안자라", "anjara"
36
+ test "오빠", "o'bba"
37
+ test "어찌", "eo'jji"
38
+ test "아씨", "a'ssi"
39
+ }
40
+
41
+ dependency "var-kor", import: true
42
+ dependency "var-kor-Hang-Hang-jamo", as: hangjamo
43
+
44
+
45
+ stage {
46
+ run map.hangjamo.stage.main
47
+
48
+ # Marks A, B, C
49
+ sub "ᄋ", "", not_before: jamo # Word initially
50
+ sub "ᄋ", "'" # See notes 2, 3 and 4.
51
+ sub "ᆼ", "ng" # At the end of a syllable.
52
+
53
+ # Note 4: add apostrophe before 5 double consonants at initial position
54
+ # unless start of the word
55
+ sub none, "'", before: jamo, after: double_cons_jamo
56
+ # Note 4: (method 1 only) same rule for the 4 aspirated consonants; left disabled in method 2
57
+ #- pattern: "(?<=\\p{Hangul})([ᄏᄐᄑᄎ])"
58
+ # result: "'\\1"
59
+
60
+ parallel {
61
+ # Consonants differing between method1 and method2
62
+ sub any("ᄀᆨ"), "g"
63
+ sub any("ᄏᆿ"), "k"
64
+ sub any("ᄁᆩ"), "gg"
65
+ sub any("ᄃᆮ"), "d"
66
+ sub any("ᄐᇀ"), "t"
67
+ sub any("ᄄퟍ"), "dd"
68
+ sub any("ᄇᆸ"), "b"
69
+ sub any("ᄑᇁ"), "p"
70
+ sub any("ᄈퟦ"), "bb"
71
+ sub any("ᄌᆽ"), "j"
72
+ sub any("ᄎᆾ"), "c"
73
+ sub any("ᄍퟹ"), "jj"
74
+ # End
75
+
76
+ # Composite differing consonants (cons. https://en.wikipedia.org/wiki/ISO/TR_11941 )
77
+ sub any("ᆪ"), "gs"
78
+ sub any("ꥤ"), "rg" # D. R at the beginning of a syllable
79
+ sub any("ᆰ"), "lg"
80
+ sub any("ᆴ"), "lt"
81
+ sub any("ꥩ"), "rb" # D. R at the beginning of a syllable
82
+ sub any("ᆲ"), "lb"
83
+ sub any("ᆵ"), "lp"
84
+ sub any("ᅜᆬ"), "nj"
85
+ sub any("ᄡᆹ"), "bs"
86
+ # End
87
+
88
+ # Other consonants
89
+ sub any("ᄉᆺ"), "s"
90
+ sub any("ᄊᆻ"), "ss"
91
+ sub any("ᄒᇂ"), "h"
92
+ sub any("ᄂᆫ"), "n"
93
+ sub any("ᄅ"), "r" # D. R at the beginning of a syllable.
94
+ sub any("ᆯ"), "l"
95
+ sub any("ᄆᆷ"), "m"
96
+ # End
97
+
98
+ # Other composite consonants (cons. https://en.wikipedia.org/wiki/ISO/TR_11941 )
99
+ sub any("ꥬ"), "rs" # D. R at the beginning of a syllable
100
+ sub any("ᆳ"), "ls"
101
+ sub any("ꥨ"), "rm" # D. R at the beginning of a syllable
102
+ sub any("ᆱ"), "lm"
103
+ sub any("ᄚ"), "rh" # D. R at the beginning of a syllable
104
+ sub any("ᆶ"), "lh"
105
+ sub any("ᅝᆭ"), "nh"
106
+ # End
107
+
108
+ # Vowels
109
+ sub "ᅡ", "a"
110
+ sub "ᅥ", "eo"
111
+ sub "ᅩ", "o"
112
+ sub "ᅮ", "u"
113
+ sub "ᅳ", "eu"
114
+ sub "ᅵ", "i"
115
+ sub "ᅢ", "ae"
116
+ sub "ᅦ", "e"
117
+ sub "ᅬ", "oe"
118
+ sub "ᅣ", "ya"
119
+ sub "ᅧ", "yeo"
120
+ sub "ᅭ", "yo"
121
+ sub "ᅲ", "yu"
122
+ sub "ᅤ", "yae"
123
+ sub "ᅨ", "ye"
124
+ sub "ᅪ", "wa"
125
+ sub "ᅯ", "weo"
126
+ sub "ᅱ", "wi"
127
+ sub "ᅫ", "wae"
128
+ sub "ᅰ", "we"
129
+ sub "ᅴ", "yi"
130
+ # End
131
+ }
132
+ }
@@ -0,0 +1,276 @@
1
+ metadata {
2
+ authority_id: iso
3
+ id: 15919-2001
4
+ language: iso-639-2:mal
5
+ source_script: Mlym
6
+ destination_script: Latn
7
+ name: "Information and documentation — Transliteration of Devanagari and related Indic scripts into Latin characters"
8
+ url: https://www.chatranjali.fr/Scripts/Standards/ISO15919.pdf
9
+ creation_date: 2001
10
+ adoption_date: 2001
11
+ description: |
12
+ Script conversion is often required for documents such as historical and literary texts, geographical texts (including
13
+ maps and atlases), bibliographies, catalogues, lists and passports (and other identification documents).
14
+
15
+ Text in Devanagari script or other Indic scripts sometimes needs to be shown in Latin script, where users, or
16
+ equipment that they are using, cannot read or write the text
17
+
18
+ This International Standard applies to transliteration of Devanagari, and to Indic scripts related to Devanagari,
19
+ independent of the period in which it is or was used.
20
+
21
+ notes:
22
+
23
+ - All transliterations made using this International Standard shall be case-insensitive.
24
+ - Inherent a with a consonant shall always be transliterated.
25
+ - Malayalam anusvara final in a word shall be transliterated as m .
26
+ - candrabindu shall be transliterated as m̐
27
+ - When m̐, ṃ or ṁ are associated with a vowel, they shall be placed after the vowel. When m̐ is associated
28
+ with a semivowel, it shall be placed before the semivowel.
29
+ - Latin punctuation signs and Hindu-Arabic numerals shall remain unchanged in transliteration.
30
+ Indic punctuation is outside the scope of this International Standard.
31
+ - The Vedic accent Udatta shall be transliterated as an acute accent over the transliterated vowel, and the
32
+ independent Svarita as a grave accent over the transliterated vowel. In the case of the digraphs ai, au, the accent
33
+ shall be attached to the second vowel.
34
+ - |
35
+ A colon: before a Latin character shall be used to resolve ambiguity. Some normative cases are as
36
+ follows.
37
+ - :’ for avagraha in modern text. (The apostrophe in modern text remains unchanged in accordance with previous rule.
38
+ - Pure consonant ( cillŭ form) in Malayalam script, other than r/ṟ (ർ), before a consonant, as in n:na formed with a
39
+ pure consonant (not the ligature nna). Medial ൕ in Malayalam text shall be treated as a pure consonant ( cillŭ
40
+ form).
41
+ - If a character in an Indic script is defined in such a way as to be equivalent to another character in any
42
+ script, where the second character has a transliteration in this International Standard, then the first character shall
43
+ be transliterated in the same way as the second character.
44
+ - When the half-nasal in Telugu script is used for modern nasalization in writing Hindi or
45
+ any other language, it shall be transliterated as a tilde above the transliterated vowel. In the case of the digraphs ai,
46
+ au, the tilde shall be attached to the second vowel
47
+ - Where it is desired to show the Vedic accent Anudatta, it should be transliterated as an underscore. In the case of
48
+ the digraphs ai, au, both Latin vowels should be underscored.
49
+ Where word boundaries are not shown in the original text (as happens commonly in Sanskrit) and a word ends in a
50
+ consonant, the transliteration should show word division by a space; but when phonological processes result in two
51
+ words sharing a common vowel, no attempt should be made to separate them. This will require a good knowledge
52
+ of the language in question.
53
+ - In Malayalam text, ് acts as the mātrā for ŭ when final in a word, except when it removes the inherent vowel of a single
54
+ consonant.
55
+ - The ambiguous pure consonant r/ṟ (ർ) in Malayalam script shall be transliterated into r when combined
56
+ with another consonant; when it is final in a word it shall be transliterated as ṟ in Malayalam language.
57
+ }
58
+
59
+ tests {
60
+ test "സ്വപ്നയ്ക്കൊപ്പം ഹോട്ടലിൽ മന്ത്രിപുത്രൻ, ചിത്രങ്ങൾ; ൪ കോടി കമ്മിഷനിലും പങ്കുപറ്റി", "svapnaykkaeāppam haōṭṭalai:la mantraipautra:ṇa, caitraṅṅa:ḷa; 4 kaōṭai kammaiṣanailaum paṅkaupaṟṟai"
61
+ test "വിവാദങ്ങളിൽ മാപ്പില്ല, ആദ്യമായി ഐപിഎൽ കമന്ററിക്കില്ലാതെ മ‍ഞ്ജരേക്കര്‍; പുറത്ത് തന്നെ", "vaivaādaṅṅaḷai:la maāppailla, ādyamaāyai aipaie:la kamanṟaṟaikkaillaātae mañjaraēkkaraŭ; pauṟattaŭ tannae"
62
+ test "പരമാവധി ഊറ്റിയെടുത്തു; എല്ലാം കഴിഞ്ഞ് ഉപേക്ഷിച്ചു: വിങ്ങലോടെ റംസിയുടെ സഹോദരി", "paramaāvadhai ūṟṟaiyaeṭauttau; ellaām kaḻaiññaŭ upaēkṣaiccau: vaiṅṅalaōṭae ṟaṁsaiyauṭae sahaōdarai"
63
+ test "വഴിനീളെ രോഷം; യൂത്ത്‌ കോണ്‍ഗ്രസുകാരന്റെ കയ്യൊടിഞ്ഞു, കൈവീശികാട്ടി ജലീൽ", "vaḻainaīḷae raōṣam; yaūttaŭ kaōṇaŭgrasaukaāranṟae kayyaoṭaiññau, kaaivaīśaikaāṭṭai jalaī:la"
64
+ test "‘വികൃതിപ്പയ്യനാ’യിരുന്ന കോലി മിന്നും താരമായത് ഇന്ത്യൻ ക്രിക്കറ്റിന്റെ ഗുണം: അക്തർ", "‘vaikaṛtaippayyanaā’yairaunna kaōlai mainnaum taāramaāyataŭ intya:ṇa kraikkaṟṟainṟae gauṇam: aktaṟ"
65
+ test "ലോകത്തിനു വാക്സീൻ വേണമെങ്കിൽ ഈ നഗരം കനിയണം; തലയുയർത്തി ഇന്ത്യ", "laōkattainau vaāksaī:ṇa vaēṇamaeṅkai:la ī nagaram kanaiyaṇam; talayauyarttai intya"
66
+ test "‘അദ്ദേഹം ഒരു മകളെപ്പോലെ എന്നെ കേട്ടു’: ഗവർണറെ കണ്ട് കങ്കണ റനൗട്ട്", "‘addaēham orau makaḷaeppaōlae ennae kaēṭṭau’: gavarṇaṟae kaṇṭaŭ kaṅkaṇa ṟanaṭṭaŭ"
67
+ test "‘എല്ലാം ഫെയ്‌സ്ബുക്കില്‍ പറയുമെന്നു ജലീല്‍; കനത്ത സുരക്ഷയില്‍ യാത്ര, കരിങ്കൊടി", "‘ellaām phaeyaŭsbaukkailaŭ paṟayaumaennau jalaīlaŭ; kanatta saurakṣayailaŭ yaātra, karaiṅkaoṭai"
68
+ test "ഏറ്റവും ചെറുപ്പം ജോയി; ജയലക്ഷ്മി, ദീപ്തി, ജ്യോതി; പട്ടികയിലെ നിര ഇങ്ങനെ‌", "ēṟṟavaum caeṟauppam jaōyai; jayalakṣmai, daīptai, jyaōtai; paṭṭaikayailae naira iṅṅanae"
69
+ test "പരിശോധന കുറച്ച് കേരളം; കോവിഡ് ടെസ്റ്റ് പോസിറ്റിവിറ്റി നിരക്ക് എറ്റവും ഉയർന്ന്; ആശങ്ക‌", "paraiśaōdhana kauṟaccaŭ kaēraḷam; kaōvaid̂aŭ ṭaesṟṟaŭ paōsaiṟṟaivaiṟṟai nairakkaŭ eṟṟavaum uyarnnaŭ; āśaṅka"
70
+ test "൱", "100"
71
+ }
72
+
73
+ stage {
74
+
75
+ # RULES
76
+ sub "\u0D4D", "ŭ", after: boundary, before: ""
77
+ sub "\u0D02", "m", after: boundary, before: ""
78
+ sub "\u0D7C", "ṟ", after: boundary, before: ""
79
+
80
+
81
+ # CHARACTERS
82
+ parallel {
83
+ sub "അ", "a"
84
+ sub "ആ", "ā"
85
+ sub "ഇ", "i"
86
+ sub "ഈ", "ī"
87
+ sub "ഉ", "u"
88
+ sub "ഊ", "ū"
89
+ sub "ഋ", "ṛ"
90
+ sub "ൠ", "ṝ"
91
+ sub "ഌ", "ḷ"
92
+ sub "ൡ", "ḹ"
93
+
94
+ sub "എ", "e"
95
+ sub "ഏ", "ē"
96
+ sub "ഐ", "ai"
97
+
98
+ sub "ഒ", "o"
99
+ sub "ഓ", "ō"
100
+ sub "ഔ", "au"
101
+
102
+ # Consonants
103
+ # Gutturals
104
+ sub "ക", "ka"
105
+ sub "ഖ", "kha"
106
+ sub "ഗ", "ga"
107
+ sub "ഘ", "gha"
108
+ sub "ങ", "ṅa"
109
+
110
+ # Palatals
111
+ sub "ച", "ca"
112
+ sub "ഛ", "cha"
113
+ sub "ജ", "ja"
114
+ sub "ഝ", "jha"
115
+ sub "ഞ", "ña"
116
+
117
+ # Cerebrals
118
+ sub "ട", "ṭa"
119
+ sub "ഠ", "ṭha"
120
+ sub "ഡ", "d̂a"
121
+ sub "ഢ", "ḍha"
122
+ sub "ണ", "ṇa"
123
+
124
+ # Dentals
125
+ sub "ത", "ta"
126
+ sub "ഥ", "tha"
127
+ sub "ദ", "da"
128
+ sub "ധ", "dha"
129
+ sub "ന", "na"
130
+
131
+ # Labials
132
+ sub "പ", "pa"
133
+ sub "ഫ", "pha"
134
+ sub "ബ", "ba"
135
+ sub "ഭ", "bha"
136
+ sub "മ", "ma"
137
+
138
+ # Semivowels
139
+ sub "യ", "ya"
140
+ sub "ര", "ra"
141
+ sub "ർ", "r"
142
+ sub "റ", "ṟa"
143
+ sub "ല", "la"
144
+ sub "ള", "ḷa"
145
+ sub "ഴ", "ḻa"
146
+ # Sibilants
147
+ sub "വ", "va"
148
+ sub "ശ", "śa"
149
+ sub "ഷ", "ṣa"
150
+ sub "സ", "sa"
151
+ sub "ഩ", "ṉa"
152
+
153
+
154
+ # Aspirate
155
+ sub "ഹ", "ha"
156
+
157
+ # Visarga
158
+ sub "ഃ", "ḥ"
159
+
160
+ # Anusvāra
161
+ sub "ം", "ṁ"
162
+
163
+
164
+ # Avagraha
165
+ sub "ഽ", ":’" # (apostrophe)
166
+
167
+ # Medials # Needed for connecting consonants
168
+
169
+ sub "ാ", "ā"
170
+ sub "ി", "i"
171
+ sub "ീ", "ī"
172
+ sub "ു", "u"
173
+ sub "ൂ", "ū"
174
+ sub "്", "ŭ"
175
+ sub "ൃ", "ṛ"
176
+ sub "ൄ", "ṝ"
177
+ sub "\u0D62", "ḷ"
178
+ sub "\u0D63", "ḹ"
179
+ sub "െ", "e"
180
+ sub "േ", "ē"
181
+ sub "ൈ", "ai"
182
+ sub "ൊ", "o"
183
+ sub "ോ", "ō"
184
+ sub "ൌ", "au"
185
+
186
+ sub "्", ""
187
+ sub "़", ""
188
+ sub "ൗ", ""
189
+ sub "‍", "" # no need for zero with joiner
190
+ sub "‌", "" # no need for zero with non joiner
191
+
192
+
193
+ # For rule 12
194
+ # Gutturals
195
+ sub "ക്", "k"
196
+ sub "ഖ്", "kh"
197
+ sub "ഗ്", "g"
198
+ sub "ഘ്", "gh"
199
+ sub "ങ്", "ṅ"
200
+
201
+ # Palatals
202
+ sub "ച്", "c"
203
+ sub "ഛ്", "ch"
204
+ sub "ജ്", "j"
205
+ sub "ഝ്", "jh"
206
+ sub "ഞ്", "ñ"
207
+
208
+ # Cerebrals
209
+ sub "ട്", "ṭ"
210
+ sub "ഠ്", "ṭh"
211
+ sub "ഡ്", "d̂"
212
+ sub "ഢ്", "ḍh"
213
+ sub "ണ്", "ṇ"
214
+
215
+ # Dentals
216
+ sub "ത്", "t"
217
+ sub "ഥ്", "th"
218
+ sub "ദ്", "d"
219
+ sub "ധ്", "dh"
220
+ sub "ന്", "n"
221
+
222
+ # Labials
223
+ sub "പ്", "p"
224
+ sub "ഫ്", "ph"
225
+ sub "ബ്", "b"
226
+ sub "ഭ്", "bh"
227
+ sub "മ്", "m"
228
+
229
+ # Semivowels
230
+ sub "യ്", "y"
231
+ sub "ര്", "r"
232
+ sub "റ്", "ṟ"
233
+ sub "ല്", "l"
234
+ sub "ള്", "ḷ"
235
+ sub "ഴ്", "ḻ"
236
+ # Sibilants
237
+ sub "വ്", "v"
238
+ sub "ശ്", "ś"
239
+ sub "ഷ്", "ṣ"
240
+ sub "സ്", "s"
241
+ sub "ഩ്", "ṉ"
242
+
243
+
244
+ # Aspirate
245
+ sub "ഹ്", "h"
246
+
247
+
248
+ # numbers
249
+
250
+ sub "൦", "0"
251
+ sub "൧", "1"
252
+ sub "൨", "2"
253
+ sub "൩", "3"
254
+ sub "൪", "4"
255
+ sub "൫", "5"
256
+ sub "൬", "6"
257
+ sub "൭", "7"
258
+ sub "൮", "8"
259
+ sub "൯", "9"
260
+ sub "൰", "10"
261
+ sub "൱", "100"
262
+ sub "൲", "1000"
263
+
264
+
265
+ # Rule 8(II)
266
+
267
+ sub "ൺ", ":na"
268
+ sub "ൻ", ":ṇa"
269
+ sub "ൽ", ":la"
270
+ sub "ൾ", ":ḷa"
271
+ sub "ൿ", ":ka"
272
+ }
273
+
274
+ compose
275
+ }
276
+