interscript-maps 2.0.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (291) hide show
  1. checksums.yaml +7 -0
  2. data/README.adoc +28 -0
  3. data/interscript-maps.gemspec +28 -0
  4. data/interscript-maps.yaml +235 -0
  5. data/libs/posix.iml +11 -0
  6. data/libs/unicode.iml +13 -0
  7. data/libs/var-Cyrl.iml +7 -0
  8. data/libs/var-kor.iml +17 -0
  9. data/maps-staging/royin-tha-Thai-Latn-1939-generic.imp +98 -0
  10. data/maps-staging/royin-tha-Thai-Latn-1968.imp +156 -0
  11. data/maps-staging/royin-tha-Thai-Latn-1999-chained.imp +161 -0
  12. data/maps-staging/royin-tha-Thai-Latn-1999.imp +78 -0
  13. data/maps-staging/var-tha-Thai-Thai-phonemic.imp +53 -0
  14. data/maps-staging/var-tha-Thai-Zsym-ipa.imp +273 -0
  15. data/maps/acadsin-zho-Hani-Latn-2002.imp +27515 -0
  16. data/maps/alalc-amh-Ethi-Latn-1997.imp +392 -0
  17. data/maps/alalc-amh-Ethi-Latn-2011.imp +85 -0
  18. data/maps/alalc-ara-Arab-Latn-1997.imp +1171 -0
  19. data/maps/alalc-asm-Deva-Latn-1997.imp +214 -0
  20. data/maps/alalc-asm-Deva-Latn-2012.imp +53 -0
  21. data/maps/alalc-aze-Arab-Latn-1997.imp +321 -0
  22. data/maps/alalc-aze-Cyrl-Latn-1997.imp +101 -0
  23. data/maps/alalc-bel-Cyrl-Latn-1997.imp +118 -0
  24. data/maps/alalc-ben-Beng-Latn-1997.imp +225 -0
  25. data/maps/alalc-ben-Beng-Latn-2017.imp +135 -0
  26. data/maps/alalc-bul-Cyrl-Latn-1997.imp +110 -0
  27. data/maps/alalc-div-Thaa-Latn-1997.imp +171 -0
  28. data/maps/alalc-ell-Grek-Latn-1997.imp +381 -0
  29. data/maps/alalc-ell-Grek-Latn-2010.imp +382 -0
  30. data/maps/alalc-guj-Gujr-Latn-1997.imp +223 -0
  31. data/maps/alalc-guj-Gujr-Latn-2011.imp +57 -0
  32. data/maps/alalc-hin-Deva-Latn-1997.imp +248 -0
  33. data/maps/alalc-hin-Deva-Latn-2011.imp +63 -0
  34. data/maps/alalc-kan-Kana-Latn-1997.imp +233 -0
  35. data/maps/alalc-kan-Kana-Latn-2011.imp +58 -0
  36. data/maps/alalc-kat-Geok-Latn-1997.imp +109 -0
  37. data/maps/alalc-kat-Geor-Latn-1997.imp +104 -0
  38. data/maps/alalc-kor-Hang-Latn-1997.imp +68 -0
  39. data/maps/alalc-mal-Mlym-Latn-1997.imp +260 -0
  40. data/maps/alalc-mal-Mlym-Latn-2012.imp +65 -0
  41. data/maps/alalc-mar-Deva-Latn-1997.imp +178 -0
  42. data/maps/alalc-mar-Deva-Latn-2011.imp +51 -0
  43. data/maps/alalc-mkd-Cyrl-Latn-1997.imp +125 -0
  44. data/maps/alalc-mkd-Cyrl-Latn-2013.imp +113 -0
  45. data/maps/alalc-mon-Cyrl-Latn-1997.imp +161 -0
  46. data/maps/alalc-ori-Orya-Latn-1997.imp +234 -0
  47. data/maps/alalc-ori-Orya-Latn-2011.imp +59 -0
  48. data/maps/alalc-pan-Guru-Latn-1997.imp +241 -0
  49. data/maps/alalc-pan-Guru-Latn-2011.imp +71 -0
  50. data/maps/alalc-per-Arab-Latn-1997.imp +318 -0
  51. data/maps/alalc-pli-Deva-Latn-2012.imp +140 -0
  52. data/maps/alalc-pra-Deva-Latn-2012.imp +52 -0
  53. data/maps/alalc-rus-Cyrl-Latn-1997.imp +165 -0
  54. data/maps/alalc-rus-Cyrl-Latn-2012.imp +107 -0
  55. data/maps/alalc-san-Deva-Latn-2012.imp +207 -0
  56. data/maps/alalc-sin-Sinh-Latn-1997.imp +246 -0
  57. data/maps/alalc-sin-Sinh-Latn-2011.imp +63 -0
  58. data/maps/alalc-srp-Cyrl-Latn-1997.imp +124 -0
  59. data/maps/alalc-srp-Cyrl-Latn-2013.imp +115 -0
  60. data/maps/alalc-tam-Taml-Latn-1997.imp +52 -0
  61. data/maps/alalc-tam-Taml-Latn-2011.imp +49 -0
  62. data/maps/alalc-tel-Telu-Latn-1997.imp +237 -0
  63. data/maps/alalc-tel-Telu-Latn-2011.imp +58 -0
  64. data/maps/alalc-ukr-Cyrl-Latn-1997.imp +123 -0
  65. data/maps/alalc-ukr-Cyrl-Latn-2011.imp +32 -0
  66. data/maps/apcbg-bul-Cyrl-Latn-1995.imp +194 -0
  67. data/maps/az-aze-Cyrl-Latn-1939.imp +105 -0
  68. data/maps/az-aze-Cyrl-Latn-1958.imp +50 -0
  69. data/maps/bas-rus-Cyrl-Latn-2017-bss.imp +160 -0
  70. data/maps/bas-rus-Cyrl-Latn-2017-oss.imp +165 -0
  71. data/maps/bgn-jpn-Hrkt-Latn-1962.imp +288 -0
  72. data/maps/bgn-kor-Hang-Latn-1943.imp +31 -0
  73. data/maps/bgn-kor-Kore-Latn-1943.imp +33 -0
  74. data/maps/bgna-bul-Cyrl-Latn-2006.imp +119 -0
  75. data/maps/bgna-bul-Cyrl-Latn-2009.imp +119 -0
  76. data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +393 -0
  77. data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +472 -0
  78. data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +125 -0
  79. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +111 -0
  80. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.imp +169 -0
  81. data/maps/bgnpcgn-bal-Arab-Latn-2008.imp +296 -0
  82. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.imp +200 -0
  83. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +137 -0
  84. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +38 -0
  85. data/maps/bgnpcgn-che-Cyrl-Latn-2008.imp +176 -0
  86. data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +56 -0
  87. data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +90 -0
  88. data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +71 -0
  89. data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +443 -0
  90. data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +269 -0
  91. data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +41 -0
  92. data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +28 -0
  93. data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +111 -0
  94. data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +42 -0
  95. data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +32 -0
  96. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +191 -0
  97. data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +116 -0
  98. data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +43 -0
  99. data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +193 -0
  100. data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +170 -0
  101. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +177 -0
  102. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +40 -0
  103. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +41 -0
  104. data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +240 -0
  105. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +132 -0
  106. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +174 -0
  107. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +168 -0
  108. data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +208 -0
  109. data/maps/bgnpcgn-per-Arab-Latn-1958.imp +312 -0
  110. data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +552 -0
  111. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +445 -0
  112. data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +289 -0
  113. data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +165 -0
  114. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +133 -0
  115. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +195 -0
  116. data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +48 -0
  117. data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +55 -0
  118. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +146 -0
  119. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +185 -0
  120. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +188 -0
  121. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +136 -0
  122. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +88 -0
  123. data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +333 -0
  124. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +145 -0
  125. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +74 -0
  126. data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +7463 -0
  127. data/maps/bis-asm-Beng-Latn-13194-1991.imp +154 -0
  128. data/maps/bis-ben-Beng-Latn-13194-1991.imp +151 -0
  129. data/maps/bis-dev-Deva-Latn-13194-1991.imp +178 -0
  130. data/maps/bis-guj-Gujr-Latn-13194-1991.imp +172 -0
  131. data/maps/bis-kan-Kana-Latn-13194-1991.imp +166 -0
  132. data/maps/bis-mlm-Mlym-Latn-13194-1991.imp +170 -0
  133. data/maps/bis-ori-Orya-Latn-13194-1991.imp +168 -0
  134. data/maps/bis-pnj-Guru-Latn-13194-1991.imp +169 -0
  135. data/maps/bis-tel-Telu-Latn-13194-1991.imp +165 -0
  136. data/maps/bis-tml-Taml-Latn-13194-1991.imp +149 -0
  137. data/maps/by-bel-Cyrl-Latn-1998.imp +123 -0
  138. data/maps/by-bel-Cyrl-Latn-2007.imp +77 -0
  139. data/maps/din-grc-Grek-Latn-31634-2011-t1.imp +627 -0
  140. data/maps/din-hin-Deva-Latn-33904-2018.imp +101 -0
  141. data/maps/din-kat-Geor-Latn-32707-2010.imp +103 -0
  142. data/maps/din-mar-Deva-Latn-33904-2018.imp +83 -0
  143. data/maps/din-nep-Deva-Latn-33904-2018.imp +110 -0
  144. data/maps/din-pli-Deva-Latn-33904-2018.imp +72 -0
  145. data/maps/din-pra-Deva-Latn-33904-2018.imp +66 -0
  146. data/maps/din-san-Deva-Latn-33904-2018.imp +294 -0
  147. data/maps/din-tam-Taml-Latn-33903-2016.imp +187 -0
  148. data/maps/dos-nep-Deva-Latn-1997.imp +47 -0
  149. data/maps/elot-ell-Grek-Latn-743-1982-tl.imp +399 -0
  150. data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +397 -0
  151. data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +34 -0
  152. data/maps/elot-ell-Grek-Latn-743-2001-ts.imp +178 -0
  153. data/maps/ggg-kat-Geor-Latn-2002.imp +75 -0
  154. data/maps/gki-bel-Cyrl-Latn-1992.imp +44 -0
  155. data/maps/gki-bel-Cyrl-Latn-2000.imp +159 -0
  156. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +179 -0
  157. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.imp +132 -0
  158. data/maps/hk-yue-Hani-Latn-1888.imp +29201 -0
  159. data/maps/icao-bel-Cyrl-Latn-9303.imp +136 -0
  160. data/maps/icao-bul-Cyrl-Latn-9303.imp +127 -0
  161. data/maps/icao-fas-Arab-Latn-9303.imp +112 -0
  162. data/maps/icao-heb-Hebr-Latn-9303.imp +160 -0
  163. data/maps/icao-mkd-Cyrl-Latn-9303.imp +126 -0
  164. data/maps/icao-rus-Cyrl-Latn-9303.imp +126 -0
  165. data/maps/icao-srp-Cyrl-Latn-9303.imp +126 -0
  166. data/maps/icao-ukr-Cyrl-Latn-9303.imp +127 -0
  167. data/maps/iso-ara-Arab-Latn-233-1984.imp +301 -0
  168. data/maps/iso-asm-Beng-Latn-15919-2001.imp +73 -0
  169. data/maps/iso-ben-Beng-Latn-15919-2001.imp +171 -0
  170. data/maps/iso-ell-Grek-Latn-843-1997-t1.imp +365 -0
  171. data/maps/iso-ell-Grek-Latn-843-1997-t2.imp +43 -0
  172. data/maps/iso-guj-Gujr-Latn-15919-2001.imp +214 -0
  173. data/maps/iso-hin-Deva-Latn-15919-2001.imp +73 -0
  174. data/maps/iso-inc-Deva-Latn-15919-2001.imp +61 -0
  175. data/maps/iso-jpn-Hrkt-Latn-3602-1989.imp +59 -0
  176. data/maps/iso-kan-Kana-Latn-15919-2001.imp +212 -0
  177. data/maps/iso-kat-Geor-Latn-9984-1996.imp +103 -0
  178. data/maps/iso-kor-Hang-Latn-1996-method1.imp +140 -0
  179. data/maps/iso-kor-Hang-Latn-1996-method2.imp +132 -0
  180. data/maps/iso-mal-Mlym-Latn-15919-2001.imp +276 -0
  181. data/maps/iso-mar-Deva-Latn-15919-2001.imp +68 -0
  182. data/maps/iso-nep-Deva-Latn-15919-2001.imp +75 -0
  183. data/maps/iso-ori-Orya-Latn-15919-2001.imp +188 -0
  184. data/maps/iso-pan-Guru-Latn-15919-2001.imp +217 -0
  185. data/maps/iso-pli-Beng-Latn-15919-2001.imp +66 -0
  186. data/maps/iso-pli-Deva-Latn-15919-2001.imp +68 -0
  187. data/maps/iso-pli-Sinh-Latn-15919-2001.imp +211 -0
  188. data/maps/iso-pli-Thai-Latn-15919-2001.imp +47 -0
  189. data/maps/iso-pra-Deva-Latn-15919-2001.imp +60 -0
  190. data/maps/iso-prs-Arab-Latn-233-3-1999.imp +352 -0
  191. data/maps/iso-rus-Cyrl-Latn-9-1995.imp +279 -0
  192. data/maps/iso-san-Deva-Latn-15919-2001.imp +215 -0
  193. data/maps/iso-tam-Taml-Latn-15919-2001.imp +153 -0
  194. data/maps/iso-tel-Telu-Latn-15919-2001.imp +214 -0
  195. data/maps/iso-tha-Thai-Latn-11940-1998.imp +114 -0
  196. data/maps/kp-kor-Hang-Latn-2002.imp +540 -0
  197. data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +29005 -0
  198. data/maps/masm-mon-Cyrl-Latn-5217-2012.imp +136 -0
  199. data/maps/masm-mon-Latn-Cyrl-5217-2012.imp +162 -0
  200. data/maps/mext-jpn-Hrkt-Latn-1954.imp +403 -0
  201. data/maps/moct-kor-Hang-Latn-2000.imp +475 -0
  202. data/maps/mofa-jpn-Hrkt-Latn-1989.imp +484 -0
  203. data/maps/mv-div-Thaa-Latn-1987.imp +144 -0
  204. data/maps/mvd-bel-Cyrl-Latn-2008.imp +224 -0
  205. data/maps/mvd-bel-Cyrl-Latn-2010.imp +64 -0
  206. data/maps/mvd-rus-Cyrl-Latn-2008.imp +110 -0
  207. data/maps/mvd-rus-Cyrl-Latn-2010.imp +40 -0
  208. data/maps/odni-ara-Arab-Latn-2004.imp +106 -0
  209. data/maps/odni-ara-Arab-Latn-2015.imp +281 -0
  210. data/maps/odni-aze-Cyrl-Latn-2015.imp +158 -0
  211. data/maps/odni-bel-Cyrl-Latn-2015.imp +138 -0
  212. data/maps/odni-bul-Cyrl-Latn-2005.imp +90 -0
  213. data/maps/odni-bul-Cyrl-Latn-2015.imp +103 -0
  214. data/maps/odni-che-Cyrl-Latn-2015.imp +165 -0
  215. data/maps/odni-fas-Arab-Latn-2004.imp +268 -0
  216. data/maps/odni-fas-Arab-Latn-2015.imp +398 -0
  217. data/maps/odni-hin-Deva-Latn-2004.imp +180 -0
  218. data/maps/odni-hin-Deva-Latn-2015.imp +256 -0
  219. data/maps/odni-kat-Geor-Latn-2015.imp +76 -0
  220. data/maps/odni-kaz-Cyrl-Latn-2015.imp +164 -0
  221. data/maps/odni-kir-Cyrl-Latn-2015.imp +149 -0
  222. data/maps/odni-kor-Hang-Latn-2015.imp +307 -0
  223. data/maps/odni-mkd-Cyrl-Latn-2005.imp +28 -0
  224. data/maps/odni-mkd-Cyrl-Latn-2015.imp +124 -0
  225. data/maps/odni-prs-Arab-Latn-2004.imp +120 -0
  226. data/maps/odni-prs-Arab-Latn-2015.imp +225 -0
  227. data/maps/odni-pus-Arab-Latn-2011.imp +327 -0
  228. data/maps/odni-rus-Cyrl-Latn-2015.imp +79 -0
  229. data/maps/odni-srp-Cyrl-Latn-2005.imp +35 -0
  230. data/maps/odni-srp-Cyrl-Latn-2015.imp +130 -0
  231. data/maps/odni-tat-Cyrl-Latn-2015.imp +157 -0
  232. data/maps/odni-tgk-Cyrl-Latn-2015.imp +161 -0
  233. data/maps/odni-tuk-Cyrl-Latn-2015.imp +159 -0
  234. data/maps/odni-uig-Cyrl-Latn-2015.imp +151 -0
  235. data/maps/odni-ukr-Cyrl-Latn-2015.imp +136 -0
  236. data/maps/odni-urd-Arab-Latn-2015.imp +220 -0
  237. data/maps/odni-uzb-Cyrl-Latn-2015.imp +165 -0
  238. data/maps/sac-zho-Hans-Latn-1979.imp +20940 -0
  239. data/maps/sasm-mon-Mong-Latn-general-1978.imp +294 -0
  240. data/maps/sasm-mon-Mong-Latn-phonetic-1978.imp +261 -0
  241. data/maps/ses-ara-Arab-Latn-1930.imp +225 -0
  242. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.imp +171 -0
  243. data/maps/ua-ukr-Cyrl-Latn-1996.imp +149 -0
  244. data/maps/ua-ukr-Cyrl-Latn-2007.imp +69 -0
  245. data/maps/ua-ukr-Cyrl-Latn-2010.imp +128 -0
  246. data/maps/un-amh-Ethi-Latn-2016.imp +483 -0
  247. data/maps/un-ara-Arab-Latn-1971.imp +137 -0
  248. data/maps/un-ara-Arab-Latn-1972.imp +155 -0
  249. data/maps/un-ara-Arab-Latn-2017.imp +375 -0
  250. data/maps/un-asm-Beng-Latn-1972.imp +188 -0
  251. data/maps/un-bel-Cyrl-Latn-2007.imp +78 -0
  252. data/maps/un-ben-Beng-Latn-2016.imp +516 -0
  253. data/maps/un-ell-Grek-Latn-1987-phonetic.imp +437 -0
  254. data/maps/un-ell-Grek-Latn-1987-tl.imp +27 -0
  255. data/maps/un-ell-Grek-Latn-1987-ts.imp +269 -0
  256. data/maps/un-guj-Gujr-Latn-1972.imp +196 -0
  257. data/maps/un-hin-Deva-Latn-2016.imp +356 -0
  258. data/maps/un-kan-Kana-Latn-2016.imp +214 -0
  259. data/maps/un-mal-Mlym-Latn-1972.imp +215 -0
  260. data/maps/un-mar-Deva-Latn-2016.imp +96 -0
  261. data/maps/un-mon-Mong-Latn-general-2013.imp +170 -0
  262. data/maps/un-mon-Mong-Latn-phonetic-2013.imp +170 -0
  263. data/maps/un-nep-Deva-Latn-1972.imp +295 -0
  264. data/maps/un-nep-Deva-Latn-2013.imp +62 -0
  265. data/maps/un-ori-Orya-Latn-1972.imp +208 -0
  266. data/maps/un-pan-Guru-Latn-1972.imp +321 -0
  267. data/maps/un-prs-Arab-Latn-1967.imp +214 -0
  268. data/maps/un-rus-Cyrl-Latn-1987.imp +96 -0
  269. data/maps/un-sin-Sinh-Latn-1972.imp +193 -0
  270. data/maps/un-tam-Taml-Latn-1972.imp +173 -0
  271. data/maps/un-tel-Telu-Latn-1972.imp +229 -0
  272. data/maps/un-ukr-Cyrl-Latn-1998.imp +58 -0
  273. data/maps/un-ukr-Cyrl-Latn-2012.imp +95 -0
  274. data/maps/un-urd-Arab-Latn-1972.imp +290 -0
  275. data/maps/var-amh-Ethi-Latn-eae-2003.imp +414 -0
  276. data/maps/var-gez-Ethi-Latn-eae-2003.imp +54 -0
  277. data/maps/var-hin-Deva-Latn-hunterian-1872.imp +212 -0
  278. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.imp +399 -0
  279. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.imp +382 -0
  280. data/maps/var-kor-Hang-Hang-jamo.imp +11196 -0
  281. data/maps/var-kor-Hang-Latn-mr-1939.imp +574 -0
  282. data/maps/var-kor-Kore-Hang-2013.imp +59764 -0
  283. data/maps/var-kor-Kore-Latn-mr-1939.imp +36 -0
  284. data/maps/var-mar-Deva-Latn-hunterian-1872.imp +39 -0
  285. data/maps/var-mon-Mong-Latn-1930.imp +101 -0
  286. data/maps/var-mon-Mong-Latn-lessing.imp +181 -0
  287. data/maps/var-mon-Mong-Latn-vpmc.imp +182 -0
  288. data/maps/var-pra-Deva-Latn-iast-1912.imp +36 -0
  289. data/maps/var-san-Deva-Latn-iast-1912.imp +147 -0
  290. data/maps/var-zho-Hani-Latn-wd-1979.imp +27549 -0
  291. metadata +335 -0
@@ -0,0 +1,214 @@
1
+ metadata {
2
+ authority_id: un
3
+ id: 1967
4
+ language: iso-639-3:prs
5
+ # prs stands for Dari (https://iso639-3.sil.org/code/prs)
6
+ source_script: Arab
7
+ destination_script: Latn
8
+ name: Persian UN 1967
9
+ url: http://www.eki.ee/wgrs/v2_2/rom1_fa.htm
10
+ creation_date: 1967
11
+ confirmation_date: 01-2003
12
+ description: |
13
+ The United Nations recommended system was approved in 1967 (
14
+ I/13), based on the official system adopted by Iran and
15
+ published in its English version as Transliteration of
16
+ Farsi Geographic Names to Latin Alphabet (September 1966).
17
+ The romanization table was also published as an annex to
18
+ the Toponymic Guidelines for the Islamic Republic of Iran
19
+ in 2000 (Toponymic Guidelines for map and other editors –
20
+ Revised edition 1998. Submitted by the Islamic Republic of
21
+ Iran. UNGEGN, 20th session. New York, 17-28 January 2000,
22
+ Working Paper No. 41.).
23
+
24
+ The system is used in the Islamic Republic of Iran and in
25
+ international cartographic products.
26
+
27
+ Persian (Farsi) uses the Perso-Arabic script that is
28
+ written from right to left. The Persian script usually
29
+ omits vowel points and diacritical marks from writing which
30
+ makes it difficult to obtain uniform results in the
31
+ romanization of Persian. The romanization is generally
32
+ reversible though there are some ambiguous letter
33
+ sequences (kh, sh, th, zh) which also may represent the
34
+ romanized values of two Persian characters in addition to
35
+ the respective single ones.
36
+
37
+
38
+ notes:
39
+ - A Word-initially.
40
+ - B Not romanized; marks absence of the vowel.
41
+ - C Doubling of the consonant letter.
42
+ - D After a consonant (excl. -ah).
43
+ - E After a vowel (see also note 2).
44
+ - 1-The adjectival ending of Arabic origin -يه in Persian is
45
+ romanized -īyeh. In romanizing the definite article the
46
+ same rules of assimilation of consonants are applied as in
47
+ Arabic, e.g. زين الدين Zeyn od Dīn.
48
+
49
+ - 2-The relational suffix (eẕāfeh) -e is usually not
50
+ expressed in Persian writing after a consonant. After final
51
+ ا or و it is written with ى, e.g. پاى آب Pā-ye Āb. After
52
+ final ى and ه it is expressed by writing hamzeh over the
53
+ character دهانۀ ممبر Dahāneh-ye Mambar.
54
+
55
+ - 3-To point Persian vowels two systems are in use that are
56
+ separated by a column in the table. The first system is a
57
+ Persian one while the other adheres to the Arabic
58
+ tradition. In normal spelling vowel points are not used.
59
+ }
60
+
61
+ tests {
62
+ test "اَنجِيرة", "Anjīrah"
63
+ test "اِيْوَانِي", "Eyvānī"
64
+ test "آبَادَان", "Ābādān"
65
+ test "قُرآن", "Qor’ān"
66
+ test "مَآب", "Ma’āb"
67
+ test "مُحَمَّد", "Moḩammad"
68
+ test "كُوهِ مَرغُوب", "Kūh-e Marghūb"
69
+ test "پَايِ آب", "Pā-ye Āb"
70
+ test "جُويِ آس", "Jū-ye Ās"
71
+ test "دَهَانِهٴ مَمبَر", "Dahāneh-ye Mambar"
72
+ test "سَلَسِيٴ بُذُرگ", "Salasī-ye Boz̄org"
73
+ test "ذُو الفَقَار", "Z̄ū ol Faqār"
74
+ }
75
+
76
+ stage {
77
+ # CHARACTERS
78
+ parallel {
79
+
80
+ sub "\u064e", "a" # َ fatha
81
+ sub "\u064e", "", after: "\u0629" # َ fatha followed by ta' marboota
82
+ sub "\u064e", "", after: "a" + any("ht") # َ fatha followed by ta' marboota, handling different order of conversion
83
+ sub "\u0650", "e" # ِ kasra
84
+ sub "\u064f", "o" # ُ damma
85
+ sub "\u0652", "" # ْ sokoon, see Note B
86
+
87
+ sub "\u064e\u0627", "ā" # ـَا fatha followed by ا
88
+ sub "\u064e\u0649", "á" # ـَى fatha followed by ى which is ا not ي
89
+ sub boundary + "\u0622", "ā" # آ NOTE A
90
+ sub "\u0622", "’ā" # آ
91
+ sub "\u0650\u064a", "ī" # ـِي kasra followed by ي
92
+ sub "\u064f\u0648", "ū" # ـُو damma followed by و
93
+ sub any("\u064e\u0650") + "\u064a\u0652", "ey" # ـَيْ
94
+ sub any("\u064e\u064f") + "\u0648\u0652", "ow" # ـَوْ
95
+ sub "\u0621", "’" # ء
96
+ sub "\u2013", "–"
97
+ sub "\u2013" + any("\u0649\u064a") + "\u0647", "-īyeh"
98
+ sub any("\u0654\u0674"), "-e" # ٴ ezafeh
99
+ sub any("\u0654\u0674"), "-ye", before: any("\u064a\u0647") # ٴ ezafeh
100
+ sub "\u0650" + boundary, "-e" # ِ kasra
101
+ sub any("\u064a\u06cc") + "\u0650" + boundary, "-ye" # ِ kasra
102
+
103
+ # NOTE C: consonant + tashdid (U+0651) doubles the romanized consonant, digraphs (kh, sh, gh) included
104
+ sub "\u0628\u0651", "bb" # ب
105
+ sub "\u062a\u0651", "tt" # ت
106
+ sub "\u062b\u0651", "s̄s̄" # ث
107
+ sub "\u062c\u0651", "jj" # ج
108
+ sub "\u062d\u0651", "ḩḩ" # ح
109
+ sub "\u062e\u0651", "khkh" # خ
110
+ sub "\u062f\u0651", "dd" # د
111
+ sub "\u0630\u0651", "z̄z̄" # ذ
112
+ sub "\u0631\u0651", "rr" # ر
113
+ sub "\u0632\u0651", "zz" # ز
114
+ sub "\u0633\u0651", "ss" # س
115
+ sub "\u0634\u0651", "shsh" # ش
116
+ sub "\u0635\u0651", "şş" # ص
117
+ sub "\u0636\u0651", "ẕẕ" # ض
118
+ sub "\u0637\u0651", "ţţ" # ط
119
+ sub "\u0638\u0651", "z̧z̧" # ظ
120
+ sub "\u063a\u0651", "ghgh" # غ
121
+ sub "\u0641\u0651", "ff" # ف
122
+ sub "\u0642\u0651", "qq" # ق
123
+ sub "\u0643\u0651", "kk" # ك
124
+ sub "\u0644\u0651", "ll" # ل
125
+ sub "\u0645\u0651", "mm" # م
126
+ sub "\u0646\u0651", "nn" # ن
127
+ sub "\u0647\u0651", "hh" # ه
128
+ sub "\u0648\u0651", "vv" # و
129
+ sub "\u064a\u0651", "yy" # ي
130
+
131
+ # NOTE 1
132
+ # Sun letters
133
+ sub boundary + "\u0627\u0644\u062a", "ot t" # الت
134
+ sub boundary + "\u0627\u0644\u062b", "os̄ s̄" # الث
135
+ sub boundary + "\u0627\u0644\u062f", "od d" # الد
136
+ sub boundary + "\u0627\u0644\u0630", "oz̄ z̄" # الذ
137
+ sub boundary + "\u0627\u0644\u0631", "or r" # الر
138
+ sub boundary + "\u0627\u0644\u0632", "oz z" # الز
139
+ sub boundary + "\u0627\u0644\u0633", "os s" # الس
140
+ sub boundary + "\u0627\u0644\u0634", "osh sh" # الش
141
+ sub boundary + "\u0627\u0644\u0635", "oş ş" # الص
142
+ sub boundary + "\u0627\u0644\u0636", "oẕ ẕ" # الض
143
+ sub boundary + "\u0627\u0644\u0637", "oţ ţ" # الط
144
+ sub boundary + "\u0627\u0644\u0638", "oz̧ z̧" # الظ
145
+ sub boundary + "\u0627\u0644\u0644", "ol l" # الل
146
+ sub boundary + "\u0627\u0644\u0646", "on n" # الن
147
+
148
+ sub "\u0650\u064a\u0651", "īy" # ـِيَّ
149
+ sub "\u0650\u064a", "iy", after: any("\u064e\u064f") # ـِي kasra followed by ي
150
+
151
+ # ta' marboota
152
+ sub "\u0629", "at" # ة in the middle of the sentence
153
+ sub "\u0629" + line_end, "ah"
154
+ sub "\u0629", "ah", before: boundary + "\u0627\u0644" + any("\u0600".."\u06ff") + any("\u0600".."\u06ff")
155
+ sub "\u0629", "ah", before: boundary + "\u0627\u0644" + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff")
156
+ sub "\u0629", "ah", before: boundary + "\u0627\u0644" + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff")
157
+ sub "\u0629", "ah", before: boundary + "\u0627\u0644" + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff")
158
+ sub "\u0629", "ah", before: boundary + "\u0627\u0644" + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff")
159
+ sub "\u0629", "ah", before: boundary + "\u0627\u0644" + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff")
160
+ sub "\u0629", "ah", before: boundary + "\u0627\u0644" + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff")
161
+ sub "\u0629", "ah", before: boundary + "\u0627\u0644" + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff")
162
+ sub "\u0629", "ah", before: boundary + "\u0627\u0644" + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff")
163
+ sub "\u0629", "ah", before: boundary + "\u0627\u0644" + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff")
164
+ sub "\u0629", "ah", before: boundary + "\u0627\u0644" + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff")
165
+ sub "\u0629", "ah", before: boundary + "\u0627\u0644" + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff") + any("\u0600".."\u06ff")
166
+
167
+ sub boundary + "\u0627\u0644", "al " # ال
168
+ sub space + boundary + "\u0627\u0644", " ol " # ال #special Rule 1
169
+
170
+ sub boundary + "\u0627", "" # ا initial
171
+ sub "\u0627", "ā" # ا medial
172
+ sub "\u0627" + boundary, "ā" # ا final
173
+
174
+ sub "\u0628", "b" # ب
175
+ sub "\u067E", "p" # پ
176
+ sub "\u062A", "t" # ت
177
+ sub "\u062B", "s̄" # ث
178
+ sub "\u062C", "j" # ج
179
+ sub "\u0686", "ch" # ‫چ‬
180
+ sub "\u062D", "ḩ" # ح
181
+ sub "\u062E", "kh" # خ
182
+ sub "\u062F", "d" # د
183
+ sub "\u0630", "z̄" # ذ
184
+ sub "\u0631", "r" # ر
185
+ sub "\u0632", "z" # ز
186
+ sub "\u0698", "zh" # ‫ژ‬
187
+ sub "\u0633", "s" # س
188
+ sub "\u0634", "sh" # ش
189
+ sub "\u0635", "ş" # ص
190
+ sub "\u0636", "ẕ" # ض
191
+ sub "\u0637", "ţ" # ط
192
+ sub "\u0638", "z̧" # ظ
193
+ sub "\u0639", "’" # ع
194
+ sub "\u063A", "gh" # غ
195
+ sub "\u0641", "f" # ف
196
+ sub "\u0642", "q" # ق
197
+ sub "\u0643", "k" # ك
198
+ sub "\u06A9", "k" # ک
199
+ sub "\u06AF", "g" # گ
200
+ sub "\u0644", "l" # ل‫‬
201
+ sub "\u0645", "m" # م
202
+ sub "\u0646", "n" # ن
203
+ sub "\u0648", "v" # و
204
+ sub "\u0647", "h" # ه
205
+ sub "\u0649", "y" # ى alef maksura (U+0649)
206
+ sub "\u064a", "y" # ي
207
+ }
208
+
209
+ # POSTRULES
210
+ sub any("\u0061".."\uFFFF"), upcase, before: boundary, not_before: boundary + any("‘’'-")
211
+
212
+ sub " Al", " al"
213
+ sub " Ol", " ol"
214
+ }
@@ -0,0 +1,96 @@
1
+ metadata {
2
+ authority_id: un
3
+ id: 1987
4
+ language: iso-639-2:rus
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Russian Romanization system
8
+ url: http://www.eki.ee/wgrs/rom1_ru.htm
9
+ creation_date: 1987
10
+ confirmation_date: 2016
11
+ description: |
12
+ The United Nations recommended system was approved in 1987 (V/18),
13
+ based on the official system of the Main Administration of Geodesy and
14
+ Cartography of the former Soviet Union, also known as the GOST 1983
15
+ system (GOST 16876-71). The table was published as an annex to the
16
+ resolution.
17
+
18
+ The system is used in the Russian Federation and increasingly in
19
+ international cartographic products.
20
+
21
+ Russian uses the Cyrillic script which is alphabetic. The
22
+ romanization table is unambiguous and can be applied automatically. The
23
+ system is reversible, although rarely there can be ambiguities.
24
+
25
+ notes:
26
+ - "Cursive forms of some characters might be formed differently: Аа Бб
27
+ Вв Гг Дд Ее Ёё Жж Зз Ии Йй Кк Лл Мм Нн Оо Пп Рр Сс Тт Уу Фф Хх Цц Чч Шш
28
+ Щщ Ъъ Ыы Ьь Ээ Юю Яя."
29
+
30
+ - Fifth United Nations Conference on the Standardization of
31
+ Geographical Names. Montreal, 18–31 August 1987. Vol. I. Report of the
32
+ Conference, pp. 40–41.
33
+ }
34
+
35
+ tests {
36
+ test "Aнaпa", "Anapa"
37
+ test "Бaбушкин", "Babuškin"
38
+ test "Вaвилово", "Vavilovo"
39
+ test "Гaгaрин", "Gagarin"
40
+ test "Дудинкa", "Dudinka"
41
+ test "Елисeeвкa", "Eliseevka"
42
+ test "Ёлкино", "Ëlkino"
43
+ test "Псëл", "Psël"
44
+ test "Жужa", "Žuža"
45
+ test "Звëздный", "Zvëzdnyj"
46
+ test "Идрицa", "Idrica"
47
+ test "Зaрaйск", "Zarajsk"
48
+ test "Кокaнд", "Kokand"
49
+ test "Лaлвaр", "Lalvar"
50
+ test "Мaймaк", "Majmak"
51
+ test "Нeжин", "Nežin"
52
+ test "Обoдoвкa", "Obodovka"
53
+ test "Пaп", "Pap"
54
+ test "Рeбрихa", "Rebriha"
55
+ test "Сaсoвo", "Sasovo"
56
+ test "Тaттa", "Tatta"
57
+ test "Уржум", "Uržum"
58
+ test "Фoфaнoвo", "Fofanovo"
59
+ test "Хoхломa", "Hohloma"
60
+ test "Цвeткoвo", "Cvetkovo"
61
+ test "Чeчeльник", "Čečel’nik"
62
+ test "Шишкинo", "Šiškino"
63
+ test "Щукинo", "Ščukino"
64
+ test "Пoдъячeвo", "Pod”jačevo"
65
+ test "Ыныкчaнский", "Ynykčanskij"
66
+ test "Пaрaньгa", "Paran’ga"
67
+ test "Кaзaнь", "Kazan’"
68
+ test "Щучьe", "Ščuč’e"
69
+ test "Элистa", "Èlista"
70
+ test "Юринo", "Jurino"
71
+ test "Юхнoв", "Juhnov"
72
+ test "Юрюзaнь", "Jurjuzan’"
73
+ test "Ямaл", "Jamal"
74
+ test "Язъявaн", "Jaz”javan"
75
+ test "Яя", "Jaja"
76
+ test "Вязьмa", "Vjaz’ma"
77
+ }
78
+
79
+ dependency "gost-rus-Cyrl-Latn-16876-71-1983", as: cyrllatn
80
+
81
+
82
+ stage {
83
+ # CHARACTERS: only the letters substituted here are handled locally; the text is then passed to the imported map's main stage
84
+ parallel {
85
+ sub "\u042A", "”" # Ъ capital hard sign
86
+ sub "\u042C", "’" # Ь capital soft sign
87
+ sub "\u044A", "”" # ъ small hard sign
88
+ sub "\u044C", "’" # ь small soft sign
89
+ sub "\u042E", "Ju" # Ю
90
+ sub "\u044E", "ju" # ю
91
+ sub "\u042F", "Ja" # Я
92
+ sub "\u044F", "ja" # я
93
+ }
94
+
95
+ run map.cyrllatn.stage.main # main stage of the dependency imported `as: cyrllatn`
96
+ }
@@ -0,0 +1,193 @@
1
+ metadata {
2
+ authority_id: un
3
+ id: 1972
4
+ language: iso-639-2:sin
5
+ source_script: Sinh
6
+ destination_script: Latn
7
+ name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES --Sinhalese Romanization Version 4.0
8
+ url: https://www.eki.ee/wgrs/rom1_ml.htm
9
+ creation_date: 1972
10
+ confirmation_date: 2016
11
+ description: |
12
+ There does not seem to be any national system of romanization for Sinhalese (Sinhala) in Sri Lanka.
13
+
14
+ In 1972, D. N. Sharma prepared a romanization table for Sinhalese (Sinhala) which was published in vol. II
15
+ of the conference report together with the other languages of the Indian group.
16
+
17
+ Sinhalese uses an alphasyllabic script whereby each character represents a syllable rather than one sound.
18
+ Vowels and diphthongs are marked in two ways: as independent characters (used syllable-initially) and in an
19
+ abbreviated form, to denote vowels after consonants.
20
+
21
+
22
+ notes:
23
+ - |
24
+ The character ඇ was romanized as a͝i and the character ඈ as ai in Sharma's table, but there was no romanization for the character ඓ which,
25
+ though rarely used, represents the ai proper of the Indian languages; here the romanization of these characters is given in accordance with the pronunciation.
26
+ - |
27
+ ැ ෑ Exceptions: රැ ræ̆, රෑ ræ.
28
+ - |
29
+ ු Exceptions: කූ kū, ගූ gū, තූ tū, භූ bhū, රූ rū, ශූ shū.
30
+ - |
31
+ ූ Exceptions: කූ kū, ගූ gū, තූ tū, භූ bhū, රූ rū, ශූ shū.
32
+ - |
33
+ ් Marks absence of the inherent vowel. Special forms: ඛ් kh, ඞ් ṅ, ච් ch, ට් ṭ, ඩ් ḍ, ධ් dh, බ් b, ම් m, ව් v.
34
+ - |
35
+ ඛ ඝ ඞ ච ඡ ඣ ඤ ඨ ඪ ථ ධ ඵ භ ශ ෂ These consonants are used only in Sanskrit and Pali loanwords.
36
+ }
37
+
38
+ tests {
39
+ test "ශී‍්‍ර ලංකාවේ කී‍්‍රඩාව ඉතිහාසයේ ඉහළම තැනකට ගේන්න කටයුතු කරනවා", "shīra laṁkāve kīraḍāva itihāsaye ihaḷama tæ̆nakaṭa genna kaṭayutu karanavā"
40
+ test "කොච්චිකඬේ මෝයකට අසල නෑමට ගිය තරුණයෝ ෩ක් මරුට - මිතුරාගේ උපන් දිනය සැමරීමට ඇවිත්", "kŏchchikaඬe moyakaṭa asala næmaṭa giya taruṇayo 3k maruṭa - miturāge upan dinaya sæ̆marīmaṭa æ̆vit"
41
+ test "ලෝක ළමා දිනයදා සිසුන් පිරිසක් කසිප්පු බීලා", "loka ḷamā dinayadā sisun pirisak kasippu bīlā"
42
+ test "කෝටි 16ක හෙරොයින් සමග දන්කොටුවේදී 7ක් දැලේ", "koṭi 16ka hĕrŏyin samaga dankŏṭuvedī 7k dæ̆le"
43
+ test "මිනුවන්ගොඩ පීසීආර් දෙදහසක් සිදුකරයි", "minuvangŏḍa pīsīār dĕdahasak sidukarayi"
44
+ test "පාස්කු ප‍්‍රහාරය වගේම පාස්කු ප්‍රෝඩාව ගැනත් සොයන්න කොමිසමක් පත්කළ යුතුයි - විපක්‍ෂ නායක සජිත් පේ‍්‍රමදාස", "pāsku parahāraya vagema pāsku proḍāva gæ̆nat sŏyanna kŏmisamak patkaḷa yutuyi - vipakṣha nāyaka sajit peramadāsa"
45
+ test "ට‍්‍රම්ප්ගේ සෞඛ්‍යය තීරණාත්මකයි - ට්විටර් හරහා ජනතාව අමතයි", "ṭarampge saukhyaya tīraṇātmakayi - ṭviṭar harahā janatāva amatayi"
46
+ test "පාස්කු දා ප‍්‍රහාරය පිළිබඳ පරීක්‍ෂණවලින් කිසිවකුට අසාධාරණයක් වීමට ඉඩ දෙන්නේ නෑ - අගමැති", "pāsku dā parahāraya piḷibaඳ parīkṣhaṇavalin kisivakuṭa asādhāraṇayak vīmaṭa iḍa dĕnne næ - agamæ̆ti"
47
+ test "දිල්ලි කැපිටල්ස් සහ කෝලිගේ බැංගලෝර් තෙවැනි ජය ලබයි", "dilli kæ̆piṭals saha kolige bæ̆ṁgalor tĕvæ̆ni jaya labayi"
48
+ test "ශ‍්‍රී ලාංකික සම්භවයක් සහිත ප‍්‍රංශයේ පවුලක 5 ක් ඝාතනය කරලා", "sharī lāṁkika sambhavayak sahita paraṁshaye pavulaka 5 k ghātanaya karalā"
49
+ test "පැතිකුදය ඉක්මනින් සුව කරන ප‍්‍රතිකාර", "pæ̆tikudaya ikmanin suva karana paratikāra"
50
+ }
51
+
52
+ aliases {
53
+ def_alias sinh_chars_1, any("\u0dcf\u0dd0\u0dd1\u0dd2\u0dd3\u0dd4\u0dd6\u0dd8\u0df2\u0dd9\u0dda\u0ddb\u0ddc\u0ddd\u0dde\u0dca") # any one abbreviated vowel sign (U+0DCF..U+0DDE, U+0DF2) or U+0DCA, the sign marking absence of the inherent vowel; ඃ and ං are not included
54
+ }
55
+
56
+ stage {
57
+
58
+ # RULES: a consonant followed by a character in sinh_chars_1 (vowel sign or ්) is written without the inherent "a"; the sign itself is converted by the parallel table below. NOTE(review): ඬ and ඳ have no rule here or below, and the tests expect them to pass through unchanged - confirm this is intended.
58
+ sub "ක", "k", after: sinh_chars_1
59
+ sub "ඛ", "kh", after: sinh_chars_1
60
+ sub "ග", "g", after: sinh_chars_1
61
+ sub "ඝ", "gh", after: sinh_chars_1
62
+ sub "ඞ", "ṅ", after: sinh_chars_1
63
+ sub "ච", "ch", after: sinh_chars_1
64
+ sub "ඡ", "chh", after: sinh_chars_1
65
+ sub "ජ", "j", after: sinh_chars_1
66
+ sub "ඣ", "jh", after: sinh_chars_1
67
+ sub "ඤ", "ñ", after: sinh_chars_1
68
+ sub "ට", "ṭ", after: sinh_chars_1
69
+ sub "ඨ", "ṭh", after: sinh_chars_1
70
+ sub "ඩ", "ḍ", after: sinh_chars_1
71
+ sub "ඪ", "ḍh", after: sinh_chars_1
72
+ sub "ණ", "ṇ", after: sinh_chars_1
73
+ sub "ත", "t", after: sinh_chars_1
74
+ sub "ථ", "th", after: sinh_chars_1
75
+ sub "ද", "d", after: sinh_chars_1
76
+ sub "ධ", "dh", after: sinh_chars_1
77
+ sub "න", "n", after: sinh_chars_1
78
+ sub "ප", "p", after: sinh_chars_1
79
+ sub "ඵ", "ph", after: sinh_chars_1
80
+ sub "බ", "b", after: sinh_chars_1
81
+ sub "භ", "bh", after: sinh_chars_1
82
+ sub "ම", "m", after: sinh_chars_1
83
+ sub "ය", "y", after: sinh_chars_1
84
+ sub "ර", "r", after: sinh_chars_1
85
+ sub "ල", "l", after: sinh_chars_1
86
+ sub "ව", "v", after: sinh_chars_1
87
+ sub "ශ", "sh", after: sinh_chars_1
88
+ sub "ෂ", "ṣh", after: sinh_chars_1
89
+ sub "ස", "s", after: sinh_chars_1
90
+ sub "හ", "h", after: sinh_chars_1
91
+ sub "ෆ", "f", after: sinh_chars_1
92
+ sub "ළ", "ḷ", after: sinh_chars_1
94
+
95
+
96
+ # CHARACTERS: substitution table for everything the RULES above did not rewrite; consonants still present here are written with the inherent "a"
96
+ parallel {
97
+ # I. Independent vowel characters
98
+ sub "අ", "a"
99
+ sub "ආ", "ā"
100
+ sub "ඇ", "æ̆"
101
+ sub "ඈ", "æ"
102
+ sub "ඉ", "i"
103
+ sub "ඊ", "ī"
104
+ sub "උ", "u"
105
+ sub "ඌ", "ū"
106
+ sub "ඍ", "ṛ"
107
+ sub "ඎ", "ṝ"
108
+ sub "එ", "ĕ"
109
+ sub "ඒ", "e"
110
+ sub "ඓ", "ai"
111
+ sub "ඔ", "ŏ"
112
+ sub "ඕ", "o"
113
+ sub "ඖ", "au"
114
+
115
+ # II. Abbreviated vowel characters and other symbols
116
+ sub "ා", "ā"
117
+ sub "ැ", "æ̆"
118
+ sub "ෑ", "æ"
119
+ sub "ි", "i"
120
+ sub "ී", "ī"
121
+ sub "ු", "u"
122
+ sub "ූ", "ū"
123
+ sub "ෘ", "ṛ"
124
+ sub "ෲ", "ṝ"
125
+ sub "ෙ", "ĕ"
126
+ sub "ේ", "e"
127
+ sub "ෛ", "ai"
128
+ sub "ො", "ŏ"
129
+ sub "ෝ", "o"
130
+ sub "ෞ", "au"
131
+ sub "ඃ", "ḥ"
132
+ sub "ං", "ṁ"
133
+ sub "්", "" # the sign is dropped; the consonant before it was already written without "a" by the RULES above
134
+
135
+
136
+ # III. Consonant characters (written with the inherent vowel "a")
137
+ sub "ක", "ka"
138
+ sub "ඛ", "kha"
139
+ sub "ග", "ga"
140
+ sub "ඝ", "gha"
141
+ sub "ඞ", "ṅa"
142
+ sub "ච", "cha"
143
+ sub "ඡ", "chha"
144
+ sub "ජ", "ja"
145
+ sub "ඣ", "jha"
146
+ sub "ඤ", "ña"
147
+ sub "ට", "ṭa"
148
+ sub "ඨ", "ṭha"
149
+ sub "ඩ", "ḍa"
150
+ sub "ඪ", "ḍha"
151
+ sub "ණ", "ṇa"
152
+ sub "ත", "ta"
153
+ sub "ථ", "tha"
154
+ sub "ද", "da"
155
+ sub "ධ", "dha"
156
+ sub "න", "na"
157
+ sub "ප", "pa"
158
+ sub "ඵ", "pha"
159
+ sub "බ", "ba"
160
+ sub "භ", "bha"
161
+ sub "ම", "ma"
162
+ sub "ය", "ya"
163
+ sub "ර", "ra"
164
+ sub "ල", "la"
165
+ sub "ව", "va"
166
+ sub "ශ", "sha"
167
+ sub "ෂ", "ṣha"
168
+ sub "ස", "sa"
169
+ sub "හ", "ha"
170
+ sub "ෆ", "fa"
171
+ sub "ළ", "ḷa"
172
+
173
+ # numbers: code points U+0DE6..U+0DEF are mapped to ASCII digits 0..9
174
+ sub "\u0DE6", "0"
175
+ sub "\u0DE7", "1"
176
+ sub "\u0DE8", "2"
177
+ sub "\u0DE9", "3"
178
+ sub "\u0DEA", "4"
179
+ sub "\u0DEB", "5"
180
+ sub "\u0DEC", "6"
181
+ sub "\u0DED", "7"
182
+ sub "\u0DEE", "8"
183
+ sub "\u0DEF", "9"
184
+
185
+
186
+ sub "‍", "" # Used for joining; the invisible character is removed from the output
187
+ sub "‌", "" # Used for non joining; the invisible character is removed from the output
188
+ }
190
+
191
+ compose
192
+ }
193
+