interscript-maps 2.0.5

Sign up to get free protection for your applications and to get access to all the features.
Files changed (291) hide show
  1. checksums.yaml +7 -0
  2. data/README.adoc +28 -0
  3. data/interscript-maps.gemspec +28 -0
  4. data/interscript-maps.yaml +235 -0
  5. data/libs/posix.iml +11 -0
  6. data/libs/unicode.iml +13 -0
  7. data/libs/var-Cyrl.iml +7 -0
  8. data/libs/var-kor.iml +17 -0
  9. data/maps-staging/royin-tha-Thai-Latn-1939-generic.imp +98 -0
  10. data/maps-staging/royin-tha-Thai-Latn-1968.imp +156 -0
  11. data/maps-staging/royin-tha-Thai-Latn-1999-chained.imp +161 -0
  12. data/maps-staging/royin-tha-Thai-Latn-1999.imp +78 -0
  13. data/maps-staging/var-tha-Thai-Thai-phonemic.imp +53 -0
  14. data/maps-staging/var-tha-Thai-Zsym-ipa.imp +273 -0
  15. data/maps/acadsin-zho-Hani-Latn-2002.imp +27515 -0
  16. data/maps/alalc-amh-Ethi-Latn-1997.imp +392 -0
  17. data/maps/alalc-amh-Ethi-Latn-2011.imp +85 -0
  18. data/maps/alalc-ara-Arab-Latn-1997.imp +1171 -0
  19. data/maps/alalc-asm-Deva-Latn-1997.imp +214 -0
  20. data/maps/alalc-asm-Deva-Latn-2012.imp +53 -0
  21. data/maps/alalc-aze-Arab-Latn-1997.imp +321 -0
  22. data/maps/alalc-aze-Cyrl-Latn-1997.imp +101 -0
  23. data/maps/alalc-bel-Cyrl-Latn-1997.imp +118 -0
  24. data/maps/alalc-ben-Beng-Latn-1997.imp +225 -0
  25. data/maps/alalc-ben-Beng-Latn-2017.imp +135 -0
  26. data/maps/alalc-bul-Cyrl-Latn-1997.imp +110 -0
  27. data/maps/alalc-div-Thaa-Latn-1997.imp +171 -0
  28. data/maps/alalc-ell-Grek-Latn-1997.imp +381 -0
  29. data/maps/alalc-ell-Grek-Latn-2010.imp +382 -0
  30. data/maps/alalc-guj-Gujr-Latn-1997.imp +223 -0
  31. data/maps/alalc-guj-Gujr-Latn-2011.imp +57 -0
  32. data/maps/alalc-hin-Deva-Latn-1997.imp +248 -0
  33. data/maps/alalc-hin-Deva-Latn-2011.imp +63 -0
  34. data/maps/alalc-kan-Kana-Latn-1997.imp +233 -0
  35. data/maps/alalc-kan-Kana-Latn-2011.imp +58 -0
  36. data/maps/alalc-kat-Geok-Latn-1997.imp +109 -0
  37. data/maps/alalc-kat-Geor-Latn-1997.imp +104 -0
  38. data/maps/alalc-kor-Hang-Latn-1997.imp +68 -0
  39. data/maps/alalc-mal-Mlym-Latn-1997.imp +260 -0
  40. data/maps/alalc-mal-Mlym-Latn-2012.imp +65 -0
  41. data/maps/alalc-mar-Deva-Latn-1997.imp +178 -0
  42. data/maps/alalc-mar-Deva-Latn-2011.imp +51 -0
  43. data/maps/alalc-mkd-Cyrl-Latn-1997.imp +125 -0
  44. data/maps/alalc-mkd-Cyrl-Latn-2013.imp +113 -0
  45. data/maps/alalc-mon-Cyrl-Latn-1997.imp +161 -0
  46. data/maps/alalc-ori-Orya-Latn-1997.imp +234 -0
  47. data/maps/alalc-ori-Orya-Latn-2011.imp +59 -0
  48. data/maps/alalc-pan-Guru-Latn-1997.imp +241 -0
  49. data/maps/alalc-pan-Guru-Latn-2011.imp +71 -0
  50. data/maps/alalc-per-Arab-Latn-1997.imp +318 -0
  51. data/maps/alalc-pli-Deva-Latn-2012.imp +140 -0
  52. data/maps/alalc-pra-Deva-Latn-2012.imp +52 -0
  53. data/maps/alalc-rus-Cyrl-Latn-1997.imp +165 -0
  54. data/maps/alalc-rus-Cyrl-Latn-2012.imp +107 -0
  55. data/maps/alalc-san-Deva-Latn-2012.imp +207 -0
  56. data/maps/alalc-sin-Sinh-Latn-1997.imp +246 -0
  57. data/maps/alalc-sin-Sinh-Latn-2011.imp +63 -0
  58. data/maps/alalc-srp-Cyrl-Latn-1997.imp +124 -0
  59. data/maps/alalc-srp-Cyrl-Latn-2013.imp +115 -0
  60. data/maps/alalc-tam-Taml-Latn-1997.imp +52 -0
  61. data/maps/alalc-tam-Taml-Latn-2011.imp +49 -0
  62. data/maps/alalc-tel-Telu-Latn-1997.imp +237 -0
  63. data/maps/alalc-tel-Telu-Latn-2011.imp +58 -0
  64. data/maps/alalc-ukr-Cyrl-Latn-1997.imp +123 -0
  65. data/maps/alalc-ukr-Cyrl-Latn-2011.imp +32 -0
  66. data/maps/apcbg-bul-Cyrl-Latn-1995.imp +194 -0
  67. data/maps/az-aze-Cyrl-Latn-1939.imp +105 -0
  68. data/maps/az-aze-Cyrl-Latn-1958.imp +50 -0
  69. data/maps/bas-rus-Cyrl-Latn-2017-bss.imp +160 -0
  70. data/maps/bas-rus-Cyrl-Latn-2017-oss.imp +165 -0
  71. data/maps/bgn-jpn-Hrkt-Latn-1962.imp +288 -0
  72. data/maps/bgn-kor-Hang-Latn-1943.imp +31 -0
  73. data/maps/bgn-kor-Kore-Latn-1943.imp +33 -0
  74. data/maps/bgna-bul-Cyrl-Latn-2006.imp +119 -0
  75. data/maps/bgna-bul-Cyrl-Latn-2009.imp +119 -0
  76. data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +393 -0
  77. data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +472 -0
  78. data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +125 -0
  79. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +111 -0
  80. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.imp +169 -0
  81. data/maps/bgnpcgn-bal-Arab-Latn-2008.imp +296 -0
  82. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.imp +200 -0
  83. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +137 -0
  84. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +38 -0
  85. data/maps/bgnpcgn-che-Cyrl-Latn-2008.imp +176 -0
  86. data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +56 -0
  87. data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +90 -0
  88. data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +71 -0
  89. data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +443 -0
  90. data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +269 -0
  91. data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +41 -0
  92. data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +28 -0
  93. data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +111 -0
  94. data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +42 -0
  95. data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +32 -0
  96. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +191 -0
  97. data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +116 -0
  98. data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +43 -0
  99. data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +193 -0
  100. data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +170 -0
  101. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +177 -0
  102. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +40 -0
  103. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +41 -0
  104. data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +240 -0
  105. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +132 -0
  106. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +174 -0
  107. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +168 -0
  108. data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +208 -0
  109. data/maps/bgnpcgn-per-Arab-Latn-1958.imp +312 -0
  110. data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +552 -0
  111. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +445 -0
  112. data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +289 -0
  113. data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +165 -0
  114. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +133 -0
  115. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +195 -0
  116. data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +48 -0
  117. data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +55 -0
  118. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +146 -0
  119. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +185 -0
  120. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +188 -0
  121. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +136 -0
  122. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +88 -0
  123. data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +333 -0
  124. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +145 -0
  125. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +74 -0
  126. data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +7463 -0
  127. data/maps/bis-asm-Beng-Latn-13194-1991.imp +154 -0
  128. data/maps/bis-ben-Beng-Latn-13194-1991.imp +151 -0
  129. data/maps/bis-dev-Deva-Latn-13194-1991.imp +178 -0
  130. data/maps/bis-guj-Gujr-Latn-13194-1991.imp +172 -0
  131. data/maps/bis-kan-Kana-Latn-13194-1991.imp +166 -0
  132. data/maps/bis-mlm-Mlym-Latn-13194-1991.imp +170 -0
  133. data/maps/bis-ori-Orya-Latn-13194-1991.imp +168 -0
  134. data/maps/bis-pnj-Guru-Latn-13194-1991.imp +169 -0
  135. data/maps/bis-tel-Telu-Latn-13194-1991.imp +165 -0
  136. data/maps/bis-tml-Taml-Latn-13194-1991.imp +149 -0
  137. data/maps/by-bel-Cyrl-Latn-1998.imp +123 -0
  138. data/maps/by-bel-Cyrl-Latn-2007.imp +77 -0
  139. data/maps/din-grc-Grek-Latn-31634-2011-t1.imp +627 -0
  140. data/maps/din-hin-Deva-Latn-33904-2018.imp +101 -0
  141. data/maps/din-kat-Geor-Latn-32707-2010.imp +103 -0
  142. data/maps/din-mar-Deva-Latn-33904-2018.imp +83 -0
  143. data/maps/din-nep-Deva-Latn-33904-2018.imp +110 -0
  144. data/maps/din-pli-Deva-Latn-33904-2018.imp +72 -0
  145. data/maps/din-pra-Deva-Latn-33904-2018.imp +66 -0
  146. data/maps/din-san-Deva-Latn-33904-2018.imp +294 -0
  147. data/maps/din-tam-Taml-Latn-33903-2016.imp +187 -0
  148. data/maps/dos-nep-Deva-Latn-1997.imp +47 -0
  149. data/maps/elot-ell-Grek-Latn-743-1982-tl.imp +399 -0
  150. data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +397 -0
  151. data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +34 -0
  152. data/maps/elot-ell-Grek-Latn-743-2001-ts.imp +178 -0
  153. data/maps/ggg-kat-Geor-Latn-2002.imp +75 -0
  154. data/maps/gki-bel-Cyrl-Latn-1992.imp +44 -0
  155. data/maps/gki-bel-Cyrl-Latn-2000.imp +159 -0
  156. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +179 -0
  157. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.imp +132 -0
  158. data/maps/hk-yue-Hani-Latn-1888.imp +29201 -0
  159. data/maps/icao-bel-Cyrl-Latn-9303.imp +136 -0
  160. data/maps/icao-bul-Cyrl-Latn-9303.imp +127 -0
  161. data/maps/icao-fas-Arab-Latn-9303.imp +112 -0
  162. data/maps/icao-heb-Hebr-Latn-9303.imp +160 -0
  163. data/maps/icao-mkd-Cyrl-Latn-9303.imp +126 -0
  164. data/maps/icao-rus-Cyrl-Latn-9303.imp +126 -0
  165. data/maps/icao-srp-Cyrl-Latn-9303.imp +126 -0
  166. data/maps/icao-ukr-Cyrl-Latn-9303.imp +127 -0
  167. data/maps/iso-ara-Arab-Latn-233-1984.imp +301 -0
  168. data/maps/iso-asm-Beng-Latn-15919-2001.imp +73 -0
  169. data/maps/iso-ben-Beng-Latn-15919-2001.imp +171 -0
  170. data/maps/iso-ell-Grek-Latn-843-1997-t1.imp +365 -0
  171. data/maps/iso-ell-Grek-Latn-843-1997-t2.imp +43 -0
  172. data/maps/iso-guj-Gujr-Latn-15919-2001.imp +214 -0
  173. data/maps/iso-hin-Deva-Latn-15919-2001.imp +73 -0
  174. data/maps/iso-inc-Deva-Latn-15919-2001.imp +61 -0
  175. data/maps/iso-jpn-Hrkt-Latn-3602-1989.imp +59 -0
  176. data/maps/iso-kan-Kana-Latn-15919-2001.imp +212 -0
  177. data/maps/iso-kat-Geor-Latn-9984-1996.imp +103 -0
  178. data/maps/iso-kor-Hang-Latn-1996-method1.imp +140 -0
  179. data/maps/iso-kor-Hang-Latn-1996-method2.imp +132 -0
  180. data/maps/iso-mal-Mlym-Latn-15919-2001.imp +276 -0
  181. data/maps/iso-mar-Deva-Latn-15919-2001.imp +68 -0
  182. data/maps/iso-nep-Deva-Latn-15919-2001.imp +75 -0
  183. data/maps/iso-ori-Orya-Latn-15919-2001.imp +188 -0
  184. data/maps/iso-pan-Guru-Latn-15919-2001.imp +217 -0
  185. data/maps/iso-pli-Beng-Latn-15919-2001.imp +66 -0
  186. data/maps/iso-pli-Deva-Latn-15919-2001.imp +68 -0
  187. data/maps/iso-pli-Sinh-Latn-15919-2001.imp +211 -0
  188. data/maps/iso-pli-Thai-Latn-15919-2001.imp +47 -0
  189. data/maps/iso-pra-Deva-Latn-15919-2001.imp +60 -0
  190. data/maps/iso-prs-Arab-Latn-233-3-1999.imp +352 -0
  191. data/maps/iso-rus-Cyrl-Latn-9-1995.imp +279 -0
  192. data/maps/iso-san-Deva-Latn-15919-2001.imp +215 -0
  193. data/maps/iso-tam-Taml-Latn-15919-2001.imp +153 -0
  194. data/maps/iso-tel-Telu-Latn-15919-2001.imp +214 -0
  195. data/maps/iso-tha-Thai-Latn-11940-1998.imp +114 -0
  196. data/maps/kp-kor-Hang-Latn-2002.imp +540 -0
  197. data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +29005 -0
  198. data/maps/masm-mon-Cyrl-Latn-5217-2012.imp +136 -0
  199. data/maps/masm-mon-Latn-Cyrl-5217-2012.imp +162 -0
  200. data/maps/mext-jpn-Hrkt-Latn-1954.imp +403 -0
  201. data/maps/moct-kor-Hang-Latn-2000.imp +475 -0
  202. data/maps/mofa-jpn-Hrkt-Latn-1989.imp +484 -0
  203. data/maps/mv-div-Thaa-Latn-1987.imp +144 -0
  204. data/maps/mvd-bel-Cyrl-Latn-2008.imp +224 -0
  205. data/maps/mvd-bel-Cyrl-Latn-2010.imp +64 -0
  206. data/maps/mvd-rus-Cyrl-Latn-2008.imp +110 -0
  207. data/maps/mvd-rus-Cyrl-Latn-2010.imp +40 -0
  208. data/maps/odni-ara-Arab-Latn-2004.imp +106 -0
  209. data/maps/odni-ara-Arab-Latn-2015.imp +281 -0
  210. data/maps/odni-aze-Cyrl-Latn-2015.imp +158 -0
  211. data/maps/odni-bel-Cyrl-Latn-2015.imp +138 -0
  212. data/maps/odni-bul-Cyrl-Latn-2005.imp +90 -0
  213. data/maps/odni-bul-Cyrl-Latn-2015.imp +103 -0
  214. data/maps/odni-che-Cyrl-Latn-2015.imp +165 -0
  215. data/maps/odni-fas-Arab-Latn-2004.imp +268 -0
  216. data/maps/odni-fas-Arab-Latn-2015.imp +398 -0
  217. data/maps/odni-hin-Deva-Latn-2004.imp +180 -0
  218. data/maps/odni-hin-Deva-Latn-2015.imp +256 -0
  219. data/maps/odni-kat-Geor-Latn-2015.imp +76 -0
  220. data/maps/odni-kaz-Cyrl-Latn-2015.imp +164 -0
  221. data/maps/odni-kir-Cyrl-Latn-2015.imp +149 -0
  222. data/maps/odni-kor-Hang-Latn-2015.imp +307 -0
  223. data/maps/odni-mkd-Cyrl-Latn-2005.imp +28 -0
  224. data/maps/odni-mkd-Cyrl-Latn-2015.imp +124 -0
  225. data/maps/odni-prs-Arab-Latn-2004.imp +120 -0
  226. data/maps/odni-prs-Arab-Latn-2015.imp +225 -0
  227. data/maps/odni-pus-Arab-Latn-2011.imp +327 -0
  228. data/maps/odni-rus-Cyrl-Latn-2015.imp +79 -0
  229. data/maps/odni-srp-Cyrl-Latn-2005.imp +35 -0
  230. data/maps/odni-srp-Cyrl-Latn-2015.imp +130 -0
  231. data/maps/odni-tat-Cyrl-Latn-2015.imp +157 -0
  232. data/maps/odni-tgk-Cyrl-Latn-2015.imp +161 -0
  233. data/maps/odni-tuk-Cyrl-Latn-2015.imp +159 -0
  234. data/maps/odni-uig-Cyrl-Latn-2015.imp +151 -0
  235. data/maps/odni-ukr-Cyrl-Latn-2015.imp +136 -0
  236. data/maps/odni-urd-Arab-Latn-2015.imp +220 -0
  237. data/maps/odni-uzb-Cyrl-Latn-2015.imp +165 -0
  238. data/maps/sac-zho-Hans-Latn-1979.imp +20940 -0
  239. data/maps/sasm-mon-Mong-Latn-general-1978.imp +294 -0
  240. data/maps/sasm-mon-Mong-Latn-phonetic-1978.imp +261 -0
  241. data/maps/ses-ara-Arab-Latn-1930.imp +225 -0
  242. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.imp +171 -0
  243. data/maps/ua-ukr-Cyrl-Latn-1996.imp +149 -0
  244. data/maps/ua-ukr-Cyrl-Latn-2007.imp +69 -0
  245. data/maps/ua-ukr-Cyrl-Latn-2010.imp +128 -0
  246. data/maps/un-amh-Ethi-Latn-2016.imp +483 -0
  247. data/maps/un-ara-Arab-Latn-1971.imp +137 -0
  248. data/maps/un-ara-Arab-Latn-1972.imp +155 -0
  249. data/maps/un-ara-Arab-Latn-2017.imp +375 -0
  250. data/maps/un-asm-Beng-Latn-1972.imp +188 -0
  251. data/maps/un-bel-Cyrl-Latn-2007.imp +78 -0
  252. data/maps/un-ben-Beng-Latn-2016.imp +516 -0
  253. data/maps/un-ell-Grek-Latn-1987-phonetic.imp +437 -0
  254. data/maps/un-ell-Grek-Latn-1987-tl.imp +27 -0
  255. data/maps/un-ell-Grek-Latn-1987-ts.imp +269 -0
  256. data/maps/un-guj-Gujr-Latn-1972.imp +196 -0
  257. data/maps/un-hin-Deva-Latn-2016.imp +356 -0
  258. data/maps/un-kan-Kana-Latn-2016.imp +214 -0
  259. data/maps/un-mal-Mlym-Latn-1972.imp +215 -0
  260. data/maps/un-mar-Deva-Latn-2016.imp +96 -0
  261. data/maps/un-mon-Mong-Latn-general-2013.imp +170 -0
  262. data/maps/un-mon-Mong-Latn-phonetic-2013.imp +170 -0
  263. data/maps/un-nep-Deva-Latn-1972.imp +295 -0
  264. data/maps/un-nep-Deva-Latn-2013.imp +62 -0
  265. data/maps/un-ori-Orya-Latn-1972.imp +208 -0
  266. data/maps/un-pan-Guru-Latn-1972.imp +321 -0
  267. data/maps/un-prs-Arab-Latn-1967.imp +214 -0
  268. data/maps/un-rus-Cyrl-Latn-1987.imp +96 -0
  269. data/maps/un-sin-Sinh-Latn-1972.imp +193 -0
  270. data/maps/un-tam-Taml-Latn-1972.imp +173 -0
  271. data/maps/un-tel-Telu-Latn-1972.imp +229 -0
  272. data/maps/un-ukr-Cyrl-Latn-1998.imp +58 -0
  273. data/maps/un-ukr-Cyrl-Latn-2012.imp +95 -0
  274. data/maps/un-urd-Arab-Latn-1972.imp +290 -0
  275. data/maps/var-amh-Ethi-Latn-eae-2003.imp +414 -0
  276. data/maps/var-gez-Ethi-Latn-eae-2003.imp +54 -0
  277. data/maps/var-hin-Deva-Latn-hunterian-1872.imp +212 -0
  278. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.imp +399 -0
  279. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.imp +382 -0
  280. data/maps/var-kor-Hang-Hang-jamo.imp +11196 -0
  281. data/maps/var-kor-Hang-Latn-mr-1939.imp +574 -0
  282. data/maps/var-kor-Kore-Hang-2013.imp +59764 -0
  283. data/maps/var-kor-Kore-Latn-mr-1939.imp +36 -0
  284. data/maps/var-mar-Deva-Latn-hunterian-1872.imp +39 -0
  285. data/maps/var-mon-Mong-Latn-1930.imp +101 -0
  286. data/maps/var-mon-Mong-Latn-lessing.imp +181 -0
  287. data/maps/var-mon-Mong-Latn-vpmc.imp +182 -0
  288. data/maps/var-pra-Deva-Latn-iast-1912.imp +36 -0
  289. data/maps/var-san-Deva-Latn-iast-1912.imp +147 -0
  290. data/maps/var-zho-Hani-Latn-wd-1979.imp +27549 -0
  291. metadata +335 -0
@@ -0,0 +1,101 @@
1
+ metadata {
2
+ authority_id: alalc
3
+ id: 1997
4
+ language: iso-639-2:aze
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: ALA-LC Romanization Table -- Azerbaijani (1997)
8
+ url: https://transliteration.eki.ee/pdf/Azerbaijani.pdf
9
+ creation_date: 1997
10
+ description: |
11
+ ALA-LC Romanization Tables: Transliteration Schemes for Non-Roman Scripts. Randal K. Berry (ed.). Library of Congress, 1997.
12
+
13
+ notes:
14
+ - "Ј ј replaced Й й in 1959 (Roman: y; ISO 9: j; ALA-LC: ĭ)."
15
+ }
16
+
17
+ tests {
18
+ # from internet
19
+ test "Азәрбајҹан дили", "Azărbaı̐jan dili"
20
+ test "Бүтүн инсанлар ләјагәт вә һүгугларына ҝөрә азад вә бәрабәр доғулурлар.\nОнларын шүурлары вә виҹданлары вар вә бир-бирләринә мүнасибәтдә гардашлыг руһунда давранмалыдырлар.", "Bu̇tu̇n insanlar lăı̐agăt vă ḣu̇guglaryna ġȯră azad vă bărabăr doghulurlar.\nOnlaryn shu̇urlary vă vijdanlary var vă bir-birlărină mu̇nasibătdă gardashlyg ruḣunda davranmalydyrlar."
21
+ test "Азәрбајҹан! Азәрбајҹан!\nЕј гәһрәман өвладын шанлы Вәтәни!\nСәндән өтрү ҹан вермәјә ҹүмлә һазырыз!\nСәндән өтрү ган төкмәјә ҹүмлә гадириз!\nҮчрәнҝли бајрағынла мәсуд јаша!\nҮчрәнҝли бајрағынла мәсуд јаша!\nМинләрлә ҹан гурбан олду,\nСинән һәрбә мејдан олду!\nҺүгугундан кечән әсҝәр,\nҺәрә бир гәһрәман олду!\nСән оласан ҝүлүстан,\nСәнә һәр ан ҹан гурбан!\nСәнә мин бир мәһәббәт\nСинәмдә тутмуш мәкан!\nНамусуну һифз етмәјә,\nБајрағыны јүксәлтмәјә\nНамусуну һифз етмәјә,\nҸүмлә ҝәнҹләр мүштагдыр!\nШанлы Вәтән! Шанлы Вәтән!\nАзәрбајҹан! Азәрбајҹан!\nАзәрбајҹан! Азәрбајҹан!", "Azărbaı̐jan! Azărbaı̐jan!\nEı̐ găḣrăman ȯvladyn shanly Vătăni!\nSăndăn ȯtru̇ jan vermăı̐ă ju̇mlă ḣazyryz!\nSăndăn ȯtru̇ gan tȯkmăı̐ă ju̇mlă gadiriz!\nU̇chrănġli baı̐raghynla măsud ı̐asha!\nU̇chrănġli baı̐raghynla măsud ı̐asha!\nMinlărlă jan gurban oldu,\nSinăn ḣărbă meı̐dan oldu!\nḢu̇gugundan kechăn ăsġăr,\nḢără bir găḣrăman oldu!\nSăn olasan ġu̇lu̇stan,\nSănă ḣăr an jan gurban!\nSănă min bir măḣăbbăt\nSinămdă tutmush măkan!\nNamusunu ḣifz etmăı̐ă,\nBaı̐raghyny ı̐u̇ksăltmăı̐ă\nNamusunu ḣifz etmăı̐ă,\nJu̇mlă ġănjlăr mu̇shtagdyr!\nShanly Vătăn! Shanly Vătăn!\nAzărbaı̐jan! Azărbaı̐jan!\nAzărbaı̐jan! Azărbaı̐jan!"
22
+ }
23
+
24
+ stage {
25
+
26
+ # CHARACTERS
27
+ parallel {
28
+ sub "\u0410", "A" # А
29
+ sub "\u0411", "B" # Б
30
+ sub "\u0412", "V" # В
31
+ sub "\u0413", "G" # Г
32
+ sub "\u0492", "Gh" # Ғ
33
+ sub "\u0414", "D" # Д
34
+ sub "\u0415", "E" # Е
35
+ sub "\u04D8", "Ă" # Ә
36
+ sub "\u0416", "Zh" # Ж
37
+ sub "\u0417", "Z" # З
38
+ sub "\u0418", "I" # И
39
+ sub "\u042B", "Y" # Ы
40
+ sub "\u0408", "I̐" # Ј
41
+ sub "\u0419", "Y" # Й note[1]
42
+ sub "\u0419", "Y" # Й (same source and target as the preceding "\u0419" rule in this parallel block)
43
+ sub "\u041A", "K" # К
44
+ sub "\u049C", "Ġ" # Ҝ
45
+ sub "\u041B", "L" # Л
46
+ sub "\u041C", "M" # М
47
+ sub "\u041D", "N" # Н
48
+ sub "\u041E", "O" # О
49
+ sub "\u04E8", "Ȯ" # Ө
50
+ sub "\u041F", "P" # П
51
+ sub "\u0420", "R" # Р
52
+ sub "\u0421", "S" # С
53
+ sub "\u0422", "T" # Т
54
+ sub "\u0423", "U" # У
55
+ sub "\u04AE", "U̇" # Ү
56
+ sub "\u0424", "F" # Ф
57
+ sub "\u0425", "Kh" # Х
58
+ sub "\u04BA", "Ḣ" # Һ
59
+ sub "\u0427", "Ch" # Ч
60
+ sub "\u04B8", "J" # Ҹ
61
+ sub "\u0428", "Sh" # Ш
62
+
63
+ sub "\u0430", "a" # а
64
+ sub "\u0431", "b" # б
65
+ sub "\u0432", "v" # в
66
+ sub "\u0433", "g" # г
67
+ sub "\u0493", "gh" # ғ
68
+ sub "\u0434", "d" # д
69
+ sub "\u0435", "e" # e
70
+ sub "\u04D9", "ă" # ә
71
+ sub "\u0436", "zh" # ж
72
+ sub "\u0437", "z" # з
73
+ sub "\u0438", "i" # и
74
+ sub "\u044B", "y" # ы
75
+ sub "\u0458", "ı̐" # ј
76
+ sub "\u0439", "y" # й note[1]
77
+ sub "\u043A", "k" # к
78
+ sub "\u049D", "ġ" # ҝ
79
+ sub "\u043B", "l" # л
80
+ sub "\u043C", "m" # м
81
+ sub "\u043D", "n" # н
82
+ sub "\u043E", "o" # о
83
+ sub "\u04E9", "ȯ" # ө
84
+ sub "\u043F", "p" # п
85
+ sub "\u0440", "r" # р
86
+ sub "\u0441", "s" # с
87
+ sub "\u0442", "t" # т
88
+ sub "\u0443", "u" # у
89
+ sub "\u04AF", "u̇" # ү
90
+ sub "\u0444", "f" # ф
91
+ sub "\u0445", "kh" # х
92
+ sub "\u04BB", "ḣ" # һ
93
+ sub "\u0447", "ch" # ч
94
+ sub "\u04B9", "j" # ҹ
95
+ sub "\u0448", "sh" # ш
96
+
97
+ sub "\u2019", "\u2019"
98
+ }
99
+
100
+ compose
101
+ }
@@ -0,0 +1,118 @@
1
+ metadata {
2
+ authority_id: alalc
3
+ id: 1997
4
+ language: iso-639-2:bel
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: ALA-LC Romanization Table -- Byelorussian (1997)
8
+ url: http://catdir.loc.gov/catdir/cpso/romanization/beloruss.pdf
9
+ creation_date: 1997
10
+
11
+ notes:
12
+ - Ґ letter found in Old Belarusian and in modern publications in Tarashkevitsa orthography.
13
+ - Do not confuse with the digraph кг (also romanized as “kh”). Manual review may be needed when transcribing data in vernacular characters in order to distinguish х from кг.
14
+ - The apostrophe (´) is not transliterated.
15
+ - Soft sign (prime) is USMARC hexadecimal code A7 ~ U+02B9 Unicode character
16
+ }
17
+
18
+ tests {
19
+ # https://en.wikipedia.org/wiki/Romanization_of_Belarusian#Examples
20
+ # https://img.tyt.by/n/02/d/belorusskiy_translit.jpg - with issues
21
+ test "Беларусь", "Belarusʹ"
22
+ test "Магілёў", "Mahili͡oŭ"
23
+ test "Лукашэнка", "Lukashėnka"
24
+ test "сям´я", "si͡ami͡a"
25
+ test "Уручча", "Uruchcha"
26
+ test "Барысаўскі тракт", "Barysaŭski trakt"
27
+ test "Усход", "Uskhod"
28
+ test "Маскоўская", "Maskoŭskai͡a"
29
+ test "Парк Чалюскінцаў", "Park Chali͡uskintsaŭ"
30
+ test "Акадэмія навук", "Akadėmii͡a navuk"
31
+ test "Плошча Якуба Коласа", "Ploshcha I͡Akuba Kolasa"
32
+ test "Плошча Перамогі", "Ploshcha Peramohi"
33
+ test "Кастрычніцкая", "Kastrychnitskai͡a"
34
+ test "Плошча Леніна", "Ploshcha Lenina"
35
+ test "Інстытут Культуры", "Instytut Kulʹtury"
36
+ }
37
+
38
+ stage {
39
+
40
+ # CHARACTERS
41
+ parallel {
42
+ # Apostrophes
43
+ sub "\u00B4", "" # official english Apostrophe
44
+ sub "\u02BC", ""
45
+ sub "\u0027", "" # from belarussian keyboard
46
+
47
+ # Characters
48
+ sub "\u0410", "A" # A
49
+ sub "\u0411", "B" # Б
50
+ sub "\u0412", "V" # B
51
+ sub "\u0413", "H" # Г
52
+ sub "\u0490", "G" # Ґ
53
+ sub "\u0414", "D" # Д
54
+ sub "\u0415", "E" # Е
55
+ sub "\u0401", "I͡O" # Ё : I͡O
56
+ sub "\u0416", "Z͡H" # Ж : Z͡H
57
+ sub "\u0417", "Z" # З
58
+ sub "\u0406", "I" # І
59
+ sub "\u0419", "Ĭ" # Й : Ĭ
60
+ sub "\u041A", "K" # К
61
+ sub "\u041B", "L" # Л
62
+ sub "\u041C", "M" # М
63
+ sub "\u041D", "N" # Н
64
+ sub "\u041E", "O" # О
65
+ sub "\u041F", "P" # П
66
+ sub "\u0420", "R" # Р
67
+ sub "\u0421", "S" # С
68
+ sub "\u0422", "T" # Т
69
+ sub "\u0423", "U" # У
70
+ sub "\u040E", "Ŭ" # Ў : Ŭ (code-point escape, same form as the lowercase "\u045E" rule)
71
+ sub "\u0424", "F" # Ф
72
+ sub "\u0425", "Kh" # Х
73
+ sub "\u0426", "Ts" # Ц
74
+ sub "\u0427", "Ch" # Ч
75
+ sub "\u0428", "Sh" # Ш
76
+ sub "\u042B", "Y" # Ы
77
+ sub "\u042C", "ʹ" # Ь : ʹ
78
+ sub "\u042D", "Ė" # Э : Ė
79
+ sub "\u042E", "I͡U" # Ю : I͡U
80
+ sub "\u042F", "I͡A" # Я : I͡A
81
+
82
+ sub "\u0430", "a" # а
83
+ sub "\u0431", "b" # б
84
+ sub "\u0432", "v" # в
85
+ sub "\u0433", "h" # г
86
+ sub "\u0491", "g" # ґ
87
+ sub "\u0434", "d" # д
88
+ sub "\u0435", "e" # е
89
+ sub "\u0451", "i͡o" # ё : i͡o
90
+ sub "\u0436", "z͡h" # ж : z͡h
91
+ sub "\u0437", "z" # з
92
+ sub "\u0456", "i" # і
93
+ sub "\u0439", "ĭ" # й : ĭ
94
+ sub "\u043A", "k" # к
95
+ sub "\u043B", "l" # л
96
+ sub "\u043C", "m" # м
97
+ sub "\u043D", "n" # н
98
+ sub "\u043E", "o" # о
99
+ sub "\u043F", "p" # п
100
+ sub "\u0440", "r" # р
101
+ sub "\u0441", "s" # с
102
+ sub "\u0442", "t" # т
103
+ sub "\u0443", "u" # у
104
+ sub "\u045E", "ŭ" # ў : ŭ
105
+ sub "\u0444", "f" # ф
106
+ sub "\u0445", "kh" # х
107
+ sub "\u0446", "ts" # ц
108
+ sub "\u0447", "ch" # ч
109
+ sub "\u0448", "sh" # ш
110
+ sub "\u044B", "y" # ы
111
+ sub "\u044C", "ʹ" # ь : ʹ
112
+ sub "\u044D", "ė" # э : ė
113
+ sub "\u044E", "i͡u" # ю : i͡u
114
+ sub "\u044F", "i͡a" # я : i͡a
115
+ }
116
+
117
+ }
118
+
@@ -0,0 +1,225 @@
1
+ metadata {
2
+ authority_id: alalc
3
+ id: 1997
4
+ language: iso-639-2:ben
5
+ source_script: Beng
6
+ destination_script: Latn
7
+ name: Bengali Romanization, 1997
8
+ url: http://catdir.loc.gov/catdir/cpso/romanization/bengali.pdf
9
+ creation_date: 1997
10
+ description: |
11
+ ALA-LC Romanization table for Bengali
12
+
13
+ notes:
14
+
15
+ - Only the vowel forms that appear at the beginning of a syllable are
16
+ listed; the forms used for vowels following a consonant can be found in
17
+ grammars; no distinction between the two is made in transliteration.
18
+
19
+ - |
20
+ The vowel a is implicit after all consonants and consonant clusters
21
+ and is supplied in transliteration, with the following exceptions:
22
+
23
+ a) when another vowel is indicated by its appropriate sign; and
24
+ b) when the absence of any vowel is indicated by the subscript symbol ( ্ )
25
+ called hasanta or birāma.
26
+
27
+ - ব is used both as a labial and as a semivowel. When it occurs as the
28
+ second or subsequent consonant of a consonant cluster, it is
29
+ transliterated va. When ব is doubled, it is transliterated bba.
30
+
31
+ - Candrabindu before guttural, palatal, cerebral, and dental occlusives
32
+ is transliterated n̐. Before labials, sibilants, semivowels, the
33
+ aspirate, vowels, and in final position it is transliterated m̐.
34
+
35
+ - When doubled, abagraha is transliterated by two apostrophes ( ’’ ).
36
+ }
37
+
38
+ tests {
39
+ test "আমার সোনার বাংলা, আমি তোমায় ভালোবাসি।\nচিরদিন তোমার আকাশ, তোমার বাতাস, আমার প্রাণে বাজায় বাঁশি॥\nও মা, ফাগুনে তোর আমের বনে ঘ্রাণে পাগল করে, মরি হায়, হায় রে—\nও মা, অঘ্রাণে তোর ভরা ক্ষেতে আমি কী দেখেছি মধুর হাসি॥\n\nকী শোভা, কী ছায়া গো, কী স্নেহ, কী মায়া গো—\nকী আঁচল বিছায়েছ বটের মূলে, নদীর কূলে কূলে।\nমা, তোর মুখের বাণী আমার কানে লাগে সুধার মতো,\nমরি হায়, হায় রে—\nমা, তোর বদনখানি মলিন হলে, ও মা, আমি নয়নজলে ভাসি॥", "āmāra sonāra bāṃlā, āmi tomāẏa bhālobāsi।\nciradina tomāra ākāśa, tomāra bātāsa, āmāra prāṇe bājāẏa bān̐śi॥\no mā, phāgune tora āmera bane ghrāṇe pāgala kare, mari hāẏa, hāẏa re—\no mā, aghrāṇe tora bharā kshete āmi kī dekhechi madhura hāsi॥\n\nkī śobhā, kī chāyaṛā go, kī sneha, kī māyaṛā go—\nkī ām̐cala bichāyaṛecha baṭera mūle, nadīra kūle kūle।\nmā, tora mukhera bāṇī āmāra kāne lāge sudhāra mato,\nmari hāẏa, hāẏa re—\nmā, tora badanakhāni malina hale, o mā, āmi naẏanajale bhāsi॥"
40
+ test "ট্রাম্প-বাইডেন মহারণ: জয় দাবি দুজনেরই", "ṭrāmpa-bāiḍena mahāraṇa: jaẏa dābi dujanerai"
41
+ test "রিপাবলিকান গভর্নর ডগ ডসি বলেছেন, ফলাফল নিয়ে এখনই কথা বলার সময় আসেনি।", "ripābalikāna gabharnara ḍaga ḍasi balechena, phalāphala niẏe ekhanai kathā balāra samaẏa āseni।"
42
+ test "অনেক আগে থেকেই ট্রাম্প ফ্লোরিডায় জিতে গেছেন বলে গণমাধ্যমগুলোতে তুলে ধরা হচ্ছে", "aneka āge thekei ṭrāmpa phloriḍāẏa jite gechena bale gaṇamādhyamagulote tule dharā hacche"
43
+ test "করোনায় আরও ২১ মৃত্যু, নতুন শনাক্ত ১৫১৭", "karonāẏa ārao 21 mṛtyu, natuna śanākta 1517"
44
+ test "শালিক পাখিকে পোষ মানানোর মতো কঠিন কাজ করা কিশোর রোহানের বাড়ি কুষ্টিয়া শহরের পিটিআই সড়কে।", "śālika pākhike posha mānānora mato kaṭhina kāja karā kiśora rohānera bāṛi kushṭiẏā śaharera piṭiāi saṛake।"
45
+ test "সুইং স্টেটের সর্বশেষ অবস্থা দেখে মনে হচ্ছে, দুজনের ভাগ্য দুলছে পেন্ডুলামে।", "suiṃ sṭeṭera sarbaśesha abasthā dekhe mane hacche, dujanera bhāgya dulache penḍulāme।"
46
+ test "২০১৬ সালের নির্বাচনে বহিরাগত হিসেবেই ডোনাল্ড ট্রাম্পের রাজনীতিতে আগমন", "2016 sālera nirbācane bahirāgata hisebei ḍonālḍa ṭrāmpera rājanītite āgamana"
47
+ test "কই সঙ্গে রাজনীতির পাদপ্রদীপ থেকে সম্পূর্ণ বাইরে থাকা তাঁর পরিবারও চলে আসে রাজনীতির আলোচনায়", "kai saṅge rājanītira pādapradīpa theke sampūrṇa bāire thākā tān̐ra paribārao cale āse rājanītira ālocanāẏa"
48
+ test "নির্বাচনী প্রচারের সময় প্রেসিডেন্ট ডোনাল্ড ট্রাম্পের পরিবারের সদস্যরা মাঠে নেমেছেন", "nirbācanī pracārera samaẏa presiḍenṭa ḍonālḍa ṭrāmpera paribārera sadasyarā māṭhe nemechena"
49
+ test "তাঁরা সমর্থকদের উদ্দেশ্যে বলেছেন, এ নির্বাচন শুধু প্রেসিডেন্ট ডোনাল্ড ট্রাম্পের প্রতি নয়", "tān̐rā samarthakadera uddeśye balechena, e nirbācana śudhu presiḍenṭa ḍonālḍa ṭrāmpera prati naẏa"
50
+ test "স্মার্টফোন কিনতে ৮ হাজার করে ঋণ পাবেন ৪১৫০১ শিক্ষার্থী", "smārṭaphona kinate 8 hājāra kare ṛṇa pābena 41501 śikshārthī"
51
+ test "বার্সা সমর্থকদের নিয়ে উদ্‌যাপনের কথা গিলতে হলো ভিদালকে", "bārsā samarthakadera niẏe ud‌yāpanera kathā gilate halo bhidālake"
52
+ test "য়ে", "yaṛe"
53
+ }
54
+
55
+ aliases {
56
+ # A different name for this alias can be more fitting...
57
+ def_alias ben_special, any("\u09be\u09bf\u09c0\u09c1\u09c2\u09c3\u09c7\u09c8\u09cb\u09cc\u09cd")
58
+ }
59
+
60
+ stage {
61
+ # RULES
62
+ #rule II
63
+ sub "ক", "k", after: ben_special
64
+ sub "খ", "kh", after: ben_special
65
+ sub "গ", "g", after: ben_special
66
+ sub "ঘ", "gh", after: ben_special
67
+ sub "ঙ", "ṅ", after: ben_special
68
+ sub "চ", "c", after: ben_special
69
+ sub "ছ", "ch", after: ben_special
70
+ sub "জ", "j", after: ben_special
71
+ sub "ঝ", "jh", after: ben_special
72
+ sub "ঞ", "ñ", after: ben_special
73
+ sub "ট", "ṭ", after: ben_special
74
+ sub "ঠ", "ṭh", after: ben_special
75
+ sub "ড", "ḍ", after: ben_special
76
+ sub "ড়", "ṛ", after: ben_special
77
+ sub any("ড়"), "ṛ", after: ben_special # 2 combining characters, why we need any()? - weird
78
+ sub "ঢ", "ḍh", after: ben_special
79
+ sub "ঢ়", "ṛh", after: ben_special # 2 combining characters, was any()
80
+ sub "ণ", "ṇ", after: ben_special
81
+ sub "ত", "t", after: ben_special
82
+ sub "ৎ", "ṯ", after: ben_special
83
+ sub "থ", "th", after: ben_special
84
+ sub "দ", "d", after: ben_special
85
+ sub "ধ", "dh", after: ben_special
86
+ sub "ন", "n", after: ben_special
87
+ sub "প", "p", after: ben_special
88
+ sub "ফ", "ph", after: ben_special
89
+ sub "ব", "b", after: ben_special
90
+ sub "ভ", "bh", after: ben_special
91
+ sub "ম", "m", after: ben_special
92
+ sub "য", "y", after: ben_special
93
+ sub "য়", "ẏ", after: ben_special # 2 combining characters
94
+ sub "য়", "ẏ", after: ben_special # But this was any() in the previous version
95
+ sub "র", "r", after: ben_special
96
+ sub "ল", "l", after: ben_special
97
+ sub "শ", "ś", after: ben_special
98
+ sub "ষ", "sh", after: ben_special
99
+ sub "স", "s", after: ben_special
100
+ sub "হ", "h", after: ben_special
101
+
102
+ # Rule III
103
+ sub "ବ", "bba", after: "\u09AC" # NOTE(review): the pattern glyph looks like Oriya BA (U+0B2C) rather than Bengali ব (U+09AC); if so this rule never matches Bengali input -- confirm before changing
104
+ # Rule V
105
+ sub "\u0981", "m̐", after: any("কখগঘঙচছজঝঞটঠডডঢঢণতৎথদধন")
106
+ sub "\u0981", "m̐", after: boundary # Bengali candrabindu (U+0981) in final position -> m̐ (Note 4); was "\u0b01", an Oriya-block code point
107
+
108
+
109
+ # CHARACTERS
110
+ parallel {
111
+
112
+ # Vowels and Diphthongs
113
+
114
+ sub "অ", "a"
115
+ sub "আ", "ā"
116
+ sub "ই", "i"
117
+ sub "ঈ", "ī"
118
+ sub "উ", "u"
119
+ sub "ঊ", "ū"
120
+ sub "এ", "e"
121
+ sub "ঐ", "ai"
122
+ sub "ও", "o"
123
+ sub "ঔ", "au"
124
+ sub "ঋ", "ṛ"
125
+ sub "ৠ", "ṝ"
126
+ sub "ঌ", "ḹ"
127
+
128
+ # Consonants
129
+ # Gutturals
130
+ sub "ক", "ka"
131
+ sub "খ", "kha"
132
+ sub "গ", "ga"
133
+ sub "ঘ", "gha"
134
+ sub "ঙ", "ṅa"
135
+
136
+ # Palatals
137
+ sub "চ", "ca"
138
+ sub "ছ", "cha"
139
+ sub "জ", "ja"
140
+ sub "ঝ", "jha"
141
+ sub "ঞ", "ña"
142
+
143
+ # Cerebrals
144
+ sub "ট", "ṭa"
145
+ sub "ঠ", "ṭha"
146
+ sub "ড", "ḍa"
147
+ sub "ড়", "ṛa"
148
+ sub "ড়", "ṛa"
149
+ sub "ঢ", "ḍha"
150
+ sub "ঢ়", "ṛha"
151
+ sub "ণ", "ṇa"
152
+
153
+ # Dentals
154
+ sub "ত", "ta"
155
+ sub "ৎ", "ṯa"
156
+ sub "থ", "tha"
157
+ sub "দ", "da"
158
+ sub "ধ", "dha"
159
+ sub "ন", "na"
160
+
161
+ # Labials
162
+ sub "প", "pa"
163
+ sub "ফ", "pha"
164
+ sub "ব", "ba" # see Note 3
165
+ sub "ভ", "bha"
166
+ sub "ম", "ma"
167
+
168
+ # Semivowels
169
+ sub "য", "ya"
170
+ sub "য়", "ẏa"
171
+ sub "য়", "ẏa"
172
+ sub "র", "ra"
173
+ sub "ল", "la"
174
+
175
+ # Sibilants
176
+ sub "শ", "śa"
177
+ sub "ষ", "sha"
178
+ sub "স", "sa"
179
+
180
+ # Aspirate
181
+ sub "হ", "ha"
182
+
183
+ # Anusvāra
184
+ sub "ং", "ṃ"
185
+
186
+ # Bisarga
187
+ sub "ঃ", "ḥ"
188
+
189
+ # Candrabindu (anunāsika)
190
+ sub "\u0981", "n̐"
191
+
192
+ # Abagraha (see Note 5)
193
+ sub "\u09BD", "’" # ঽ Bengali abagraha (U+09BD) -> apostrophe; was the Devanagari sign U+093D
194
+
195
+
196
+ # Medials # Needed for connecting consonants
197
+
198
+ sub "\u09be", "ā"
199
+ sub "\u09bf", "i"
200
+ sub "\u09c0", "ī"
201
+ sub "\u09c1", "u"
202
+ sub "\u09c2", "ū"
203
+ sub "\u09c3", "ṛ"
204
+ sub "\u09c7", "e"
205
+ sub "\u09c8", "ai"
206
+ sub "\u09cb", "o"
207
+ sub "\u09cc", "au"
208
+ sub "\u09cd", ""
209
+
210
+ #Numbers
211
+
212
+ sub "০", "0"
213
+ sub "১", "1"
214
+ sub "২", "2"
215
+ sub "৩", "3"
216
+ sub "৪", "4"
217
+ sub "৫", "5"
218
+ sub "৬", "6"
219
+ sub "৭", "7"
220
+ sub "৮", "8"
221
+ sub "৯", "9"
222
+ }
223
+
224
+ compose
225
+ }
@@ -0,0 +1,135 @@
1
+ metadata {
2
+ authority_id: alalc
3
+ id: 2017
4
+ language: iso-639-2:ben
5
+ source_script: Beng
6
+ destination_script: Latn
7
+ name: Bengali Romanization, 2017
8
+ url: https://www.loc.gov/catdir/cpso/romanization/bengali.pdf
9
+ creation_date: 2017
10
+ description: |
11
+ ALA-LC Romanization table for Bengali
12
+
13
+ notes:
14
+
15
+ - Only the vowel forms that appear at the beginning of a syllable are
16
+ listed; the forms used for vowels following a consonant can be found in
17
+ grammars; no distinction between the two is made in transliteration.
18
+
19
+ - |
20
+ The vowel a is implicit after all consonants and consonant clusters
21
+ and is supplied in transliteration, with the following exceptions:
22
+
23
+ a) when another vowel is indicated by its appropriate sign; and
24
+ b) when the absence of any vowel is indicated by the subscript symbol ( ্ )
25
+ called hasanta or birāma.
26
+
27
+ - ব is used both as a labial and as a semivowel. When it occurs as the
28
+ second or subsequent consonant of a consonant cluster, it is
29
+ transliterated va. When ব is doubled, it is transliterated bba.
30
+
31
+ - Candrabindu before guttural, palatal, cerebral, and dental occlusives
32
+ is transliterated n̐. Before labials, sibilants, semivowels, the
33
+ aspirate, vowels, and in final position it is transliterated m̐.
34
+
35
+ - When doubled, abagraha is transliterated by two apostrophes ( ’’ ).
36
+ }
37
+
38
+ tests {
39
+ test "র্ক", "rka"
40
+ test "গ্র", "gra"
41
+ test "ত্য", "tya"
42
+ }
43
+
44
+ dependency "un-ben-Beng-Latn-2016", as: benglatn
45
+
46
+
47
+ stage {
48
+ run map.benglatn.stage.main
49
+
50
+ # CHARACTERS
51
+ parallel {
52
+
53
+ # I. Vowels and Diphthongs (see Note 1)
54
+
55
+ sub "অ", "a"
56
+ sub "ৠ", "ṝ"
57
+ sub "আ", "ā"
58
+ sub "ঌ", "ḹ"
59
+ sub "ই", "i" # short i is lowercase, like every other vowel in this table
60
+ sub "এ", "e"
61
+ sub "ঈ", "ī"
62
+ sub "ঐ", "ai"
63
+ sub "উ", "u"
64
+ sub "ও", "o"
65
+ sub "ঊ", "ū"
66
+ sub "ঔ", "au"
67
+ sub "ঋ", "ṛ"
68
+
69
+ # II. Consonants (see Note 2)
70
+ # Gutturals
71
+ sub "ক", "ka"
72
+ sub "খ", "kha"
73
+ sub "গ", "ga"
74
+ sub "ঘ", "gha"
75
+ sub "ঙ", "ṅa"
76
+
77
+ # Palatals
78
+ sub "চ", "ca"
79
+ sub "ছ", "cha"
80
+ sub "জ", "ja"
81
+ sub "ঝ", "jha"
82
+ sub "ঞ", "ña"
83
+
84
+ # Cerebrals
85
+ sub "ট", "ṭa"
86
+ sub "ঠ", "ṭha"
87
+ sub "ড", "ḍa"
88
+ sub "ড়", "ṛa"
89
+ sub "ঢ", "ḍha"
90
+ sub "ঢ়", "ṛha"
91
+ sub "ণ", "ṇa"
92
+
93
+ # Dentals
94
+ sub "ত", "ta"
95
+ sub "ৎ", "t"
96
+ sub "থ", "tha"
97
+ sub "দ", "da"
98
+ sub "ধ", "dha"
99
+ sub "ন", "na"
100
+
101
+ # Labials
102
+ sub "প", "pa"
103
+ sub "ফ", "pha"
104
+ sub "ব", "ba" # see Note 3
105
+ sub "ভ", "bha"
106
+ sub "ম", "ma"
107
+
108
+ # Semivowels
109
+ sub "য", "ya"
110
+ sub "য়", "ẏa"
111
+ sub "র", "ra"
112
+ sub "ল", "la"
113
+ sub "ব", "ba" # see Note 3
114
+
115
+ # Sibilants
116
+ sub "শ", "śa"
117
+ sub "ষ", "sha"
118
+ sub "স", "sa"
119
+
120
+ # Aspirate
121
+ sub "হ", "ha"
122
+
123
+ # Anusvāra
124
+ sub "\u0982", "ṃ" # ং anusvāra alone; the previous pattern had a leading space and only matched " ং"
125
+
126
+ # Bisarga
127
+ sub "\u0983", "ḥ" # ঃ bisarga alone; the previous pattern had a leading space and only matched " ঃ"
128
+
129
+ # Candrabindu (anunāsika) see note 4
130
+ sub "\u0981", "n̐" # ঁ : n̐, m̐
131
+
132
+ # Abagraha (see Note 5)
133
+ sub "\u09BD", "’" # ঽ Bengali abagraha (U+09BD) -> apostrophe; was the Devanagari sign U+093D
134
+ }
135
+ }