interscript-maps 2.0.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (291)
  1. checksums.yaml +7 -0
  2. data/README.adoc +28 -0
  3. data/interscript-maps.gemspec +28 -0
  4. data/interscript-maps.yaml +235 -0
  5. data/libs/posix.iml +11 -0
  6. data/libs/unicode.iml +13 -0
  7. data/libs/var-Cyrl.iml +7 -0
  8. data/libs/var-kor.iml +17 -0
  9. data/maps-staging/royin-tha-Thai-Latn-1939-generic.imp +98 -0
  10. data/maps-staging/royin-tha-Thai-Latn-1968.imp +156 -0
  11. data/maps-staging/royin-tha-Thai-Latn-1999-chained.imp +161 -0
  12. data/maps-staging/royin-tha-Thai-Latn-1999.imp +78 -0
  13. data/maps-staging/var-tha-Thai-Thai-phonemic.imp +53 -0
  14. data/maps-staging/var-tha-Thai-Zsym-ipa.imp +273 -0
  15. data/maps/acadsin-zho-Hani-Latn-2002.imp +27515 -0
  16. data/maps/alalc-amh-Ethi-Latn-1997.imp +392 -0
  17. data/maps/alalc-amh-Ethi-Latn-2011.imp +85 -0
  18. data/maps/alalc-ara-Arab-Latn-1997.imp +1171 -0
  19. data/maps/alalc-asm-Deva-Latn-1997.imp +214 -0
  20. data/maps/alalc-asm-Deva-Latn-2012.imp +53 -0
  21. data/maps/alalc-aze-Arab-Latn-1997.imp +321 -0
  22. data/maps/alalc-aze-Cyrl-Latn-1997.imp +101 -0
  23. data/maps/alalc-bel-Cyrl-Latn-1997.imp +118 -0
  24. data/maps/alalc-ben-Beng-Latn-1997.imp +225 -0
  25. data/maps/alalc-ben-Beng-Latn-2017.imp +135 -0
  26. data/maps/alalc-bul-Cyrl-Latn-1997.imp +110 -0
  27. data/maps/alalc-div-Thaa-Latn-1997.imp +171 -0
  28. data/maps/alalc-ell-Grek-Latn-1997.imp +381 -0
  29. data/maps/alalc-ell-Grek-Latn-2010.imp +382 -0
  30. data/maps/alalc-guj-Gujr-Latn-1997.imp +223 -0
  31. data/maps/alalc-guj-Gujr-Latn-2011.imp +57 -0
  32. data/maps/alalc-hin-Deva-Latn-1997.imp +248 -0
  33. data/maps/alalc-hin-Deva-Latn-2011.imp +63 -0
  34. data/maps/alalc-kan-Kana-Latn-1997.imp +233 -0
  35. data/maps/alalc-kan-Kana-Latn-2011.imp +58 -0
  36. data/maps/alalc-kat-Geok-Latn-1997.imp +109 -0
  37. data/maps/alalc-kat-Geor-Latn-1997.imp +104 -0
  38. data/maps/alalc-kor-Hang-Latn-1997.imp +68 -0
  39. data/maps/alalc-mal-Mlym-Latn-1997.imp +260 -0
  40. data/maps/alalc-mal-Mlym-Latn-2012.imp +65 -0
  41. data/maps/alalc-mar-Deva-Latn-1997.imp +178 -0
  42. data/maps/alalc-mar-Deva-Latn-2011.imp +51 -0
  43. data/maps/alalc-mkd-Cyrl-Latn-1997.imp +125 -0
  44. data/maps/alalc-mkd-Cyrl-Latn-2013.imp +113 -0
  45. data/maps/alalc-mon-Cyrl-Latn-1997.imp +161 -0
  46. data/maps/alalc-ori-Orya-Latn-1997.imp +234 -0
  47. data/maps/alalc-ori-Orya-Latn-2011.imp +59 -0
  48. data/maps/alalc-pan-Guru-Latn-1997.imp +241 -0
  49. data/maps/alalc-pan-Guru-Latn-2011.imp +71 -0
  50. data/maps/alalc-per-Arab-Latn-1997.imp +318 -0
  51. data/maps/alalc-pli-Deva-Latn-2012.imp +140 -0
  52. data/maps/alalc-pra-Deva-Latn-2012.imp +52 -0
  53. data/maps/alalc-rus-Cyrl-Latn-1997.imp +165 -0
  54. data/maps/alalc-rus-Cyrl-Latn-2012.imp +107 -0
  55. data/maps/alalc-san-Deva-Latn-2012.imp +207 -0
  56. data/maps/alalc-sin-Sinh-Latn-1997.imp +246 -0
  57. data/maps/alalc-sin-Sinh-Latn-2011.imp +63 -0
  58. data/maps/alalc-srp-Cyrl-Latn-1997.imp +124 -0
  59. data/maps/alalc-srp-Cyrl-Latn-2013.imp +115 -0
  60. data/maps/alalc-tam-Taml-Latn-1997.imp +52 -0
  61. data/maps/alalc-tam-Taml-Latn-2011.imp +49 -0
  62. data/maps/alalc-tel-Telu-Latn-1997.imp +237 -0
  63. data/maps/alalc-tel-Telu-Latn-2011.imp +58 -0
  64. data/maps/alalc-ukr-Cyrl-Latn-1997.imp +123 -0
  65. data/maps/alalc-ukr-Cyrl-Latn-2011.imp +32 -0
  66. data/maps/apcbg-bul-Cyrl-Latn-1995.imp +194 -0
  67. data/maps/az-aze-Cyrl-Latn-1939.imp +105 -0
  68. data/maps/az-aze-Cyrl-Latn-1958.imp +50 -0
  69. data/maps/bas-rus-Cyrl-Latn-2017-bss.imp +160 -0
  70. data/maps/bas-rus-Cyrl-Latn-2017-oss.imp +165 -0
  71. data/maps/bgn-jpn-Hrkt-Latn-1962.imp +288 -0
  72. data/maps/bgn-kor-Hang-Latn-1943.imp +31 -0
  73. data/maps/bgn-kor-Kore-Latn-1943.imp +33 -0
  74. data/maps/bgna-bul-Cyrl-Latn-2006.imp +119 -0
  75. data/maps/bgna-bul-Cyrl-Latn-2009.imp +119 -0
  76. data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +393 -0
  77. data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +472 -0
  78. data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +125 -0
  79. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +111 -0
  80. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.imp +169 -0
  81. data/maps/bgnpcgn-bal-Arab-Latn-2008.imp +296 -0
  82. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.imp +200 -0
  83. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +137 -0
  84. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +38 -0
  85. data/maps/bgnpcgn-che-Cyrl-Latn-2008.imp +176 -0
  86. data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +56 -0
  87. data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +90 -0
  88. data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +71 -0
  89. data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +443 -0
  90. data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +269 -0
  91. data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +41 -0
  92. data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +28 -0
  93. data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +111 -0
  94. data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +42 -0
  95. data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +32 -0
  96. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +191 -0
  97. data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +116 -0
  98. data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +43 -0
  99. data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +193 -0
  100. data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +170 -0
  101. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +177 -0
  102. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +40 -0
  103. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +41 -0
  104. data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +240 -0
  105. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +132 -0
  106. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +174 -0
  107. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +168 -0
  108. data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +208 -0
  109. data/maps/bgnpcgn-per-Arab-Latn-1958.imp +312 -0
  110. data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +552 -0
  111. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +445 -0
  112. data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +289 -0
  113. data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +165 -0
  114. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +133 -0
  115. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +195 -0
  116. data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +48 -0
  117. data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +55 -0
  118. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +146 -0
  119. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +185 -0
  120. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +188 -0
  121. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +136 -0
  122. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +88 -0
  123. data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +333 -0
  124. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +145 -0
  125. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +74 -0
  126. data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +7463 -0
  127. data/maps/bis-asm-Beng-Latn-13194-1991.imp +154 -0
  128. data/maps/bis-ben-Beng-Latn-13194-1991.imp +151 -0
  129. data/maps/bis-dev-Deva-Latn-13194-1991.imp +178 -0
  130. data/maps/bis-guj-Gujr-Latn-13194-1991.imp +172 -0
  131. data/maps/bis-kan-Kana-Latn-13194-1991.imp +166 -0
  132. data/maps/bis-mlm-Mlym-Latn-13194-1991.imp +170 -0
  133. data/maps/bis-ori-Orya-Latn-13194-1991.imp +168 -0
  134. data/maps/bis-pnj-Guru-Latn-13194-1991.imp +169 -0
  135. data/maps/bis-tel-Telu-Latn-13194-1991.imp +165 -0
  136. data/maps/bis-tml-Taml-Latn-13194-1991.imp +149 -0
  137. data/maps/by-bel-Cyrl-Latn-1998.imp +123 -0
  138. data/maps/by-bel-Cyrl-Latn-2007.imp +77 -0
  139. data/maps/din-grc-Grek-Latn-31634-2011-t1.imp +627 -0
  140. data/maps/din-hin-Deva-Latn-33904-2018.imp +101 -0
  141. data/maps/din-kat-Geor-Latn-32707-2010.imp +103 -0
  142. data/maps/din-mar-Deva-Latn-33904-2018.imp +83 -0
  143. data/maps/din-nep-Deva-Latn-33904-2018.imp +110 -0
  144. data/maps/din-pli-Deva-Latn-33904-2018.imp +72 -0
  145. data/maps/din-pra-Deva-Latn-33904-2018.imp +66 -0
  146. data/maps/din-san-Deva-Latn-33904-2018.imp +294 -0
  147. data/maps/din-tam-Taml-Latn-33903-2016.imp +187 -0
  148. data/maps/dos-nep-Deva-Latn-1997.imp +47 -0
  149. data/maps/elot-ell-Grek-Latn-743-1982-tl.imp +399 -0
  150. data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +397 -0
  151. data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +34 -0
  152. data/maps/elot-ell-Grek-Latn-743-2001-ts.imp +178 -0
  153. data/maps/ggg-kat-Geor-Latn-2002.imp +75 -0
  154. data/maps/gki-bel-Cyrl-Latn-1992.imp +44 -0
  155. data/maps/gki-bel-Cyrl-Latn-2000.imp +159 -0
  156. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +179 -0
  157. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.imp +132 -0
  158. data/maps/hk-yue-Hani-Latn-1888.imp +29201 -0
  159. data/maps/icao-bel-Cyrl-Latn-9303.imp +136 -0
  160. data/maps/icao-bul-Cyrl-Latn-9303.imp +127 -0
  161. data/maps/icao-fas-Arab-Latn-9303.imp +112 -0
  162. data/maps/icao-heb-Hebr-Latn-9303.imp +160 -0
  163. data/maps/icao-mkd-Cyrl-Latn-9303.imp +126 -0
  164. data/maps/icao-rus-Cyrl-Latn-9303.imp +126 -0
  165. data/maps/icao-srp-Cyrl-Latn-9303.imp +126 -0
  166. data/maps/icao-ukr-Cyrl-Latn-9303.imp +127 -0
  167. data/maps/iso-ara-Arab-Latn-233-1984.imp +301 -0
  168. data/maps/iso-asm-Beng-Latn-15919-2001.imp +73 -0
  169. data/maps/iso-ben-Beng-Latn-15919-2001.imp +171 -0
  170. data/maps/iso-ell-Grek-Latn-843-1997-t1.imp +365 -0
  171. data/maps/iso-ell-Grek-Latn-843-1997-t2.imp +43 -0
  172. data/maps/iso-guj-Gujr-Latn-15919-2001.imp +214 -0
  173. data/maps/iso-hin-Deva-Latn-15919-2001.imp +73 -0
  174. data/maps/iso-inc-Deva-Latn-15919-2001.imp +61 -0
  175. data/maps/iso-jpn-Hrkt-Latn-3602-1989.imp +59 -0
  176. data/maps/iso-kan-Kana-Latn-15919-2001.imp +212 -0
  177. data/maps/iso-kat-Geor-Latn-9984-1996.imp +103 -0
  178. data/maps/iso-kor-Hang-Latn-1996-method1.imp +140 -0
  179. data/maps/iso-kor-Hang-Latn-1996-method2.imp +132 -0
  180. data/maps/iso-mal-Mlym-Latn-15919-2001.imp +276 -0
  181. data/maps/iso-mar-Deva-Latn-15919-2001.imp +68 -0
  182. data/maps/iso-nep-Deva-Latn-15919-2001.imp +75 -0
  183. data/maps/iso-ori-Orya-Latn-15919-2001.imp +188 -0
  184. data/maps/iso-pan-Guru-Latn-15919-2001.imp +217 -0
  185. data/maps/iso-pli-Beng-Latn-15919-2001.imp +66 -0
  186. data/maps/iso-pli-Deva-Latn-15919-2001.imp +68 -0
  187. data/maps/iso-pli-Sinh-Latn-15919-2001.imp +211 -0
  188. data/maps/iso-pli-Thai-Latn-15919-2001.imp +47 -0
  189. data/maps/iso-pra-Deva-Latn-15919-2001.imp +60 -0
  190. data/maps/iso-prs-Arab-Latn-233-3-1999.imp +352 -0
  191. data/maps/iso-rus-Cyrl-Latn-9-1995.imp +279 -0
  192. data/maps/iso-san-Deva-Latn-15919-2001.imp +215 -0
  193. data/maps/iso-tam-Taml-Latn-15919-2001.imp +153 -0
  194. data/maps/iso-tel-Telu-Latn-15919-2001.imp +214 -0
  195. data/maps/iso-tha-Thai-Latn-11940-1998.imp +114 -0
  196. data/maps/kp-kor-Hang-Latn-2002.imp +540 -0
  197. data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +29005 -0
  198. data/maps/masm-mon-Cyrl-Latn-5217-2012.imp +136 -0
  199. data/maps/masm-mon-Latn-Cyrl-5217-2012.imp +162 -0
  200. data/maps/mext-jpn-Hrkt-Latn-1954.imp +403 -0
  201. data/maps/moct-kor-Hang-Latn-2000.imp +475 -0
  202. data/maps/mofa-jpn-Hrkt-Latn-1989.imp +484 -0
  203. data/maps/mv-div-Thaa-Latn-1987.imp +144 -0
  204. data/maps/mvd-bel-Cyrl-Latn-2008.imp +224 -0
  205. data/maps/mvd-bel-Cyrl-Latn-2010.imp +64 -0
  206. data/maps/mvd-rus-Cyrl-Latn-2008.imp +110 -0
  207. data/maps/mvd-rus-Cyrl-Latn-2010.imp +40 -0
  208. data/maps/odni-ara-Arab-Latn-2004.imp +106 -0
  209. data/maps/odni-ara-Arab-Latn-2015.imp +281 -0
  210. data/maps/odni-aze-Cyrl-Latn-2015.imp +158 -0
  211. data/maps/odni-bel-Cyrl-Latn-2015.imp +138 -0
  212. data/maps/odni-bul-Cyrl-Latn-2005.imp +90 -0
  213. data/maps/odni-bul-Cyrl-Latn-2015.imp +103 -0
  214. data/maps/odni-che-Cyrl-Latn-2015.imp +165 -0
  215. data/maps/odni-fas-Arab-Latn-2004.imp +268 -0
  216. data/maps/odni-fas-Arab-Latn-2015.imp +398 -0
  217. data/maps/odni-hin-Deva-Latn-2004.imp +180 -0
  218. data/maps/odni-hin-Deva-Latn-2015.imp +256 -0
  219. data/maps/odni-kat-Geor-Latn-2015.imp +76 -0
  220. data/maps/odni-kaz-Cyrl-Latn-2015.imp +164 -0
  221. data/maps/odni-kir-Cyrl-Latn-2015.imp +149 -0
  222. data/maps/odni-kor-Hang-Latn-2015.imp +307 -0
  223. data/maps/odni-mkd-Cyrl-Latn-2005.imp +28 -0
  224. data/maps/odni-mkd-Cyrl-Latn-2015.imp +124 -0
  225. data/maps/odni-prs-Arab-Latn-2004.imp +120 -0
  226. data/maps/odni-prs-Arab-Latn-2015.imp +225 -0
  227. data/maps/odni-pus-Arab-Latn-2011.imp +327 -0
  228. data/maps/odni-rus-Cyrl-Latn-2015.imp +79 -0
  229. data/maps/odni-srp-Cyrl-Latn-2005.imp +35 -0
  230. data/maps/odni-srp-Cyrl-Latn-2015.imp +130 -0
  231. data/maps/odni-tat-Cyrl-Latn-2015.imp +157 -0
  232. data/maps/odni-tgk-Cyrl-Latn-2015.imp +161 -0
  233. data/maps/odni-tuk-Cyrl-Latn-2015.imp +159 -0
  234. data/maps/odni-uig-Cyrl-Latn-2015.imp +151 -0
  235. data/maps/odni-ukr-Cyrl-Latn-2015.imp +136 -0
  236. data/maps/odni-urd-Arab-Latn-2015.imp +220 -0
  237. data/maps/odni-uzb-Cyrl-Latn-2015.imp +165 -0
  238. data/maps/sac-zho-Hans-Latn-1979.imp +20940 -0
  239. data/maps/sasm-mon-Mong-Latn-general-1978.imp +294 -0
  240. data/maps/sasm-mon-Mong-Latn-phonetic-1978.imp +261 -0
  241. data/maps/ses-ara-Arab-Latn-1930.imp +225 -0
  242. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.imp +171 -0
  243. data/maps/ua-ukr-Cyrl-Latn-1996.imp +149 -0
  244. data/maps/ua-ukr-Cyrl-Latn-2007.imp +69 -0
  245. data/maps/ua-ukr-Cyrl-Latn-2010.imp +128 -0
  246. data/maps/un-amh-Ethi-Latn-2016.imp +483 -0
  247. data/maps/un-ara-Arab-Latn-1971.imp +137 -0
  248. data/maps/un-ara-Arab-Latn-1972.imp +155 -0
  249. data/maps/un-ara-Arab-Latn-2017.imp +375 -0
  250. data/maps/un-asm-Beng-Latn-1972.imp +188 -0
  251. data/maps/un-bel-Cyrl-Latn-2007.imp +78 -0
  252. data/maps/un-ben-Beng-Latn-2016.imp +516 -0
  253. data/maps/un-ell-Grek-Latn-1987-phonetic.imp +437 -0
  254. data/maps/un-ell-Grek-Latn-1987-tl.imp +27 -0
  255. data/maps/un-ell-Grek-Latn-1987-ts.imp +269 -0
  256. data/maps/un-guj-Gujr-Latn-1972.imp +196 -0
  257. data/maps/un-hin-Deva-Latn-2016.imp +356 -0
  258. data/maps/un-kan-Kana-Latn-2016.imp +214 -0
  259. data/maps/un-mal-Mlym-Latn-1972.imp +215 -0
  260. data/maps/un-mar-Deva-Latn-2016.imp +96 -0
  261. data/maps/un-mon-Mong-Latn-general-2013.imp +170 -0
  262. data/maps/un-mon-Mong-Latn-phonetic-2013.imp +170 -0
  263. data/maps/un-nep-Deva-Latn-1972.imp +295 -0
  264. data/maps/un-nep-Deva-Latn-2013.imp +62 -0
  265. data/maps/un-ori-Orya-Latn-1972.imp +208 -0
  266. data/maps/un-pan-Guru-Latn-1972.imp +321 -0
  267. data/maps/un-prs-Arab-Latn-1967.imp +214 -0
  268. data/maps/un-rus-Cyrl-Latn-1987.imp +96 -0
  269. data/maps/un-sin-Sinh-Latn-1972.imp +193 -0
  270. data/maps/un-tam-Taml-Latn-1972.imp +173 -0
  271. data/maps/un-tel-Telu-Latn-1972.imp +229 -0
  272. data/maps/un-ukr-Cyrl-Latn-1998.imp +58 -0
  273. data/maps/un-ukr-Cyrl-Latn-2012.imp +95 -0
  274. data/maps/un-urd-Arab-Latn-1972.imp +290 -0
  275. data/maps/var-amh-Ethi-Latn-eae-2003.imp +414 -0
  276. data/maps/var-gez-Ethi-Latn-eae-2003.imp +54 -0
  277. data/maps/var-hin-Deva-Latn-hunterian-1872.imp +212 -0
  278. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.imp +399 -0
  279. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.imp +382 -0
  280. data/maps/var-kor-Hang-Hang-jamo.imp +11196 -0
  281. data/maps/var-kor-Hang-Latn-mr-1939.imp +574 -0
  282. data/maps/var-kor-Kore-Hang-2013.imp +59764 -0
  283. data/maps/var-kor-Kore-Latn-mr-1939.imp +36 -0
  284. data/maps/var-mar-Deva-Latn-hunterian-1872.imp +39 -0
  285. data/maps/var-mon-Mong-Latn-1930.imp +101 -0
  286. data/maps/var-mon-Mong-Latn-lessing.imp +181 -0
  287. data/maps/var-mon-Mong-Latn-vpmc.imp +182 -0
  288. data/maps/var-pra-Deva-Latn-iast-1912.imp +36 -0
  289. data/maps/var-san-Deva-Latn-iast-1912.imp +147 -0
  290. data/maps/var-zho-Hani-Latn-wd-1979.imp +27549 -0
  291. metadata +335 -0
@@ -0,0 +1,156 @@
1
+ metadata {
2
+ authority_id: royin
3
+ id: 1968-chained
4
+ language: iso-639-2:tha
5
+ source_script: Thai
6
+ destination_script: Latn
7
+ name: Royal Thai General System of Transcription (1968)
8
+ url: http://www.royin.go.th/wp-content/uploads/royin-ebook/276/FileUpload/758_6484.pdf
9
+ creation_date: 1968
10
+ adoption_date:
11
+ description: |
12
+ This map loads two external maps to convert Thai text first into phonemic Thai,
13
+ and then into IPA transcription.
14
+
15
+ The IPA transcription will then be handled by this map, and converted into
16
+ Royal Thai General System of Transcription (1968).
17
+
18
+ The first two parts are done via two external maps.
19
+
20
+ notes: |
21
+ The conversion from Thai to Phonemic Thai is still work-in-progress.
22
+ }
23
+
24
+ tests {
25
+ test "สะพาน", "saphan"
26
+ test "ลานตา", "lanta"
27
+ test "บาง", "bang"
28
+ test "สมุทร", "samut"
29
+ test "ลำ", "lam"
30
+ test "สิงห์", "sing"
31
+ test "บุรี", "buri"
32
+ test "สตึก", "satuk"
33
+ test "พืช", "phut"
34
+ test "บรบือ", "borabu"
35
+ test "ภู", "phu"
36
+ test "ปะนาเระ", "panare"
37
+ test "เพ็ญ", "phen"
38
+ # - source: "เขน"
39
+ # expected: "khen"
40
+ test "แซะ", "sae"
41
+ # - source: "สะแก"
42
+ # expected: "sakae"
43
+ test "พะโต๊ะ", "phato"
44
+ test "ลพ", "lop"
45
+ # - source: "สามโก้"
46
+ # expected: "samko"
47
+ test "เกาะ", "ko"
48
+ test "บ่อ", "bo"
49
+ test "เซอะ", "soe"
50
+ test "อำเภอ", "amphoe"
51
+ test "เนิน", "noen"
52
+ # - source: "เพียะ"
53
+ # expected: "phia"
54
+ test "เทียน", "thian"
55
+ # - source: "เกือะ"
56
+ # expected: "kua"
57
+ test "เมือง", "muang"
58
+ # - source: "ผัวะ"
59
+ # expected: "phua"
60
+ test "บัว", "bua"
61
+ # - source: "ควน"
62
+ # expected: "khuan"
63
+ test "ใหญ่", "yai"
64
+ # - source: "ไผ่"
65
+ # expected: "phai"
66
+ test "ชัย", "chai"
67
+ test "ไทย", "thai"
68
+ # - source: "ปาย"
69
+ # expected: "pai"
70
+ test "เจ้า", "chao"
71
+ test "ข้าว", "khao"
72
+ # - source: "กุย"
73
+ # expected: "kui"
74
+ test "โดย", "doi"
75
+ # - source: "ดอย"
76
+ # expected: "doi"
77
+ # - source: "งิ้ว"
78
+ # expected: "ngiu"
79
+ test "เร็ว", "reo"
80
+ # - source: "เลว"
81
+ # expected: "leo"
82
+ # - source: "เลย"
83
+ # expected: "loei"
84
+ # - source: "เดือย"
85
+ # expected: "duai"
86
+ # - source: "ห้วย"
87
+ # expected: "huai"
88
+ test "แมว", "maeo"
89
+ test "เขียว", "khieu"
90
+ }
91
+
92
+ # This map has been partially converted by the bin/maps_v1_to_v2 script.
93
+ # The section below requires human attention. Remember to remove this
94
+ # comment and move the converted map to the 'maps/' directory. Please also
95
+ # take note that the maps-staging directory will be cleaned up whenever
96
+ # you run the bin/maps_v1_to_v2 script. You should particularly be
97
+ # concerned about any regular expressions found in this file and about
98
+ # advanced expressions in parallel {} parts, and also about the order
99
+ # of particular parts of the stage.
100
+
101
+ dependency "var-tha-Thai-Thai-phonemic", as: thaiphonemic
102
+ dependency "var-tha-Thai-Zsym-ipa", as: thaizsym
103
+
104
+ stage {
105
+ run map.thaiphonemic.stage.main
106
+ run map.thaizsym.stage.main
107
+
108
+ # DICTIONARY
109
+ parallel {
110
+
111
+ sub "̯", ""
112
+ sub "̚", ""
113
+
114
+ sub "ʔ", ""
115
+ sub "ː", ""
116
+
117
+ sub "t͡ɕʰ", "ch"
118
+ sub "t͡ɕ", "ch"
119
+ sub "ŋ", "ng"
120
+ sub "j", "y"
121
+ sub "ɔ", "o"
122
+ sub "ɤ", "oe"
123
+ sub "ɛ", "ae"
124
+ sub "ɯ", "u"
125
+ sub "ʰ", "h"
126
+
127
+ sub "aːw", "ao"
128
+ sub "aw", "ao"
129
+ sub "a̯w", "eu"
130
+ sub "eːw", "eo"
131
+ sub "ew", "eo"
132
+ sub "ɛːw", "aeo"
133
+ sub "ɛw", "aeo"
134
+ sub "iːw", "iu"
135
+ sub "iw", "iu"
136
+
137
+ sub "aːj", "ai"
138
+ sub "aj", "ai"
139
+ sub "a̯j", "ai"
140
+ sub "ɔːj", "oi"
141
+ sub "ɔj", "oi"
142
+ sub "oːj", "oi"
143
+ sub "oj", "oi"
144
+ sub "ɤːj", "oei"
145
+ sub "ɤj", "oei"
146
+ sub "uːj", "ui"
147
+ sub "uj", "ui"
148
+ }
149
+
150
+ # RULES
151
+ sub any("˩˨˧˦˥"), ""
152
+ sub line_start, "."
153
+
154
+ # POSTRULES
155
+ sub ".", ""
156
+ }
@@ -0,0 +1,161 @@
1
+ metadata {
2
+ authority_id: royin
3
+ id: 1999-chained
4
+ language: iso-639-2:tha
5
+ source_script: Thai
6
+ destination_script: Latn
7
+ name: Royal Thai General System of Transcription (1999)
8
+ url: http://www.royin.go.th/wp-content/uploads/royin-ebook/276/FileUpload/758_6484.pdf
9
+ creation_date: 1999
10
+ adoption_date:
11
+ description: |
12
+ This map loads two external maps to convert Thai text first into phonemic Thai,
13
+ and then into IPA transcription.
14
+
15
+ The IPA transcription will then be handled by this map, and converted into
16
+ Royal Thai General System of Transcription (1999).
17
+
18
+ The first two parts are done via two external maps.
19
+
20
+ notes: |
21
+ The conversion from Thai to Phonemic Thai is still work-in-progress.
22
+ }
23
+
24
+ tests {
25
+ test "สะพาน", "saphan"
26
+ test "ลานตา", "lanta"
27
+ test "บาง", "bang"
28
+ test "สมุทร", "samut"
29
+ test "ลำ", "lam"
30
+ test "สิงห์", "sing"
31
+ test "บุรี", "buri"
32
+ test "สตึก", "satuek"
33
+ test "พืช", "phuet"
34
+ test "บรบือ", "borabue"
35
+ test "ภู", "phu"
36
+ test "ปะนาเระ", "panare"
37
+ test "เพ็ญ", "phen"
38
+ # - source: "เขน"
39
+ # expected: "khen"
40
+ test "แซะ", "sae"
41
+ # - source: "สะแก"
42
+ # expected: "sakae"
43
+ test "พะโต๊ะ", "phato"
44
+ test "ลพ", "lop"
45
+ # - source: "สามโก้"
46
+ # expected: "samko"
47
+ test "เกาะ", "ko"
48
+ test "บ่อ", "bo"
49
+ test "เซอะ", "soe"
50
+ test "อำเภอ", "amphoe"
51
+ test "เนิน", "noen"
52
+ # - source: "เพียะ"
53
+ # expected: "phia"
54
+ test "เทียน", "thian"
55
+ # - source: "เกือะ"
56
+ # expected: "kuea"
57
+ test "เมือง", "mueang"
58
+ # - source: "ผัวะ"
59
+ # expected: "phua"
60
+ test "บัว", "bua"
61
+ # - source: "ควน"
62
+ # expected: "khuan"
63
+ test "ใหญ่", "yai"
64
+ # - source: "ไผ่"
65
+ # expected: "phai"
66
+ test "ชัย", "chai"
67
+ test "ไทย", "thai"
68
+ # - source: "ปาย"
69
+ # expected: "pai"
70
+ test "เจ้า", "chao"
71
+ test "ข้าว", "khao"
72
+ # - source: "กุย"
73
+ # expected: "kui"
74
+ test "โดย", "doi"
75
+ # - source: "ดอย"
76
+ # expected: "doi"
77
+ # - source: "งิ้ว"
78
+ # expected: "ngio"
79
+ test "เร็ว", "reo"
80
+ # - source: "เลว"
81
+ # expected: "leo"
82
+ # - source: "เลย"
83
+ # expected: "loei"
84
+ # - source: "เดือย"
85
+ # expected: "dueai"
86
+ # - source: "ห้วย"
87
+ # expected: "huai"
88
+ test "แมว", "maeo"
89
+ test "เขียว", "khiao"
90
+ }
91
+
92
+ # This map has been partially converted by the bin/maps_v1_to_v2 script.
93
+ # The section below requires human attention. Remember to remove this
94
+ # comment and move the converted map to the 'maps/' directory. Please also
95
+ # take note that the maps-staging directory will be cleaned up whenever
96
+ # you run the bin/maps_v1_to_v2 script. You should particularly be
97
+ # concerned about any regular expressions found in this file and about
98
+ # advanced expressions in parallel {} parts, and also about the order
99
+ # of particular parts of the stage.
100
+
101
+ dependency "var-tha-Thai-Thai-phonemic", as: thaiphonemic
102
+ dependency "var-tha-Thai-Zsym-ipa", as: thaizsym
103
+
104
+ stage {
105
+ run map.thaiphonemic.stage.main
106
+ run map.thaizsym.stage.main
107
+
108
+ # DICTIONARY
109
+ parallel {
110
+
111
+ sub "̯", ""
112
+ sub "̚", ""
113
+
114
+ sub "ʔ", ""
115
+ sub "ː", ""
116
+
117
+ sub "t͡ɕʰ", "ch"
118
+ sub "t͡ɕ", "ch"
119
+ sub "ŋ", "ng"
120
+ sub "j", "y"
121
+ sub "ɔ", "o"
122
+ sub "ɤ", "oe"
123
+ sub "ɛ", "ae"
124
+ sub "ɯ", "ue" # New spelling, was u in 1968
125
+ sub "ʰ", "h"
126
+
127
+ sub "aːw", "ao"
128
+ sub "aw", "ao"
129
+ sub "a̯w", "ao" # New spelling, was eu in 1968
130
+ sub "eːw", "eo"
131
+ sub "ew", "eo"
132
+ sub "ɛːw", "aeo"
133
+ sub "ɛw", "aeo"
134
+ sub "iːw", "io" # New spelling, was iu in 1968
135
+ sub "iw", "io" # New spelling, was iu in 1968
136
+
137
+ sub "aːj", "ai"
138
+ sub "aj", "ai"
139
+ sub "a̯j", "ai"
140
+ sub "ɔːj", "oi"
141
+ sub "ɔj", "oi"
142
+ sub "oːj", "oi"
143
+ sub "oj", "oi"
144
+ sub "ɤːj", "oei"
145
+ sub "ɤj", "oei"
146
+ sub "uːj", "ui"
147
+ sub "uj", "ui"
148
+ }
149
+
150
+ # RULES
151
+ sub any("˩˨˧˦˥"), ""
152
+ sub line_start, "."
153
+
154
+ # CHARACTERS
155
+ parallel {
156
+
157
+ }
158
+
159
+ # POSTRULES
160
+ sub ".", ""
161
+ }
@@ -0,0 +1,78 @@
1
+ metadata {
2
+ authority_id: royin
3
+ id: 1999
4
+ language: iso-639-2:tha
5
+ source_script: Thai
6
+ destination_script: Latn
7
+ name: Royal Thai General System of Transcription (1999)
8
+ url: http://www.royin.go.th/wp-content/uploads/royin-ebook/276/FileUpload/758_6484.pdf
9
+ creation_date: 1999
10
+ adoption_date:
11
+ description:
12
+
13
+ notes: |
14
+ }
15
+
16
+ tests {
17
+ test "ภาษาไทย", "phasathai"
18
+ test "ไทย", "thai"
19
+ test "เชียงใหม่", "chiangmai"
20
+ test "ใหม่", "mai"
21
+ test "ใคร", "khrai"
22
+ test "ที่", "thi"
23
+ test "เป็น", "pen"
24
+ test "ใน", "nai"
25
+ test "การ", "kan"
26
+ test "มี", "mi"
27
+ test "ได้", "dai"
28
+ test "ของ", "khong"
29
+ test "ไม่", "mai"
30
+ test "สถานีปางต้นผึ้ง", "sathanipangtonphueng"
31
+ test "ไพศาลี", "phaisali"
32
+ test "โรงเรียนไม้เรียงประชาสรรค์", "rongrianmairiangprachasan"
33
+ }
34
+
35
+ # This map has been partially converted by the bin/maps_v1_to_v2 script.
36
+ # The section below requires human attention. Remember to remove this
37
+ # comment and move the converted map to the 'maps/' directory. Please also
38
+ # take note that the maps-staging directory will be cleaned up whenever
39
+ # you run the bin/maps_v1_to_v2 script. You should particularly be
40
+ # concerned about any regular expressions found in this file and about
41
+ # advanced expressions in parallel {} parts, and also about the order
42
+ # of particular parts of the stage.
43
+
44
+
45
+ stage {
46
+
47
+ # DICTIONARY
48
+ parallel {
49
+ sub "ʰ", "h"
50
+ sub "c", "ch"
51
+ sub "ː", ""
52
+ sub "ŋ", "ng"
53
+ sub "j", "i"
54
+ sub "w", "o"
55
+ sub "ɔ", "o"
56
+ sub "ɤ", "oe"
57
+ sub "ɛ", "ae"
58
+ sub "ɯ", "ue"
59
+ sub "ʔ", ""
60
+ sub "t͡ɕ", "c"
61
+ sub any_character, ""
62
+ }
63
+
64
+ # RULES
65
+
66
+ # CHARACTERS
67
+ parallel {
68
+ sub any("0".."9"), ""
69
+
70
+ }
71
+
72
+ # POSTRULES
73
+ sub "chh", "ch"
74
+
75
+ }
76
+
77
+ # This map contains transcription and probably depends on seq2seq:
78
+ # transcription: sequitur.pythainlp_lexicon
@@ -0,0 +1,53 @@
1
+ metadata {
2
+ authority_id: var
3
+ id: phonemic
4
+ language: iso-639-2:tha
5
+ source_script: Thai
6
+ destination_script: Thai
7
+ name: Phonemic Thai (Royal Thai General Dictionary)
8
+ url:
9
+ creation_date:
10
+ adoption_date:
11
+ description:
12
+ This map performs two tasks.
13
+
14
+ First, the text is segmented using a dictionary.
15
+ Then the Thai text is sent to an external module to be converted into
16
+ Phonemic Thai.
17
+
18
+ Note that the accuracy for vowel length distinction and certain tonal alternations
19
+ is low.
20
+
21
+ notes: |
22
+ }
23
+
24
+ tests {
25
+ test "ที่เปิดขวด", "ที่-เปิด-ขวด"
26
+ test "พื้นหลัง", "พื้น-หฺลัง"
27
+ test "สมชาย", "สม-ชาย"
28
+ test "อ่อนข้อ", "อ็่อน-ค่อ"
29
+ test "โครยอ", "โค-ระ-ยอ"
30
+ test "ไล่ออก", "ไล่-ออก"
31
+ test "ไส้เลื่อน", "ไส้-เลื่อน"
32
+ test "ความวาว", "คฺวาม-วาว"
33
+ test "ไอกรน", "ไอ-กฺรน"
34
+ test "ไอซียู", "ไอ-ซี-ยู"
35
+ test "ไอซ์แลนด์", "ไอ๊ส-แลน"
36
+ }
37
+
38
+ # This map has been partially converted by the bin/maps_v1_to_v2 script.
39
+ # The section below requires human attention. Remember to remove this
40
+ # comment and move the converted map to the 'maps/' directory. Please also
41
+ # take note that the maps-staging directory will be cleaned up whenever
42
+ # you run the bin/maps_v1_to_v2 script. You should particularly be
43
+ # concerned about any regular expressions found in this file and about
44
+ # advanced expressions in parallel {} parts, and also about the order
45
+ # of particular parts of the stage.
46
+
47
+ # Not yet implemented
48
+
49
+ stage {
50
+ }
51
+
52
+ # This map contains transcription and probably depends on seq2seq:
53
+ # transcription: sequitur.wiktionary_phonemic