interscript-maps 2.0.5

Sign up to get free protection for your applications and to get access to all the features.
Files changed (291) hide show
  1. checksums.yaml +7 -0
  2. data/README.adoc +28 -0
  3. data/interscript-maps.gemspec +28 -0
  4. data/interscript-maps.yaml +235 -0
  5. data/libs/posix.iml +11 -0
  6. data/libs/unicode.iml +13 -0
  7. data/libs/var-Cyrl.iml +7 -0
  8. data/libs/var-kor.iml +17 -0
  9. data/maps-staging/royin-tha-Thai-Latn-1939-generic.imp +98 -0
  10. data/maps-staging/royin-tha-Thai-Latn-1968.imp +156 -0
  11. data/maps-staging/royin-tha-Thai-Latn-1999-chained.imp +161 -0
  12. data/maps-staging/royin-tha-Thai-Latn-1999.imp +78 -0
  13. data/maps-staging/var-tha-Thai-Thai-phonemic.imp +53 -0
  14. data/maps-staging/var-tha-Thai-Zsym-ipa.imp +273 -0
  15. data/maps/acadsin-zho-Hani-Latn-2002.imp +27515 -0
  16. data/maps/alalc-amh-Ethi-Latn-1997.imp +392 -0
  17. data/maps/alalc-amh-Ethi-Latn-2011.imp +85 -0
  18. data/maps/alalc-ara-Arab-Latn-1997.imp +1171 -0
  19. data/maps/alalc-asm-Deva-Latn-1997.imp +214 -0
  20. data/maps/alalc-asm-Deva-Latn-2012.imp +53 -0
  21. data/maps/alalc-aze-Arab-Latn-1997.imp +321 -0
  22. data/maps/alalc-aze-Cyrl-Latn-1997.imp +101 -0
  23. data/maps/alalc-bel-Cyrl-Latn-1997.imp +118 -0
  24. data/maps/alalc-ben-Beng-Latn-1997.imp +225 -0
  25. data/maps/alalc-ben-Beng-Latn-2017.imp +135 -0
  26. data/maps/alalc-bul-Cyrl-Latn-1997.imp +110 -0
  27. data/maps/alalc-div-Thaa-Latn-1997.imp +171 -0
  28. data/maps/alalc-ell-Grek-Latn-1997.imp +381 -0
  29. data/maps/alalc-ell-Grek-Latn-2010.imp +382 -0
  30. data/maps/alalc-guj-Gujr-Latn-1997.imp +223 -0
  31. data/maps/alalc-guj-Gujr-Latn-2011.imp +57 -0
  32. data/maps/alalc-hin-Deva-Latn-1997.imp +248 -0
  33. data/maps/alalc-hin-Deva-Latn-2011.imp +63 -0
  34. data/maps/alalc-kan-Kana-Latn-1997.imp +233 -0
  35. data/maps/alalc-kan-Kana-Latn-2011.imp +58 -0
  36. data/maps/alalc-kat-Geok-Latn-1997.imp +109 -0
  37. data/maps/alalc-kat-Geor-Latn-1997.imp +104 -0
  38. data/maps/alalc-kor-Hang-Latn-1997.imp +68 -0
  39. data/maps/alalc-mal-Mlym-Latn-1997.imp +260 -0
  40. data/maps/alalc-mal-Mlym-Latn-2012.imp +65 -0
  41. data/maps/alalc-mar-Deva-Latn-1997.imp +178 -0
  42. data/maps/alalc-mar-Deva-Latn-2011.imp +51 -0
  43. data/maps/alalc-mkd-Cyrl-Latn-1997.imp +125 -0
  44. data/maps/alalc-mkd-Cyrl-Latn-2013.imp +113 -0
  45. data/maps/alalc-mon-Cyrl-Latn-1997.imp +161 -0
  46. data/maps/alalc-ori-Orya-Latn-1997.imp +234 -0
  47. data/maps/alalc-ori-Orya-Latn-2011.imp +59 -0
  48. data/maps/alalc-pan-Guru-Latn-1997.imp +241 -0
  49. data/maps/alalc-pan-Guru-Latn-2011.imp +71 -0
  50. data/maps/alalc-per-Arab-Latn-1997.imp +318 -0
  51. data/maps/alalc-pli-Deva-Latn-2012.imp +140 -0
  52. data/maps/alalc-pra-Deva-Latn-2012.imp +52 -0
  53. data/maps/alalc-rus-Cyrl-Latn-1997.imp +165 -0
  54. data/maps/alalc-rus-Cyrl-Latn-2012.imp +107 -0
  55. data/maps/alalc-san-Deva-Latn-2012.imp +207 -0
  56. data/maps/alalc-sin-Sinh-Latn-1997.imp +246 -0
  57. data/maps/alalc-sin-Sinh-Latn-2011.imp +63 -0
  58. data/maps/alalc-srp-Cyrl-Latn-1997.imp +124 -0
  59. data/maps/alalc-srp-Cyrl-Latn-2013.imp +115 -0
  60. data/maps/alalc-tam-Taml-Latn-1997.imp +52 -0
  61. data/maps/alalc-tam-Taml-Latn-2011.imp +49 -0
  62. data/maps/alalc-tel-Telu-Latn-1997.imp +237 -0
  63. data/maps/alalc-tel-Telu-Latn-2011.imp +58 -0
  64. data/maps/alalc-ukr-Cyrl-Latn-1997.imp +123 -0
  65. data/maps/alalc-ukr-Cyrl-Latn-2011.imp +32 -0
  66. data/maps/apcbg-bul-Cyrl-Latn-1995.imp +194 -0
  67. data/maps/az-aze-Cyrl-Latn-1939.imp +105 -0
  68. data/maps/az-aze-Cyrl-Latn-1958.imp +50 -0
  69. data/maps/bas-rus-Cyrl-Latn-2017-bss.imp +160 -0
  70. data/maps/bas-rus-Cyrl-Latn-2017-oss.imp +165 -0
  71. data/maps/bgn-jpn-Hrkt-Latn-1962.imp +288 -0
  72. data/maps/bgn-kor-Hang-Latn-1943.imp +31 -0
  73. data/maps/bgn-kor-Kore-Latn-1943.imp +33 -0
  74. data/maps/bgna-bul-Cyrl-Latn-2006.imp +119 -0
  75. data/maps/bgna-bul-Cyrl-Latn-2009.imp +119 -0
  76. data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +393 -0
  77. data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +472 -0
  78. data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +125 -0
  79. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +111 -0
  80. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.imp +169 -0
  81. data/maps/bgnpcgn-bal-Arab-Latn-2008.imp +296 -0
  82. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.imp +200 -0
  83. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +137 -0
  84. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +38 -0
  85. data/maps/bgnpcgn-che-Cyrl-Latn-2008.imp +176 -0
  86. data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +56 -0
  87. data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +90 -0
  88. data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +71 -0
  89. data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +443 -0
  90. data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +269 -0
  91. data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +41 -0
  92. data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +28 -0
  93. data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +111 -0
  94. data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +42 -0
  95. data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +32 -0
  96. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +191 -0
  97. data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +116 -0
  98. data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +43 -0
  99. data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +193 -0
  100. data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +170 -0
  101. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +177 -0
  102. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +40 -0
  103. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +41 -0
  104. data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +240 -0
  105. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +132 -0
  106. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +174 -0
  107. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +168 -0
  108. data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +208 -0
  109. data/maps/bgnpcgn-per-Arab-Latn-1958.imp +312 -0
  110. data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +552 -0
  111. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +445 -0
  112. data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +289 -0
  113. data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +165 -0
  114. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +133 -0
  115. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +195 -0
  116. data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +48 -0
  117. data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +55 -0
  118. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +146 -0
  119. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +185 -0
  120. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +188 -0
  121. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +136 -0
  122. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +88 -0
  123. data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +333 -0
  124. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +145 -0
  125. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +74 -0
  126. data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +7463 -0
  127. data/maps/bis-asm-Beng-Latn-13194-1991.imp +154 -0
  128. data/maps/bis-ben-Beng-Latn-13194-1991.imp +151 -0
  129. data/maps/bis-dev-Deva-Latn-13194-1991.imp +178 -0
  130. data/maps/bis-guj-Gujr-Latn-13194-1991.imp +172 -0
  131. data/maps/bis-kan-Kana-Latn-13194-1991.imp +166 -0
  132. data/maps/bis-mlm-Mlym-Latn-13194-1991.imp +170 -0
  133. data/maps/bis-ori-Orya-Latn-13194-1991.imp +168 -0
  134. data/maps/bis-pnj-Guru-Latn-13194-1991.imp +169 -0
  135. data/maps/bis-tel-Telu-Latn-13194-1991.imp +165 -0
  136. data/maps/bis-tml-Taml-Latn-13194-1991.imp +149 -0
  137. data/maps/by-bel-Cyrl-Latn-1998.imp +123 -0
  138. data/maps/by-bel-Cyrl-Latn-2007.imp +77 -0
  139. data/maps/din-grc-Grek-Latn-31634-2011-t1.imp +627 -0
  140. data/maps/din-hin-Deva-Latn-33904-2018.imp +101 -0
  141. data/maps/din-kat-Geor-Latn-32707-2010.imp +103 -0
  142. data/maps/din-mar-Deva-Latn-33904-2018.imp +83 -0
  143. data/maps/din-nep-Deva-Latn-33904-2018.imp +110 -0
  144. data/maps/din-pli-Deva-Latn-33904-2018.imp +72 -0
  145. data/maps/din-pra-Deva-Latn-33904-2018.imp +66 -0
  146. data/maps/din-san-Deva-Latn-33904-2018.imp +294 -0
  147. data/maps/din-tam-Taml-Latn-33903-2016.imp +187 -0
  148. data/maps/dos-nep-Deva-Latn-1997.imp +47 -0
  149. data/maps/elot-ell-Grek-Latn-743-1982-tl.imp +399 -0
  150. data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +397 -0
  151. data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +34 -0
  152. data/maps/elot-ell-Grek-Latn-743-2001-ts.imp +178 -0
  153. data/maps/ggg-kat-Geor-Latn-2002.imp +75 -0
  154. data/maps/gki-bel-Cyrl-Latn-1992.imp +44 -0
  155. data/maps/gki-bel-Cyrl-Latn-2000.imp +159 -0
  156. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +179 -0
  157. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.imp +132 -0
  158. data/maps/hk-yue-Hani-Latn-1888.imp +29201 -0
  159. data/maps/icao-bel-Cyrl-Latn-9303.imp +136 -0
  160. data/maps/icao-bul-Cyrl-Latn-9303.imp +127 -0
  161. data/maps/icao-fas-Arab-Latn-9303.imp +112 -0
  162. data/maps/icao-heb-Hebr-Latn-9303.imp +160 -0
  163. data/maps/icao-mkd-Cyrl-Latn-9303.imp +126 -0
  164. data/maps/icao-rus-Cyrl-Latn-9303.imp +126 -0
  165. data/maps/icao-srp-Cyrl-Latn-9303.imp +126 -0
  166. data/maps/icao-ukr-Cyrl-Latn-9303.imp +127 -0
  167. data/maps/iso-ara-Arab-Latn-233-1984.imp +301 -0
  168. data/maps/iso-asm-Beng-Latn-15919-2001.imp +73 -0
  169. data/maps/iso-ben-Beng-Latn-15919-2001.imp +171 -0
  170. data/maps/iso-ell-Grek-Latn-843-1997-t1.imp +365 -0
  171. data/maps/iso-ell-Grek-Latn-843-1997-t2.imp +43 -0
  172. data/maps/iso-guj-Gujr-Latn-15919-2001.imp +214 -0
  173. data/maps/iso-hin-Deva-Latn-15919-2001.imp +73 -0
  174. data/maps/iso-inc-Deva-Latn-15919-2001.imp +61 -0
  175. data/maps/iso-jpn-Hrkt-Latn-3602-1989.imp +59 -0
  176. data/maps/iso-kan-Kana-Latn-15919-2001.imp +212 -0
  177. data/maps/iso-kat-Geor-Latn-9984-1996.imp +103 -0
  178. data/maps/iso-kor-Hang-Latn-1996-method1.imp +140 -0
  179. data/maps/iso-kor-Hang-Latn-1996-method2.imp +132 -0
  180. data/maps/iso-mal-Mlym-Latn-15919-2001.imp +276 -0
  181. data/maps/iso-mar-Deva-Latn-15919-2001.imp +68 -0
  182. data/maps/iso-nep-Deva-Latn-15919-2001.imp +75 -0
  183. data/maps/iso-ori-Orya-Latn-15919-2001.imp +188 -0
  184. data/maps/iso-pan-Guru-Latn-15919-2001.imp +217 -0
  185. data/maps/iso-pli-Beng-Latn-15919-2001.imp +66 -0
  186. data/maps/iso-pli-Deva-Latn-15919-2001.imp +68 -0
  187. data/maps/iso-pli-Sinh-Latn-15919-2001.imp +211 -0
  188. data/maps/iso-pli-Thai-Latn-15919-2001.imp +47 -0
  189. data/maps/iso-pra-Deva-Latn-15919-2001.imp +60 -0
  190. data/maps/iso-prs-Arab-Latn-233-3-1999.imp +352 -0
  191. data/maps/iso-rus-Cyrl-Latn-9-1995.imp +279 -0
  192. data/maps/iso-san-Deva-Latn-15919-2001.imp +215 -0
  193. data/maps/iso-tam-Taml-Latn-15919-2001.imp +153 -0
  194. data/maps/iso-tel-Telu-Latn-15919-2001.imp +214 -0
  195. data/maps/iso-tha-Thai-Latn-11940-1998.imp +114 -0
  196. data/maps/kp-kor-Hang-Latn-2002.imp +540 -0
  197. data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +29005 -0
  198. data/maps/masm-mon-Cyrl-Latn-5217-2012.imp +136 -0
  199. data/maps/masm-mon-Latn-Cyrl-5217-2012.imp +162 -0
  200. data/maps/mext-jpn-Hrkt-Latn-1954.imp +403 -0
  201. data/maps/moct-kor-Hang-Latn-2000.imp +475 -0
  202. data/maps/mofa-jpn-Hrkt-Latn-1989.imp +484 -0
  203. data/maps/mv-div-Thaa-Latn-1987.imp +144 -0
  204. data/maps/mvd-bel-Cyrl-Latn-2008.imp +224 -0
  205. data/maps/mvd-bel-Cyrl-Latn-2010.imp +64 -0
  206. data/maps/mvd-rus-Cyrl-Latn-2008.imp +110 -0
  207. data/maps/mvd-rus-Cyrl-Latn-2010.imp +40 -0
  208. data/maps/odni-ara-Arab-Latn-2004.imp +106 -0
  209. data/maps/odni-ara-Arab-Latn-2015.imp +281 -0
  210. data/maps/odni-aze-Cyrl-Latn-2015.imp +158 -0
  211. data/maps/odni-bel-Cyrl-Latn-2015.imp +138 -0
  212. data/maps/odni-bul-Cyrl-Latn-2005.imp +90 -0
  213. data/maps/odni-bul-Cyrl-Latn-2015.imp +103 -0
  214. data/maps/odni-che-Cyrl-Latn-2015.imp +165 -0
  215. data/maps/odni-fas-Arab-Latn-2004.imp +268 -0
  216. data/maps/odni-fas-Arab-Latn-2015.imp +398 -0
  217. data/maps/odni-hin-Deva-Latn-2004.imp +180 -0
  218. data/maps/odni-hin-Deva-Latn-2015.imp +256 -0
  219. data/maps/odni-kat-Geor-Latn-2015.imp +76 -0
  220. data/maps/odni-kaz-Cyrl-Latn-2015.imp +164 -0
  221. data/maps/odni-kir-Cyrl-Latn-2015.imp +149 -0
  222. data/maps/odni-kor-Hang-Latn-2015.imp +307 -0
  223. data/maps/odni-mkd-Cyrl-Latn-2005.imp +28 -0
  224. data/maps/odni-mkd-Cyrl-Latn-2015.imp +124 -0
  225. data/maps/odni-prs-Arab-Latn-2004.imp +120 -0
  226. data/maps/odni-prs-Arab-Latn-2015.imp +225 -0
  227. data/maps/odni-pus-Arab-Latn-2011.imp +327 -0
  228. data/maps/odni-rus-Cyrl-Latn-2015.imp +79 -0
  229. data/maps/odni-srp-Cyrl-Latn-2005.imp +35 -0
  230. data/maps/odni-srp-Cyrl-Latn-2015.imp +130 -0
  231. data/maps/odni-tat-Cyrl-Latn-2015.imp +157 -0
  232. data/maps/odni-tgk-Cyrl-Latn-2015.imp +161 -0
  233. data/maps/odni-tuk-Cyrl-Latn-2015.imp +159 -0
  234. data/maps/odni-uig-Cyrl-Latn-2015.imp +151 -0
  235. data/maps/odni-ukr-Cyrl-Latn-2015.imp +136 -0
  236. data/maps/odni-urd-Arab-Latn-2015.imp +220 -0
  237. data/maps/odni-uzb-Cyrl-Latn-2015.imp +165 -0
  238. data/maps/sac-zho-Hans-Latn-1979.imp +20940 -0
  239. data/maps/sasm-mon-Mong-Latn-general-1978.imp +294 -0
  240. data/maps/sasm-mon-Mong-Latn-phonetic-1978.imp +261 -0
  241. data/maps/ses-ara-Arab-Latn-1930.imp +225 -0
  242. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.imp +171 -0
  243. data/maps/ua-ukr-Cyrl-Latn-1996.imp +149 -0
  244. data/maps/ua-ukr-Cyrl-Latn-2007.imp +69 -0
  245. data/maps/ua-ukr-Cyrl-Latn-2010.imp +128 -0
  246. data/maps/un-amh-Ethi-Latn-2016.imp +483 -0
  247. data/maps/un-ara-Arab-Latn-1971.imp +137 -0
  248. data/maps/un-ara-Arab-Latn-1972.imp +155 -0
  249. data/maps/un-ara-Arab-Latn-2017.imp +375 -0
  250. data/maps/un-asm-Beng-Latn-1972.imp +188 -0
  251. data/maps/un-bel-Cyrl-Latn-2007.imp +78 -0
  252. data/maps/un-ben-Beng-Latn-2016.imp +516 -0
  253. data/maps/un-ell-Grek-Latn-1987-phonetic.imp +437 -0
  254. data/maps/un-ell-Grek-Latn-1987-tl.imp +27 -0
  255. data/maps/un-ell-Grek-Latn-1987-ts.imp +269 -0
  256. data/maps/un-guj-Gujr-Latn-1972.imp +196 -0
  257. data/maps/un-hin-Deva-Latn-2016.imp +356 -0
  258. data/maps/un-kan-Kana-Latn-2016.imp +214 -0
  259. data/maps/un-mal-Mlym-Latn-1972.imp +215 -0
  260. data/maps/un-mar-Deva-Latn-2016.imp +96 -0
  261. data/maps/un-mon-Mong-Latn-general-2013.imp +170 -0
  262. data/maps/un-mon-Mong-Latn-phonetic-2013.imp +170 -0
  263. data/maps/un-nep-Deva-Latn-1972.imp +295 -0
  264. data/maps/un-nep-Deva-Latn-2013.imp +62 -0
  265. data/maps/un-ori-Orya-Latn-1972.imp +208 -0
  266. data/maps/un-pan-Guru-Latn-1972.imp +321 -0
  267. data/maps/un-prs-Arab-Latn-1967.imp +214 -0
  268. data/maps/un-rus-Cyrl-Latn-1987.imp +96 -0
  269. data/maps/un-sin-Sinh-Latn-1972.imp +193 -0
  270. data/maps/un-tam-Taml-Latn-1972.imp +173 -0
  271. data/maps/un-tel-Telu-Latn-1972.imp +229 -0
  272. data/maps/un-ukr-Cyrl-Latn-1998.imp +58 -0
  273. data/maps/un-ukr-Cyrl-Latn-2012.imp +95 -0
  274. data/maps/un-urd-Arab-Latn-1972.imp +290 -0
  275. data/maps/var-amh-Ethi-Latn-eae-2003.imp +414 -0
  276. data/maps/var-gez-Ethi-Latn-eae-2003.imp +54 -0
  277. data/maps/var-hin-Deva-Latn-hunterian-1872.imp +212 -0
  278. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.imp +399 -0
  279. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.imp +382 -0
  280. data/maps/var-kor-Hang-Hang-jamo.imp +11196 -0
  281. data/maps/var-kor-Hang-Latn-mr-1939.imp +574 -0
  282. data/maps/var-kor-Kore-Hang-2013.imp +59764 -0
  283. data/maps/var-kor-Kore-Latn-mr-1939.imp +36 -0
  284. data/maps/var-mar-Deva-Latn-hunterian-1872.imp +39 -0
  285. data/maps/var-mon-Mong-Latn-1930.imp +101 -0
  286. data/maps/var-mon-Mong-Latn-lessing.imp +181 -0
  287. data/maps/var-mon-Mong-Latn-vpmc.imp +182 -0
  288. data/maps/var-pra-Deva-Latn-iast-1912.imp +36 -0
  289. data/maps/var-san-Deva-Latn-iast-1912.imp +147 -0
  290. data/maps/var-zho-Hani-Latn-wd-1979.imp +27549 -0
  291. metadata +335 -0
@@ -0,0 +1,48 @@
1
+ metadata {
2
+ authority_id: bgnpcgn
3
+ id: 1984
4
+ language: iso-639-2:sme
5
+ source_script: Latn
6
+ destination_script: Latn
7
+ name: BGN/PCGN Northern Sami (North Lappish) 1984 Roman-Script Spelling Convention Agreement
8
+ url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/693794/ROMAN-SCRIPT_SPELLING_CONVENTIONS.pdf
9
+ creation_date: 1984
10
+
11
+ notes:
12
+ - |
13
+ The special letter Ŋ ŋ, known as eng, [Unicode: 014A, 014B] should be reproduced in that form whenever
14
+ encountered. In those instances when it cannot be reproduced, however, the letter Ń ń [Unicode: 0143, 0144]
15
+ may be substituted for it.
16
+ - |
17
+ In a further note additional to the 1984 agreement, other special letters should be retained as found:
18
+ Á á [Unicode: 00C1, 00E1],
19
+ Č č [Unicode: 010C, 010D],
20
+ Đ đ [Unicode: 0110, 0111],
21
+ Š š [Unicode: 0160, 0161],
22
+ Ŧ ŧ [Unicode: 0166, 0167],
23
+ Ž ž [Unicode: 017D, 017E].
24
+ }
25
+
26
+ tests {
27
+ # https://web.archive.org/web/20120918094122/http://www.uta.fi/~km56049/same/svocab.html
28
+ test "adjágas", "adjágas"
29
+ test "agálaš", "agálaš"
30
+ test "ÁEL", "ÁEL"
31
+ test "hčagastinárpu", "hčagastinárpu"
32
+ test "algŋa", "algńa"
33
+ test "Šveica", "Šveica"
34
+ test "MAŊŊIL", "MAŃŃIL"
35
+ test "giđa", "giđa"
36
+ test "ruoŧŧelaš", "ruoŧŧelaš"
37
+ test "skálžu", "skálžu"
38
+ }
39
+
40
+ stage {
41
+
42
+ # CHARACTERS
43
+ parallel {
44
+ sub "Ŋ", "Ń" # Ŋ => Ń
45
+ sub "ŋ", "ń" # ŋ => ń
46
+ }
47
+
48
+ }
@@ -0,0 +1,55 @@
1
+ metadata {
2
+ authority_id: bgnpcgn
3
+ id: 1962
4
+ language: iso-639-2:srp
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: TRANSLITERATION OF SERBIAN CYRILLIC
8
+ creation_date: 1962
9
+ confirmation_date: 1962
10
+ description: |
11
+ Serbo-Croatian, the official national language of Yugoslavia, is a single literary language.
12
+ In Serbian areas it is written in the cyrillic (Serbian) alphabet, while in Croatian areas it is
13
+ written in the roman (Croatian) alphabet.
14
+ Both the BGN and PCGN use the standard Croatian equivalents for romanizing the Serbian cyrillic
15
+ alphabet whenever romanized names are not available.
16
+
17
+ notes:
18
+ - The digraph dj(Dj) will occasionally be found as the Croatian equivalent of ђ(Ђ),
19
+ but the use of dj should be limited to those instances where it is found in roman sources.
20
+ }
21
+
22
+ tests {
23
+ test "Шупља Стена", "Šuplja Stena"
24
+ test "Чукарица", "Čukarica"
25
+ test "Црна Трава", "Crna Trava"
26
+ test "Херцег Нови", "Herceg Novi"
27
+ test "Улцињ", "Ulcinj"
28
+ test "Ужице", "Užice"
29
+ test "Тресаначка Река", "Tresanačka Reka"
30
+ test "Сјеница", "Sjenica"
31
+ test "Рожаје", "Rožaje"
32
+ test "Пљевља", "Pljevlja"
33
+ test "Оџаци", "Odžaci"
34
+ test "Никшић", "Nikšić"
35
+ test "Медвеђа", "Medveđa"
36
+ test "Лозница", "Loznica"
37
+ test "Књажевац", "Knjaževac"
38
+ test "Зрењанин", "Zrenjanin"
39
+ test "Житорађа", "Žitorađa"
40
+ test "Ервеник", "Ervenik"
41
+ test "Доње Љупче", "Donje Ljupče"
42
+ test "Гусиње", "Gusinje"
43
+ test "ГУСИЊЕ", "GUSINJE"
44
+ test "Врњачка Бања", "Vrnjačka Banja"
45
+ test "Бијело Поље", "Bijelo Polje"
46
+ test "Алибунар", "Alibunar"
47
+ }
48
+
49
+ dependency "bgnpcgn-srp-Cyrl-Latn-2005", as: cyrllatn
50
+
51
+ stage {
52
+
53
+ run map.cyrllatn.stage.main
54
+
55
+ }
@@ -0,0 +1,146 @@
1
+ metadata {
2
+ authority_id: bgnpcgn
3
+ id: 2005
4
+ language: iso-639-2:srp
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: ROMANIZATION OF SERBIAN, BGN/PCGN 2005 System
8
+ url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/816783/TABLE_OF_CORRESPONDENCES_FOR_SERBIAN.pdf
9
+ creation_date: 2005
10
+ confirmation_date: 2019-06
11
+ description: |
12
+ The tabulation below reflects the Serbian Cyrillic alphabet and the standard Roman script equivalents
13
+ used in both Serbia and Montenegro.
14
+
15
+ notes:
16
+ - The Serbian Cyrillic lowercase italic Д may sometimes be seen as g.
17
+ There is no specific Unicode encoding for this variant form so a comparable character
18
+ has been used here for illustrative purposes.
19
+
20
+ - The digraph dj(Dj) will occasionally be found as an alternative form of đ(Đ).
21
+
22
+ - The Serbian Cyrillic lowercase italic П may sometimes be seen as ӣ.
23
+ There is no specific Unicode encoding for this variant form so a comparable character
24
+ has been used here for illustrative purposes.
25
+
26
+ - The Serbian Cyrillic lowercase italic Т may sometimes be seen as w.
27
+ There is no specific Unicode encoding for this variant form so a comparable character
28
+ has been used here for illustrative purposes.
29
+
30
+ - |
31
+ An inventory of letter-diacritic combinations, with their Unicode encoding,
32
+ in addition to the unmodified letters of the basic Roman script is:
33
+ | Đ (U+0110) | đ (U+0111) |
34
+ | Ž (U+017D) | ž (U+017E) |
35
+ | Lj (U+01C8)* | lj (U+01C9)* |
36
+ | Ć (U+0106) | ć (U+0107) |
37
+ | Dž (U+01C5)* | dž (U+01C6)* |
38
+ | Š (U+0160) | š (U+0161) |
39
+ * Note that these characters can also be reproduced with individual letters (e.g. l+j).
40
+
41
+ - The Roman-script columns show only lowercase forms but, when applying the table,
42
+ uppercase and lowercase Roman letters as appropriate should be used.
43
+ }
44
+
45
+ tests {
46
+ test "Шупља Стена", "Šuplja Stena"
47
+ test "Чукарица", "Čukarica"
48
+ test "Црна Трава", "Crna Trava"
49
+ test "Херцег Нови", "Herceg Novi"
50
+ test "Улцињ", "Ulcinj"
51
+ test "Ужице", "Užice"
52
+ test "Тресаначка Река", "Tresanačka Reka"
53
+ test "Сјеница", "Sjenica"
54
+ test "Рожаје", "Rožaje"
55
+ test "Пљевља", "Pljevlja"
56
+ test "Оџаци", "Odžaci"
57
+ test "Никшић", "Nikšić"
58
+ test "Медвеђа", "Medveđa"
59
+ test "Лозница", "Loznica"
60
+ test "Књажевац", "Knjaževac"
61
+ test "Зрењанин", "Zrenjanin"
62
+ test "Житорађа", "Žitorađa"
63
+ test "Ервеник", "Ervenik"
64
+ test "Доње Љупче", "Donje Ljupče"
65
+ test "Гусиње", "Gusinje"
66
+ test "ГУСИЊЕ", "GUSINJE"
67
+ test "Врњачка Бања", "Vrnjačka Banja"
68
+ test "Бијело Поље", "Bijelo Polje"
69
+ test "Алибунар", "Alibunar"
70
+ }
71
+
72
+ aliases {
73
+ def_alias srp_multichar, any(["Lj", "Nj", "Dž"])
74
+ def_alias srp_latupper, any("A".."Z")
75
+ }
76
+
77
+ stage {
78
+ # CHARACTERS
79
+ parallel {
80
+ sub "А", "A"
81
+ sub "Б", "B"
82
+ sub "В", "V"
83
+ sub "Г", "G"
84
+ sub "Д", "D"
85
+ sub "Ђ", "Đ" # Đ
86
+ sub "Е", "E"
87
+ sub "Ж", "Ž" # Ž
88
+ sub "З", "Z"
89
+ sub "И", "I"
90
+ sub "Ј", "J"
91
+ sub "К", "K"
92
+ sub "Л", "L"
93
+ sub "Љ", "Lj"
94
+ sub "М", "M"
95
+ sub "Н", "N"
96
+ sub "Њ", "Nj"
97
+ sub "О", "O"
98
+ sub "П", "P"
99
+ sub "Р", "R"
100
+ sub "С", "S"
101
+ sub "Т", "T"
102
+ sub "Ћ", "Ć" # Ć
103
+ sub "У", "U"
104
+ sub "Ф", "F"
105
+ sub "Х", "H"
106
+ sub "Ц", "C"
107
+ sub "Ч", "Č" # Č
108
+ sub "Џ", "Dž" # Dž
109
+ sub "Ш", "Š" # Š
110
+ sub "а", "a"
111
+ sub "б", "b"
112
+ sub "в", "v"
113
+ sub "г", "g"
114
+ sub "д", "d"
115
+ sub "ђ", "đ" # đ
116
+ sub "е", "e"
117
+ sub "ж", "ž" # ž
118
+ sub "з", "z"
119
+ sub "и", "i"
120
+ sub "ј", "j"
121
+ sub "к", "k"
122
+ sub "л", "l"
123
+ sub "љ", "lj"
124
+ sub "м", "m"
125
+ sub "н", "n"
126
+ sub "њ", "nj"
127
+ sub "о", "o"
128
+ sub "п", "p"
129
+ sub "р", "r"
130
+ sub "с", "s"
131
+ sub "т", "t"
132
+ sub "ћ", "ć" # ć́
133
+ sub "у", "u"
134
+ sub "ф", "f"
135
+ sub "х", "h"
136
+ sub "ц", "c"
137
+ sub "ч", "č" # č
138
+ sub "џ", "dž" # dž
139
+ sub "ш", "š" # š
140
+ }
141
+
142
+ # POSTRULES
143
+ sub srp_multichar, upcase, before: srp_latupper
144
+ sub srp_multichar, upcase, after: srp_latupper
145
+ compose
146
+ }
@@ -0,0 +1,185 @@
1
+ metadata {
2
+ authority_id: bgnpcgn
3
+ id: 2007
4
+ language: iso-639-2:tat
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: TATAR TABLE OF CORRESPONDENCES CYRILLIC - ROMAN BGN/PCGN 2007 Agreement
8
+ url: https://geonames.nga.mil/gns/html/Romanization/TABLE%20OF%20CORRESPONDENCES%20FOR%20TATAR.pdf
9
+ creation_date: 2007
10
+ confirmation_date: 2017-11
11
+ description: |
12
+ Tatar is an official language within Respublika Tatarstan, one of the republics of the Russian
13
+ Federation. It will normally be encountered in Cyrillic script, in which case it should be romanized by means
14
+ of the Cyrillic-Roman table of correspondences given below.
15
+
16
+ notes:
17
+ - |
18
+ The alphabet portrayed in the above table is referred to as yaꞑalif-2.
19
+ A set of simpler characters is also encountered; this is known as zamanalif.
20
+ In this latter set, the alternative characters ä, ñ and ö are used for letters
21
+ 2, 17 and 19 respectively where the user has difficulty reproducing ə, ꞑ, and ө.
22
+ Please note that all three alternatives must be used as a set, and the letters should not be intermingled.
23
+ - Used only in borrowed words.
24
+ - The first option is used in words with back vowels, the second in words with front vowels (though this does not apply to borrowed words).
25
+ - yı/ye is used after a vowel (except и, ю), ъ and ь, also word-initially.
26
+ - w is used after a vowel.
27
+ - After ğ or q, ый is represented i
28
+ - Э is represented ’ after a vowel in words of Arabic origin.
29
+ - Ю and Я are represented ü and a/ä respectively after и.
30
+ - |
31
+ An inventory of letter-diacritic combinations, with their Unicode encoding, in addition to the unmodified letters
32
+ of the basic Roman script is:
33
+ Ə (U+018F) ə (U+0259)
34
+ Ğ (U+011E) ğ (U+011F)
35
+ İ (U+0130) ı (U+0131)
36
+ Ü (U+00DC) ü (U+00FC)
37
+ Ꞑ (U+A790) ꞑ (U+A791)
38
+ Ɵ (U+019F) ɵ (U+0275)
39
+ Ç (U+00C7) ç (U+00E7)
40
+ Ş (U+015E) ş (U+015F)
41
+ Ä (U+00C4) ä (U+00E4)
42
+ ’ (U+2019)
43
+ - |
44
+ The Roman-script columns show only lowercase forms but, when applying the table, uppercase and lowercase
45
+ Roman letters as appropriate should be used.
46
+ }
47
+
48
+ tests {
49
+ test "Гыйльмиев", "Ğil’miew" # note[6]: the source note gives Ğilmiev, which is incorrect according to the rules
50
+ # https://en.wikipedia.org/wiki/Tatar_alphabet
51
+ test "баеды", "bayıdı" # note[4]
52
+ test "кардәш", "qardəş"
53
+ test "калынлык һәм аеру билгесе", "qalınlıq həm ayıru bilgese" # note[4]
54
+ test "Барлык кешеләр дә азат һәм үз абруйлары һәм хокуклары ягыннан тиң булып туалар.\nАларга акыл һәм вөҗдан бирелгән һәм бер-берсенә карата туганнарча мөнасәбәттә булырга тиешләр.", "Barlıq keşelər də azat həm üz abruyları həm xoquqları yağınnan tiꞑ bulıp tualar.\nAlarğa aqıl həm wocdan birelgən həm ber-bersenə qarata tuğannarça monasəbəttə bulırğa tieşlər."
55
+ # https://www.azatliq.org/a/30820571.html
56
+ test "Әлдермештән Әлмәндәр", "Əldermeştən Əlməndər"
57
+ test "Әссәламү галәйкүм", "Əssəlamü ğaləyküm"
58
+ test "Танымаган кешегә", "Tanımağan keşegə" # note[3]
59
+ test "Иң әүвәл кул бирешеп күрешик", "İꞑ əwwəl qul bireşep küreşiq" # note[5]
60
+ test "Ялгышмыйсың", "Yalğışmıysıꞑ"
61
+ test "Нәкъ үзе", "Nəq üze"
62
+ test "Кирәгеннән артыгын", "Kirəgennən artığın" # note[3]
63
+ test "мәңгелеккә килмәгән", "məꞑgeleqkə kilməgən"
64
+ test "кулыңны куй", "qulıꞑnı quy"
65
+ test "Өммия", "Ommiä" # note[8]
66
+ test "Җиһангир", "Cihangir" # note[3]
67
+ }
68
+
69
+ stage {
70
+
71
+ # RULES
72
+ # note[3] http://www.hintfox.com/article/sistema-glasnih-zvykov-na-tatarskom-i-anglijskom-jazikah.html
73
+ # back vowels: у, а, ы, о,
74
+ # front vowels: е, ә, и, ө, ү, э
75
+ sub "Г", "G", after: any("ЕеƏәИиӨөҮүЭэ")
76
+ sub "г", "g", after: any("ЕеƏәИиӨөҮүЭэ")
77
+ sub "К", "K", after: any("ЕеƏәИиӨөҮүЭэ")
78
+ sub "к", "k", after: any("ЕеƏәИиӨөҮүЭэ")
79
+ sub "Ю", "Yü", after: any("ЕеƏәИиӨөҮүЭэ")
80
+ sub "ю", "yü", after: any("ЕеƏәИиӨөҮүЭэ")
81
+ sub "Я", "Yä", after: any("ЕеƏәИиӨөҮүЭэ")
82
+ sub "я", "yä", after: any("ЕеƏәИиӨөҮүЭэ")
83
+
84
+ # note[4]
85
+ sub "\u0415", "Yı", before: any("АаЕеƏәОоӨөҮүУуЫыЭэЯяЪъЬь")
86
+ sub "\u0435", "yı", before: any("АаЕеƏәОоӨөҮүУуЫыЭэЯяЪъЬь")
87
+
88
+ # note[5]
89
+ sub "\u0423", "W", before: any("АаЕеƏәИиОоӨөҮүУуЫыЭэЮюЯяЪъЬь")
90
+ sub "\u0443", "w", before: any("АаЕеƏәИиОоӨөҮүУуЫыЭэЮюЯяЪъЬь")
91
+ sub "\u04AE", "W", before: any("АаЕеƏәИиОоӨөҮүУуЫыЭэЮюЯяЪъЬь")
92
+ sub "\u04AF", "w", before: any("АаЕеƏәИиОоӨөҮүУуЫыЭэЮюЯяЪъЬь")
93
+
94
+ # note[6]
95
+ sub "ый", "i", before: any("Гг")
96
+
97
+ # note[8]
98
+ sub "\u042E", "Ü", before: any("Ии")
99
+ sub "\u044E", "ü", before: any("Ии")
100
+ sub "\u042F", "Ä", before: any("Ии")
101
+ sub "\u044F", "ä", before: any("Ии")
102
+
103
+
104
+ # CHARACTERS
105
+ parallel {
106
+ sub "А", "A" # А
107
+ sub "Ә", any("ƏÄ") # Ә => [Ə, Ä] note[1]
108
+ sub "Б", "B" # Б
109
+ sub "В", any("WV") # В note[2]
110
+ sub "Г", "Ğ" # Г => Ğ note[3]
111
+ sub "Д", "D" # Д
112
+ sub "Е", "E" # Е note[3] note[4]
113
+ sub "Ж", "J" # Ж
114
+ sub "Җ", "C" # Җ
115
+ sub "З", "Z" # З
116
+ sub "И", "İ" # И => İ
117
+ sub "Й", "Y" # Й
118
+ sub "К", "Q" # К note[3]
119
+ sub "Л", "L" # Л
120
+ sub "М", "M" # М
121
+ sub "Н", "N" # Н
122
+ sub "Ң", any("ꞐÑ") # Ң => [Ꞑ, Ñ] note[1]
123
+ sub "О", "O" # О
124
+ sub "Ө", any("OÖ") # Ө => [O, Ö] note[1]
125
+ sub "П", "P" # П
126
+ sub "Р", "R" # Р
127
+ sub "С", "S" # С
128
+ sub "Т", "T" # Т
129
+ sub "У", "U" # У note[5]
130
+ sub "Ү", "Ü" # Ү => Ü note[5]
131
+ sub "Ф", "F" # Ф
132
+ sub "Х", "Х" # Х
133
+ sub "Һ", "H" # Һ
134
+ sub "Ц", "Ts" # Ц
135
+ sub "Ч", "Ç" # Ч => Ç
136
+ sub "Ш", "Ş" # Ш => Ş
137
+ sub "Щ", "ŞÇ" # Щ
138
+ sub "Ъ", "" # Ъ
139
+ sub "Ы", "I" # Ы => I note[2] note[6]
140
+ sub "Ь", "’" # Ь => ’
141
+ sub "Э", "E" # Э note[7]
142
+ sub "Ю", "Yu" # Ю note[3] note[8]
143
+ sub "Я", "Ya" # Я note[3] note[8]
144
+
145
+ sub "\u0430", "a" # а
146
+ sub "\u04D9", any("əä") # ә => [ə, ä] note[1]
147
+ sub "\u0431", "b" # б
148
+ sub "\u0432", any("wv") # в note[2]
149
+ sub "\u0433", "ğ" # г => ğ note[3]
150
+ sub "\u0434", "d" # д
151
+ sub "\u0435", "e" # e note[3] note[4]
152
+ sub "\u0436", "j" # ж
153
+ sub "\u0497", "c" # җ
154
+ sub "\u0437", "z" # з
155
+ sub "\u0438", "i" # и
156
+ sub "\u0439", "y" # й
157
+ sub "\u043A", "q" # к note[3]
158
+ sub "\u043B", "l" # л
159
+ sub "\u043C", "m" # м
160
+ sub "\u043D", "n" # н
161
+ sub "\u04A3", any("ꞑñ") # ң => [ꞑ, ñ] note[1]
162
+ sub "\u043E", "o" # о
163
+ sub "\u04E9", any("oö") # ө => [o, ö] note[1]
164
+ sub "\u043F", "p" # п
165
+ sub "\u0440", "r" # р
166
+ sub "\u0441", "s" # с
167
+ sub "\u0442", "t" # т
168
+ sub "\u0443", "u" # у note[5]
169
+ sub "\u04AF", "ü" # ү => ü note[5]
170
+ sub "\u0444", "f" # ф
171
+ sub "\u0445", "x" # х
172
+ sub "\u04BB", "h" # һ
173
+ sub "\u0446", "ts" # ц
174
+ sub "\u0447", "ç" # ч => ç
175
+ sub "\u0448", "ş" # ш => ş
176
+ sub "\u0449", "şç" # щ => şç
177
+ sub "ъ", "" # ъ
178
+ sub "\u044B", "ı" # ы => ı note[2] note[6]
179
+ sub "ь", "’" # ь => ’
180
+ sub "\u044D", "e" # э note[7]
181
+ sub "\u044E", "yu" # ю note[3] note[8]
182
+ sub "\u044F", "ya" # я note[3] note[8]
183
+ }
184
+
185
+ }
@@ -0,0 +1,188 @@
1
+ metadata {
2
+ authority_id: bgnpcgn
3
+ id: 1994
4
+ language: iso-639-2:tgk
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: BGN/PCGN Romanization System -- Tajik (1994)
8
+ url: https://geonames.nga.mil/gns/html/Romanization/ROMANIZATION%20OF%20TAJIK.pdf
9
+ creation_date: 1994
10
+ confirmation_date: 2017-11
11
+ description: |
12
+ The BGN/PCGN system for Tajik was designed for use in romanizing names written in the Tajik Cyrillic alphabet.
13
+ The Tajik Cyrillic alphabet contains six characters not present in the Russian alphabet: ғ, ӣ, қ, ӯ, ҳ and ҷ. An
14
+ orthographic reform of the Tajik Cyrillic alphabet was implemented under the auspices of the Academy of Sciences of
15
+ Tajikistan. This reform was promulgated in a decree of 3 September 1998 by the government of the Republic of
16
+ Tajikistan. The reform abolished the characters ц, щ, ь and ы (see notes 2 through 5).
17
+
18
+ notes:
19
+ - |
20
+ The character sequences гҳ, зҳ, кҳ, and сҳ may be romanized g·h, z·h, k·h, and s·h in order
21
+ to differentiate those romanizations from the digraphs gh, zh, kh, and sh which are used to
22
+ render the characters ғ, ж, х, and ш.
23
+ - |
24
+ The obsolete character ц, abolished in 1998, should be romanized s (before a vowel and/or
25
+ after a consonant within a word) or ts intervocalically.
26
+ - The obsolete character щ, replaced by ш in 1998, should be romanized sh.
27
+ - The obsolete character ь, abolished in 1998, should not be romanized.
28
+ - The obsolete character ы, replaced by и in 1998, should be romanized i.
29
+ - Unicode values are shown with the uppercase Cyrillic character first, followed by the lowercase character.
30
+ - |
31
+ An inventory of letter-diacritic combinations, with their Unicode encoding, in addition to the
32
+ unmodified letters of the basic Roman script is:
33
+ All apostrophes appearing in romanization are U+2019
34
+ Í (U+00CD) í (U+00ED)
35
+ Ŭ (U+016C) ŭ (U+016D)
36
+ Ė (U+0116) ė (U+0117)
37
+ - |
38
+ The Romanization column shows only lowercase forms but, when romanizing, uppercase and
39
+ lowercase Roman letters as appropriate should be used.
40
+ }
41
+
42
+ tests {
43
+ # https://ru.wikipedia.org/wiki/Таджикская_письменность#Образцы_записи
44
+ test "Тамоми одамон озод ба дунё меоянд ва аз лиҳози манзилату ҳуқуқ бо ҳам баробаранд.\nҲама соҳиби ақлу виҷдонанд, бояд нисбат ба якдигар бародарвор муносабат намоянд.", "Tamomi odamon ozod ba dunyo meoyand va az lihozi manzilatu huquq bo ham barobarand.\nHama sohibi aqlu vijdonand, boyad nisbat ba yakdigar barodarvor munosabat namoyand."
45
+ test "Баниодам аъзои як пайкаранд, ки дар офариниш зи як гавҳаранд. Чу узве ба дард оварад рӯзгор, дигар узвҳоро намонад қарор.", "Baniodam a’zoi yak paykarand, ki dar ofarinish zi yak gavharand. Chu uzve ba dard ovarad rŭzgor, digar uzvhoro namonad qaror."
46
+ test "Саъдӣ", "Sa’dí"
47
+ test "Мурда будам, зинда шудам; гиря будам, ханда шудам. Давлати ишқ омаду ман давлати поянда шудам.", "Murda budam, zinda shudam; girya budam, khanda shudam. Davlati ishq omadu man davlati poyanda shudam."
48
+ test "Мавлавӣ", "Mavlaví"
49
+ test "санг", "sang"
50
+ test "барг", "barg"
51
+ test "номвар", "nomvar"
52
+ test "Бағдод", "Baghdod"
53
+ test "ғор", "ghor"
54
+ test "модар", "modar"
55
+ test "меравам", "meravam"
56
+ test "дарё", "daryo"
57
+ test "осиёб", "osiyob"
58
+ test "жола", "zhola"
59
+ test "каждум", "kazhdum"
60
+ test "баъз", "ba’z"
61
+ test "назар", "nazar"
62
+ test "заҳоб", "zahob"
63
+ test "ихтиёр", "ikhtiyor"
64
+ test "зебоӣ", "zeboí"
65
+ test "май", "may"
66
+ test "кадом", "kadom"
67
+ test "қадам", "qadam"
68
+ test "лола", "lola"
69
+ test "мурдагӣ", "murdagí"
70
+ test "нон", "non"
71
+ test "орзу", "orzu"
72
+ test "панҷ", "panj"
73
+ test "ранг", "rang"
74
+ test "сар", "sar"
75
+ test "субҳ", "subh"
76
+ test "сурайё", "surayyo"
77
+ test "тоҷик", "tojik"
78
+ test "талаб", "talab"
79
+ test "дуд", "dud"
80
+ test "хӯрдан", "khŭrdan"
81
+ test "фурӯғ", "furŭgh"
82
+ test "хондан", "khondan"
83
+ test "ҳофиз", "hofiz"
84
+ test "чӣ", "chí"
85
+ test "ҷанг", "jang"
86
+ test "шаб", "shab"
87
+ test "таъриф", "ta’rif"
88
+ test "эй", "ėy"
89
+ test "июн", "iyun"
90
+ test "ягонагӣ", "yagonagí"
91
+ test "РАМЗҲО", "RAMZ·HO"
92
+ }
93
+
94
+ stage {
95
+
96
+ # RULES (context-sensitive substitutions applied before the one-to-one CHARACTERS table)
97
+ # note[1]: ҳ preceded by г, з, к or с is written ·h so it is not read as the digraphs gh, zh, kh, sh
98
+ sub "\u04B3", "·h", before: any("ГгЗзКкСс")
99
+ sub "\u04B2", "·H", before: any("ГгЗзКкСс")
100
+ # note[2]: obsolete ц is s before a vowel, but stays ts (CHARACTERS table) when it is between two vowels
101
+ sub "\u0426", "S", not_before: any("АаЕеЁёИиОоУуЫыЭэЮюЯя"), after: any("АаЕеЁёИиОоУуЫыЭэЮюЯя")
102
+ sub "\u0446", "s", not_before: any("АаЕеЁёИиОоУуЫыЭэЮюЯя"), after: any("АаЕеЁёИиОоУуЫыЭэЮюЯя")
103
+
104
+
105
+ # CHARACTERS
106
+ parallel {
107
+ sub "А", "A" # А
108
+ sub "Б", "B" # Б
109
+ sub "В", "V" # В
110
+ sub "Г", "G" # Г
111
+ sub "Ғ", "Gh" # Ғ
112
+ sub "Д", "D" # Д
113
+ sub "Е", "E" # Е
114
+ sub "Ё", "Yo" # Ё
115
+ sub "Ж", "Zh" # Ж
116
+ sub "З", "Z" # З
117
+ sub "И", "I" # И
118
+ sub "Ӣ", "Í" # Ӣ => Í
119
+ sub "Й", "Y" # Й
120
+ sub "К", "K" # К
121
+ sub "Қ", "Q" # Қ
122
+ sub "Л", "L" # Л
123
+ sub "М", "M" # М
124
+ sub "Н", "N" # Н
125
+ sub "О", "O" # О
126
+ sub "П", "P" # П
127
+ sub "Р", "R" # Р
128
+ sub "С", "S" # С
129
+ sub "Т", "T" # Т
130
+ sub "У", "U" # У
131
+ sub "Ӯ", "Ŭ" # Ӯ => Ŭ
132
+ sub "Ф", "F" # Ф
133
+ sub "Х", "Kh" # Х
134
+ sub "Ҳ", "H" # Ҳ
135
+ sub "Ч", "Ch" # Ч
136
+ sub "Ҷ", "J" # Ҷ
137
+ sub "Ц", "Ts" # Ц note[2]
138
+ sub "Ш", "Sh" # Ш
139
+ sub "Щ", "Sh" # Щ note[3]
140
+ sub "Ъ", "’" # Ъ
141
+ sub "Ы", "I" # Ы note[5]
142
+ sub "Ь", "" # Ь note[4]
143
+ sub "Э", "Ė" # Э => Ė
144
+ sub "Ю", "Yu" # Ю
145
+ sub "Я", "Ya" # Я
146
+
147
+ sub "а", "a" # а
148
+ sub "б", "b" # б
149
+ sub "в", "v" # в
150
+ sub "г", "g" # г
151
+ sub "ғ", "gh" # ғ
152
+ sub "д", "d" # д
153
+ sub "е", "e" # e
154
+ sub "ё", "yo" # ё
155
+ sub "ж", "zh" # ж
156
+ sub "з", "z" # з
157
+ sub "и", "i" # и
158
+ sub "ӣ", "í" # ӣ => í
159
+ sub "й", "y" # й
160
+ sub "к", "k" # к
161
+ sub "қ", "q" # қ
162
+ sub "л", "l" # л
163
+ sub "м", "m" # м
164
+ sub "н", "n" # н
165
+ sub "о", "o" # о
166
+ sub "п", "p" # п
167
+ sub "р", "r" # р
168
+ sub "с", "s" # с
169
+ sub "т", "t" # т
170
+ sub "у", "u" # у
171
+ sub "ӯ", "ŭ" # ӯ => ŭ
172
+ sub "ф", "f" # ф
173
+ sub "х", "kh" # х
174
+ sub "ҳ", "h" # ҳ
175
+ sub "ч", "ch" # ч
176
+ sub "ҷ", "j" # ҷ
177
+ sub "ц", "ts" # ц note[2]
178
+ sub "ш", "sh" # ш
179
+ sub "щ", "sh" # щ note[3]
180
+ sub "ъ", "’" # ъ
181
+ sub "ы", "i" # ы note[5]
182
+ sub "ь", "" # ь note[4]
183
+ sub "э", "ė" # э => ė
184
+ sub "ю", "yu" # ю
185
+ sub "я", "ya" # я
186
+ }
187
+
188
+ }