interscript-maps 2.0.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (291) hide show
  1. checksums.yaml +7 -0
  2. data/README.adoc +28 -0
  3. data/interscript-maps.gemspec +28 -0
  4. data/interscript-maps.yaml +235 -0
  5. data/libs/posix.iml +11 -0
  6. data/libs/unicode.iml +13 -0
  7. data/libs/var-Cyrl.iml +7 -0
  8. data/libs/var-kor.iml +17 -0
  9. data/maps-staging/royin-tha-Thai-Latn-1939-generic.imp +98 -0
  10. data/maps-staging/royin-tha-Thai-Latn-1968.imp +156 -0
  11. data/maps-staging/royin-tha-Thai-Latn-1999-chained.imp +161 -0
  12. data/maps-staging/royin-tha-Thai-Latn-1999.imp +78 -0
  13. data/maps-staging/var-tha-Thai-Thai-phonemic.imp +53 -0
  14. data/maps-staging/var-tha-Thai-Zsym-ipa.imp +273 -0
  15. data/maps/acadsin-zho-Hani-Latn-2002.imp +27515 -0
  16. data/maps/alalc-amh-Ethi-Latn-1997.imp +392 -0
  17. data/maps/alalc-amh-Ethi-Latn-2011.imp +85 -0
  18. data/maps/alalc-ara-Arab-Latn-1997.imp +1171 -0
  19. data/maps/alalc-asm-Deva-Latn-1997.imp +214 -0
  20. data/maps/alalc-asm-Deva-Latn-2012.imp +53 -0
  21. data/maps/alalc-aze-Arab-Latn-1997.imp +321 -0
  22. data/maps/alalc-aze-Cyrl-Latn-1997.imp +101 -0
  23. data/maps/alalc-bel-Cyrl-Latn-1997.imp +118 -0
  24. data/maps/alalc-ben-Beng-Latn-1997.imp +225 -0
  25. data/maps/alalc-ben-Beng-Latn-2017.imp +135 -0
  26. data/maps/alalc-bul-Cyrl-Latn-1997.imp +110 -0
  27. data/maps/alalc-div-Thaa-Latn-1997.imp +171 -0
  28. data/maps/alalc-ell-Grek-Latn-1997.imp +381 -0
  29. data/maps/alalc-ell-Grek-Latn-2010.imp +382 -0
  30. data/maps/alalc-guj-Gujr-Latn-1997.imp +223 -0
  31. data/maps/alalc-guj-Gujr-Latn-2011.imp +57 -0
  32. data/maps/alalc-hin-Deva-Latn-1997.imp +248 -0
  33. data/maps/alalc-hin-Deva-Latn-2011.imp +63 -0
  34. data/maps/alalc-kan-Kana-Latn-1997.imp +233 -0
  35. data/maps/alalc-kan-Kana-Latn-2011.imp +58 -0
  36. data/maps/alalc-kat-Geok-Latn-1997.imp +109 -0
  37. data/maps/alalc-kat-Geor-Latn-1997.imp +104 -0
  38. data/maps/alalc-kor-Hang-Latn-1997.imp +68 -0
  39. data/maps/alalc-mal-Mlym-Latn-1997.imp +260 -0
  40. data/maps/alalc-mal-Mlym-Latn-2012.imp +65 -0
  41. data/maps/alalc-mar-Deva-Latn-1997.imp +178 -0
  42. data/maps/alalc-mar-Deva-Latn-2011.imp +51 -0
  43. data/maps/alalc-mkd-Cyrl-Latn-1997.imp +125 -0
  44. data/maps/alalc-mkd-Cyrl-Latn-2013.imp +113 -0
  45. data/maps/alalc-mon-Cyrl-Latn-1997.imp +161 -0
  46. data/maps/alalc-ori-Orya-Latn-1997.imp +234 -0
  47. data/maps/alalc-ori-Orya-Latn-2011.imp +59 -0
  48. data/maps/alalc-pan-Guru-Latn-1997.imp +241 -0
  49. data/maps/alalc-pan-Guru-Latn-2011.imp +71 -0
  50. data/maps/alalc-per-Arab-Latn-1997.imp +318 -0
  51. data/maps/alalc-pli-Deva-Latn-2012.imp +140 -0
  52. data/maps/alalc-pra-Deva-Latn-2012.imp +52 -0
  53. data/maps/alalc-rus-Cyrl-Latn-1997.imp +165 -0
  54. data/maps/alalc-rus-Cyrl-Latn-2012.imp +107 -0
  55. data/maps/alalc-san-Deva-Latn-2012.imp +207 -0
  56. data/maps/alalc-sin-Sinh-Latn-1997.imp +246 -0
  57. data/maps/alalc-sin-Sinh-Latn-2011.imp +63 -0
  58. data/maps/alalc-srp-Cyrl-Latn-1997.imp +124 -0
  59. data/maps/alalc-srp-Cyrl-Latn-2013.imp +115 -0
  60. data/maps/alalc-tam-Taml-Latn-1997.imp +52 -0
  61. data/maps/alalc-tam-Taml-Latn-2011.imp +49 -0
  62. data/maps/alalc-tel-Telu-Latn-1997.imp +237 -0
  63. data/maps/alalc-tel-Telu-Latn-2011.imp +58 -0
  64. data/maps/alalc-ukr-Cyrl-Latn-1997.imp +123 -0
  65. data/maps/alalc-ukr-Cyrl-Latn-2011.imp +32 -0
  66. data/maps/apcbg-bul-Cyrl-Latn-1995.imp +194 -0
  67. data/maps/az-aze-Cyrl-Latn-1939.imp +105 -0
  68. data/maps/az-aze-Cyrl-Latn-1958.imp +50 -0
  69. data/maps/bas-rus-Cyrl-Latn-2017-bss.imp +160 -0
  70. data/maps/bas-rus-Cyrl-Latn-2017-oss.imp +165 -0
  71. data/maps/bgn-jpn-Hrkt-Latn-1962.imp +288 -0
  72. data/maps/bgn-kor-Hang-Latn-1943.imp +31 -0
  73. data/maps/bgn-kor-Kore-Latn-1943.imp +33 -0
  74. data/maps/bgna-bul-Cyrl-Latn-2006.imp +119 -0
  75. data/maps/bgna-bul-Cyrl-Latn-2009.imp +119 -0
  76. data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +393 -0
  77. data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +472 -0
  78. data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +125 -0
  79. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +111 -0
  80. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.imp +169 -0
  81. data/maps/bgnpcgn-bal-Arab-Latn-2008.imp +296 -0
  82. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.imp +200 -0
  83. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +137 -0
  84. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +38 -0
  85. data/maps/bgnpcgn-che-Cyrl-Latn-2008.imp +176 -0
  86. data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +56 -0
  87. data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +90 -0
  88. data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +71 -0
  89. data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +443 -0
  90. data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +269 -0
  91. data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +41 -0
  92. data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +28 -0
  93. data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +111 -0
  94. data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +42 -0
  95. data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +32 -0
  96. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +191 -0
  97. data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +116 -0
  98. data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +43 -0
  99. data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +193 -0
  100. data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +170 -0
  101. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +177 -0
  102. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +40 -0
  103. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +41 -0
  104. data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +240 -0
  105. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +132 -0
  106. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +174 -0
  107. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +168 -0
  108. data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +208 -0
  109. data/maps/bgnpcgn-per-Arab-Latn-1958.imp +312 -0
  110. data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +552 -0
  111. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +445 -0
  112. data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +289 -0
  113. data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +165 -0
  114. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +133 -0
  115. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +195 -0
  116. data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +48 -0
  117. data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +55 -0
  118. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +146 -0
  119. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +185 -0
  120. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +188 -0
  121. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +136 -0
  122. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +88 -0
  123. data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +333 -0
  124. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +145 -0
  125. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +74 -0
  126. data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +7463 -0
  127. data/maps/bis-asm-Beng-Latn-13194-1991.imp +154 -0
  128. data/maps/bis-ben-Beng-Latn-13194-1991.imp +151 -0
  129. data/maps/bis-dev-Deva-Latn-13194-1991.imp +178 -0
  130. data/maps/bis-guj-Gujr-Latn-13194-1991.imp +172 -0
  131. data/maps/bis-kan-Kana-Latn-13194-1991.imp +166 -0
  132. data/maps/bis-mlm-Mlym-Latn-13194-1991.imp +170 -0
  133. data/maps/bis-ori-Orya-Latn-13194-1991.imp +168 -0
  134. data/maps/bis-pnj-Guru-Latn-13194-1991.imp +169 -0
  135. data/maps/bis-tel-Telu-Latn-13194-1991.imp +165 -0
  136. data/maps/bis-tml-Taml-Latn-13194-1991.imp +149 -0
  137. data/maps/by-bel-Cyrl-Latn-1998.imp +123 -0
  138. data/maps/by-bel-Cyrl-Latn-2007.imp +77 -0
  139. data/maps/din-grc-Grek-Latn-31634-2011-t1.imp +627 -0
  140. data/maps/din-hin-Deva-Latn-33904-2018.imp +101 -0
  141. data/maps/din-kat-Geor-Latn-32707-2010.imp +103 -0
  142. data/maps/din-mar-Deva-Latn-33904-2018.imp +83 -0
  143. data/maps/din-nep-Deva-Latn-33904-2018.imp +110 -0
  144. data/maps/din-pli-Deva-Latn-33904-2018.imp +72 -0
  145. data/maps/din-pra-Deva-Latn-33904-2018.imp +66 -0
  146. data/maps/din-san-Deva-Latn-33904-2018.imp +294 -0
  147. data/maps/din-tam-Taml-Latn-33903-2016.imp +187 -0
  148. data/maps/dos-nep-Deva-Latn-1997.imp +47 -0
  149. data/maps/elot-ell-Grek-Latn-743-1982-tl.imp +399 -0
  150. data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +397 -0
  151. data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +34 -0
  152. data/maps/elot-ell-Grek-Latn-743-2001-ts.imp +178 -0
  153. data/maps/ggg-kat-Geor-Latn-2002.imp +75 -0
  154. data/maps/gki-bel-Cyrl-Latn-1992.imp +44 -0
  155. data/maps/gki-bel-Cyrl-Latn-2000.imp +159 -0
  156. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +179 -0
  157. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.imp +132 -0
  158. data/maps/hk-yue-Hani-Latn-1888.imp +29201 -0
  159. data/maps/icao-bel-Cyrl-Latn-9303.imp +136 -0
  160. data/maps/icao-bul-Cyrl-Latn-9303.imp +127 -0
  161. data/maps/icao-fas-Arab-Latn-9303.imp +112 -0
  162. data/maps/icao-heb-Hebr-Latn-9303.imp +160 -0
  163. data/maps/icao-mkd-Cyrl-Latn-9303.imp +126 -0
  164. data/maps/icao-rus-Cyrl-Latn-9303.imp +126 -0
  165. data/maps/icao-srp-Cyrl-Latn-9303.imp +126 -0
  166. data/maps/icao-ukr-Cyrl-Latn-9303.imp +127 -0
  167. data/maps/iso-ara-Arab-Latn-233-1984.imp +301 -0
  168. data/maps/iso-asm-Beng-Latn-15919-2001.imp +73 -0
  169. data/maps/iso-ben-Beng-Latn-15919-2001.imp +171 -0
  170. data/maps/iso-ell-Grek-Latn-843-1997-t1.imp +365 -0
  171. data/maps/iso-ell-Grek-Latn-843-1997-t2.imp +43 -0
  172. data/maps/iso-guj-Gujr-Latn-15919-2001.imp +214 -0
  173. data/maps/iso-hin-Deva-Latn-15919-2001.imp +73 -0
  174. data/maps/iso-inc-Deva-Latn-15919-2001.imp +61 -0
  175. data/maps/iso-jpn-Hrkt-Latn-3602-1989.imp +59 -0
  176. data/maps/iso-kan-Kana-Latn-15919-2001.imp +212 -0
  177. data/maps/iso-kat-Geor-Latn-9984-1996.imp +103 -0
  178. data/maps/iso-kor-Hang-Latn-1996-method1.imp +140 -0
  179. data/maps/iso-kor-Hang-Latn-1996-method2.imp +132 -0
  180. data/maps/iso-mal-Mlym-Latn-15919-2001.imp +276 -0
  181. data/maps/iso-mar-Deva-Latn-15919-2001.imp +68 -0
  182. data/maps/iso-nep-Deva-Latn-15919-2001.imp +75 -0
  183. data/maps/iso-ori-Orya-Latn-15919-2001.imp +188 -0
  184. data/maps/iso-pan-Guru-Latn-15919-2001.imp +217 -0
  185. data/maps/iso-pli-Beng-Latn-15919-2001.imp +66 -0
  186. data/maps/iso-pli-Deva-Latn-15919-2001.imp +68 -0
  187. data/maps/iso-pli-Sinh-Latn-15919-2001.imp +211 -0
  188. data/maps/iso-pli-Thai-Latn-15919-2001.imp +47 -0
  189. data/maps/iso-pra-Deva-Latn-15919-2001.imp +60 -0
  190. data/maps/iso-prs-Arab-Latn-233-3-1999.imp +352 -0
  191. data/maps/iso-rus-Cyrl-Latn-9-1995.imp +279 -0
  192. data/maps/iso-san-Deva-Latn-15919-2001.imp +215 -0
  193. data/maps/iso-tam-Taml-Latn-15919-2001.imp +153 -0
  194. data/maps/iso-tel-Telu-Latn-15919-2001.imp +214 -0
  195. data/maps/iso-tha-Thai-Latn-11940-1998.imp +114 -0
  196. data/maps/kp-kor-Hang-Latn-2002.imp +540 -0
  197. data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +29005 -0
  198. data/maps/masm-mon-Cyrl-Latn-5217-2012.imp +136 -0
  199. data/maps/masm-mon-Latn-Cyrl-5217-2012.imp +162 -0
  200. data/maps/mext-jpn-Hrkt-Latn-1954.imp +403 -0
  201. data/maps/moct-kor-Hang-Latn-2000.imp +475 -0
  202. data/maps/mofa-jpn-Hrkt-Latn-1989.imp +484 -0
  203. data/maps/mv-div-Thaa-Latn-1987.imp +144 -0
  204. data/maps/mvd-bel-Cyrl-Latn-2008.imp +224 -0
  205. data/maps/mvd-bel-Cyrl-Latn-2010.imp +64 -0
  206. data/maps/mvd-rus-Cyrl-Latn-2008.imp +110 -0
  207. data/maps/mvd-rus-Cyrl-Latn-2010.imp +40 -0
  208. data/maps/odni-ara-Arab-Latn-2004.imp +106 -0
  209. data/maps/odni-ara-Arab-Latn-2015.imp +281 -0
  210. data/maps/odni-aze-Cyrl-Latn-2015.imp +158 -0
  211. data/maps/odni-bel-Cyrl-Latn-2015.imp +138 -0
  212. data/maps/odni-bul-Cyrl-Latn-2005.imp +90 -0
  213. data/maps/odni-bul-Cyrl-Latn-2015.imp +103 -0
  214. data/maps/odni-che-Cyrl-Latn-2015.imp +165 -0
  215. data/maps/odni-fas-Arab-Latn-2004.imp +268 -0
  216. data/maps/odni-fas-Arab-Latn-2015.imp +398 -0
  217. data/maps/odni-hin-Deva-Latn-2004.imp +180 -0
  218. data/maps/odni-hin-Deva-Latn-2015.imp +256 -0
  219. data/maps/odni-kat-Geor-Latn-2015.imp +76 -0
  220. data/maps/odni-kaz-Cyrl-Latn-2015.imp +164 -0
  221. data/maps/odni-kir-Cyrl-Latn-2015.imp +149 -0
  222. data/maps/odni-kor-Hang-Latn-2015.imp +307 -0
  223. data/maps/odni-mkd-Cyrl-Latn-2005.imp +28 -0
  224. data/maps/odni-mkd-Cyrl-Latn-2015.imp +124 -0
  225. data/maps/odni-prs-Arab-Latn-2004.imp +120 -0
  226. data/maps/odni-prs-Arab-Latn-2015.imp +225 -0
  227. data/maps/odni-pus-Arab-Latn-2011.imp +327 -0
  228. data/maps/odni-rus-Cyrl-Latn-2015.imp +79 -0
  229. data/maps/odni-srp-Cyrl-Latn-2005.imp +35 -0
  230. data/maps/odni-srp-Cyrl-Latn-2015.imp +130 -0
  231. data/maps/odni-tat-Cyrl-Latn-2015.imp +157 -0
  232. data/maps/odni-tgk-Cyrl-Latn-2015.imp +161 -0
  233. data/maps/odni-tuk-Cyrl-Latn-2015.imp +159 -0
  234. data/maps/odni-uig-Cyrl-Latn-2015.imp +151 -0
  235. data/maps/odni-ukr-Cyrl-Latn-2015.imp +136 -0
  236. data/maps/odni-urd-Arab-Latn-2015.imp +220 -0
  237. data/maps/odni-uzb-Cyrl-Latn-2015.imp +165 -0
  238. data/maps/sac-zho-Hans-Latn-1979.imp +20940 -0
  239. data/maps/sasm-mon-Mong-Latn-general-1978.imp +294 -0
  240. data/maps/sasm-mon-Mong-Latn-phonetic-1978.imp +261 -0
  241. data/maps/ses-ara-Arab-Latn-1930.imp +225 -0
  242. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.imp +171 -0
  243. data/maps/ua-ukr-Cyrl-Latn-1996.imp +149 -0
  244. data/maps/ua-ukr-Cyrl-Latn-2007.imp +69 -0
  245. data/maps/ua-ukr-Cyrl-Latn-2010.imp +128 -0
  246. data/maps/un-amh-Ethi-Latn-2016.imp +483 -0
  247. data/maps/un-ara-Arab-Latn-1971.imp +137 -0
  248. data/maps/un-ara-Arab-Latn-1972.imp +155 -0
  249. data/maps/un-ara-Arab-Latn-2017.imp +375 -0
  250. data/maps/un-asm-Beng-Latn-1972.imp +188 -0
  251. data/maps/un-bel-Cyrl-Latn-2007.imp +78 -0
  252. data/maps/un-ben-Beng-Latn-2016.imp +516 -0
  253. data/maps/un-ell-Grek-Latn-1987-phonetic.imp +437 -0
  254. data/maps/un-ell-Grek-Latn-1987-tl.imp +27 -0
  255. data/maps/un-ell-Grek-Latn-1987-ts.imp +269 -0
  256. data/maps/un-guj-Gujr-Latn-1972.imp +196 -0
  257. data/maps/un-hin-Deva-Latn-2016.imp +356 -0
  258. data/maps/un-kan-Kana-Latn-2016.imp +214 -0
  259. data/maps/un-mal-Mlym-Latn-1972.imp +215 -0
  260. data/maps/un-mar-Deva-Latn-2016.imp +96 -0
  261. data/maps/un-mon-Mong-Latn-general-2013.imp +170 -0
  262. data/maps/un-mon-Mong-Latn-phonetic-2013.imp +170 -0
  263. data/maps/un-nep-Deva-Latn-1972.imp +295 -0
  264. data/maps/un-nep-Deva-Latn-2013.imp +62 -0
  265. data/maps/un-ori-Orya-Latn-1972.imp +208 -0
  266. data/maps/un-pan-Guru-Latn-1972.imp +321 -0
  267. data/maps/un-prs-Arab-Latn-1967.imp +214 -0
  268. data/maps/un-rus-Cyrl-Latn-1987.imp +96 -0
  269. data/maps/un-sin-Sinh-Latn-1972.imp +193 -0
  270. data/maps/un-tam-Taml-Latn-1972.imp +173 -0
  271. data/maps/un-tel-Telu-Latn-1972.imp +229 -0
  272. data/maps/un-ukr-Cyrl-Latn-1998.imp +58 -0
  273. data/maps/un-ukr-Cyrl-Latn-2012.imp +95 -0
  274. data/maps/un-urd-Arab-Latn-1972.imp +290 -0
  275. data/maps/var-amh-Ethi-Latn-eae-2003.imp +414 -0
  276. data/maps/var-gez-Ethi-Latn-eae-2003.imp +54 -0
  277. data/maps/var-hin-Deva-Latn-hunterian-1872.imp +212 -0
  278. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.imp +399 -0
  279. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.imp +382 -0
  280. data/maps/var-kor-Hang-Hang-jamo.imp +11196 -0
  281. data/maps/var-kor-Hang-Latn-mr-1939.imp +574 -0
  282. data/maps/var-kor-Kore-Hang-2013.imp +59764 -0
  283. data/maps/var-kor-Kore-Latn-mr-1939.imp +36 -0
  284. data/maps/var-mar-Deva-Latn-hunterian-1872.imp +39 -0
  285. data/maps/var-mon-Mong-Latn-1930.imp +101 -0
  286. data/maps/var-mon-Mong-Latn-lessing.imp +181 -0
  287. data/maps/var-mon-Mong-Latn-vpmc.imp +182 -0
  288. data/maps/var-pra-Deva-Latn-iast-1912.imp +36 -0
  289. data/maps/var-san-Deva-Latn-iast-1912.imp +147 -0
  290. data/maps/var-zho-Hani-Latn-wd-1979.imp +27549 -0
  291. metadata +335 -0
@@ -0,0 +1,151 @@
1
+ metadata {
2
+ authority_id: odni
3
+ id: 2015
4
+ language: iso-639-2:uig
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: Standards for the transliteration of Uyghur personal names in written reports and products
8
+ source: ICS-630-01 Annex U
9
+ creation_date: 2015
10
+ confirmation_date: 2015
11
+ description: |
12
+ This system is the Intelligence Community standard for the transliteration of Uyghur person names
13
+ that will be applied to all final written reports and products for IC consumers. It is not
14
+ intended to eliminate variations of a name that can contribute forensic information. Rather, it is
15
+ to provide an IC standard Romanized (English) transliteration from Uyghur that can then be linked
16
+ to forensic information in ways that will help identify the referent of the name.
17
+
18
+ In cases where an individual’s name has already been transliterated in a variant spelling, the IC
19
+ Standard spelling should appear first, followed by the variant spelling(s) in parentheses at the
20
+ first usage. In addition, if the original Cyrillic-script or Arabic-script spelling is known, that
21
+ spelling should also appear in parentheses following the name, if possible, following best
22
+ practices of the issuing organization and taking into consideration information system capabilities.
23
+ For example: Zordun Sabir (also seen as Zordun Sabeer, Зордун Сабир ,زوردون سابیر). This convention
24
+ is designed to ensure that vital forensic information is not lost.
25
+
26
+ For names of persons who are known to not be part of the Uyghur-speaking community, use the relevant
27
+ IC transliteration standard for names from that language (e.g., Yitzhak). A translator’s note may be
28
+ used to clarify the known origin of the person. Spell names of individuals from languages that are
29
+ written in Roman letters as they are spelled in those languages (e.g., George Clooney, Jorge Garcia,
30
+ Georges Pompidou).
31
+
32
+ In the case of active senior government officials in the on-line CIA World Factbook and the on-line
33
+ directory of Chiefs of State and Cabinet Members of Foreign Governments, the spellings given in
34
+ these on-line reference works should be used in place of the IC Standard. For any individual who has
35
+ at one time been listed in the Factbook or Chiefs of State directory but who no longer appears in
36
+ those resources (i.e. is no longer a government official), the IC Standard spelling should appear
37
+ first, with the spelling, if known, as it previously appeared in those resources listed within
38
+ parentheses at the first usage.
39
+
40
+ The primary goal is to produce a consistent Romanized transcription of names that is specifically
41
+ readable to the English-speaking non-specialist. The system uses the 26 letters of the standard
42
+ (English) Roman alphabet. Some ambiguities in the Romanized form will occur without the use of
43
+ diacritics. However, within the context of a report, where additional information about the
44
+ individual is provided, the referent will be clearly identified. This system will be used in
45
+ conjunction with on-line tools, name dictionaries, and lists containing conventional spellings of
46
+ names of well-known individuals.
47
+
48
+ notes:
49
+ - Transliterate double digraphs as a single digraph, i.e. шш -> sh, not shsh
50
+ - In the Roman, no distinction is made between digraphs such as 'sh' and single contiguous letters,
51
+ (e.g. 's' followed by 'h').
52
+ - The Cyrillic ъ and ь are not transliterated, but instead are left out of the transliteration.
53
+ }
54
+
55
+ tests {
56
+ test "Зордун Сабир", "Zordun Sabir" # the example name quoted in the metadata description
57
+ }
58
+
59
+ stage {
60
+
61
+ # RULES (listed ahead of the character table)
62
+ # note[1]: a doubled digraph-producing letter is reduced to its first occurrence, so шш -> sh, not shsh
63
+ # generated with: "ҒЁҖҢЧШЮЯ".split("").each { |i| puts %{sub capture(any("#{i}#{i.downcase}"))+any("#{i}#{i.downcase}"), ref(1)} }
64
+ sub capture(any("Ғғ"))+any("Ғғ"), ref(1)
65
+ sub capture(any("Ёё"))+any("Ёё"), ref(1)
66
+ sub capture(any("Җҗ"))+any("Җҗ"), ref(1)
67
+ sub capture(any("Ңң"))+any("Ңң"), ref(1)
68
+ sub capture(any("Чч"))+any("Чч"), ref(1)
69
+ sub capture(any("Шш"))+any("Шш"), ref(1)
70
+ sub capture(any("Юю"))+any("Юю"), ref(1)
71
+ sub capture(any("Яя"))+any("Яя"), ref(1)
72
+ # note[3]: hard and soft signs are left out of the output, in upper and lower case alike
73
+ sub any("\u042A\u042C\u044A\u044C"), none # Ъ Ь ъ ь
74
+
75
+
76
+ # CHARACTERS: single-letter table, capitals first, then lowercase
77
+ parallel {
78
+ sub "\u0410", "A" # А
79
+ sub "\u04D8", "E" # Ә
80
+ sub "\u0411", "B" # Б
81
+ sub "\u0412", "W" # В
82
+ sub "\u0413", "G" # Г
83
+ sub "\u0492", "Gh" # Ғ
84
+ sub "\u0414", "D" # Д
85
+ sub "\u0415", "E" # Е
86
+ sub "\u0401", "Yo" # Ё
87
+ sub "\u0416", "J" # Ж — NOTE(review): Ж -> J and Җ -> Zh look swapped versus common Uyghur romanization (җ = j, ж = zh); confirm against Annex U
88
+ sub "\u0496", "Zh" # Җ
89
+ sub "\u0417", "Z" # З
90
+ sub "\u0418", "I" # И
91
+ sub "\u0419", "Y" # Й
92
+ sub "\u041A", "K" # К
93
+ sub "\u049A", "Q" # Қ
94
+ sub "\u041B", "L" # Л
95
+ sub "\u041C", "M" # М
96
+ sub "\u041D", "N" # Н
97
+ sub "\u04A2", "Ng" # Ң
98
+ sub "\u041E", "O" # О
99
+ sub "\u04E8", "O" # Ө
100
+ sub "\u041F", "P" # П
101
+ sub "\u0420", "R" # Р
102
+ sub "\u0421", "S" # С
103
+ sub "\u0422", "T" # Т
104
+ sub "\u0423", "U" # У
105
+ sub "\u04AE", "U" # Ү
106
+ sub "\u0424", "F" # Ф
107
+ sub "\u0425", "X" # Х
108
+ sub "\u04BA", "H" # Һ
109
+ sub "\u0427", "Ch" # Ч
110
+ sub "\u0428", "Sh" # Ш
111
+ sub "\u042E", "Yu" # Ю
112
+ sub "\u042F", "Ya" # Я
113
+
114
+ sub "\u0430", "a" # а
115
+ sub "\u04D9", "e" # ә
116
+ sub "\u0431", "b" # б
117
+ sub "\u0432", "w" # в
118
+ sub "\u0433", "g" # г
119
+ sub "\u0493", "gh" # ғ
120
+ sub "\u0434", "d" # д
121
+ sub "\u0435", "e" # е
122
+ sub "\u0451", "yo" # ё
123
+ sub "\u0436", "j" # ж
124
+ sub "\u0497", "zh" # җ
125
+ sub "\u0437", "z" # з
126
+ sub "\u0438", "i" # и
127
+ sub "\u0439", "y" # й
128
+ sub "\u043A", "k" # к
129
+ sub "\u049B", "q" # қ
130
+ sub "\u043B", "l" # л
131
+ sub "\u043C", "m" # м
132
+ sub "\u043D", "n" # н
133
+ sub "\u04A3", "ng" # ң
134
+ sub "\u043E", "o" # о
135
+ sub "\u04E9", "o" # ө
136
+ sub "\u043F", "p" # п
137
+ sub "\u0440", "r" # р
138
+ sub "\u0441", "s" # с
139
+ sub "\u0442", "t" # т
140
+ sub "\u0443", "u" # у
141
+ sub "\u04AF", "u" # ү
142
+ sub "\u0444", "f" # ф
143
+ sub "\u0445", "x" # х
144
+ sub "\u04BB", "h" # һ
145
+ sub "\u0447", "ch" # ч
146
+ sub "\u0448", "sh" # ш
147
+ sub "\u044E", "yu" # ю
148
+ sub "\u044F", "ya" # я
149
+ }
150
+
151
+ }
@@ -0,0 +1,136 @@
1
+ metadata {
2
+ authority_id: odni
3
+ id: 2015
4
+ language: iso-639-2:ukr
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: Office of the Director Of National Intelligence Ukrainian Personal Names 2015 System, ICS 630-01 Annex M
8
+
9
+ # url:
10
+ source: ICS 630-01, Annex M
11
+ creation_date: 2015
12
+ confirmation_date: 2015
13
+ description: |
14
+ This system is the Intelligence Community (IC) standard for the
15
+ transliteration of Ukrainian names that will be applied to all final
16
+ written reports and products for IC consumers. It is not intended to
17
+ eliminate variations of a name that can contribute forensic
18
+ information. Rather, it is to provide an IC standard Romanized
19
+ (English) transliteration from Ukrainian that can then be linked to
20
+ forensic information in ways that will help identify the referent of
21
+ the name.
22
+ }
23
+
24
+ tests {
25
+ test "Андрій", "Andriy"
26
+ test "Борисенко", "Borysenko"
27
+ test "Володимир", "Volodymyr"
28
+ test "Богдан", "Bohdan"
29
+ test "Згурський", "Zhurskyy" # З + г yields "Zh", the same spelling Ж produces (compare "Жанна")
30
+ test "Дмитро", "Dmytro"
31
+ test "Олег", "Oleh"
32
+ test "Гаєвич", "Hayevych" # є -> ye
33
+ test "Жанна", "Zhanna"
34
+ test "Казимирчук", "Kazymyrchuk"
35
+ test "Михайленко", "Mykhaylenko"
36
+ test "Іващенко", "Ivashchenko" # щ -> shch
37
+ test "Олексій", "Oleksiy"
38
+ test "Коваленко", "Kovalenko"
39
+ test "Леонід", "Leonid"
40
+ test "Маринич", "Marynych"
41
+ test "Наталія", "Nataliya"
42
+ test "Онищенко", "Onyshchenko"
43
+ test "Петро", "Petro"
44
+ test "Рибчинський", "Rybchynskyy" # и and й both map to y, giving "yy"; ь is dropped
45
+ test "Соломія", "Solomiya"
46
+ test "Троць", "Trots" # trailing soft sign ь maps to the empty string
47
+ test "Уляна", "Ulyana"
48
+ test "Філіпчук", "Filipchuk"
49
+ test "Христина", "Khrystyna"
50
+ test "Стеценко", "Stetsenko"
51
+ test "Шевченко", "Shevchenko"
52
+ test "Гаращенко", "Harashchenko"
53
+ test "Юрій", "Yuriy"
54
+ test "Ярошенко", "Yaroshenko"
55
+ test "Костянтин", "Kostyantyn"
56
+ test "Новофедорівка", "Novofedorivka"
57
+ test "Гуляйгородок", "Hulyayhorodok"
58
+ }
59
+
60
+ stage {
61
+
62
+ # RULES (listed ahead of the character table)
63
+ sub boundary+"\u2019"+boundary, none # remove ’ (U+2019) when it has a boundary on each side; NOTE(review): other apostrophe code points (U+0027, U+02BC) are not matched here — confirm intended
64
+
65
+
66
+ # CHARACTERS: single-letter table, capitals first, then lowercase; the soft sign maps to the empty string
67
+ parallel {
68
+ sub "А", "A" # А
69
+ sub "Б", "B" # Б
70
+ sub "В", "V" # В
71
+ sub "Г", "H" # Г
72
+ sub "Ґ", "G" # Ґ
73
+ sub "Д", "D" # Д
74
+ sub "Е", "E" # Е
75
+ sub "Є", "Ye" # Є
76
+ sub "Ж", "Zh" # Ж
77
+ sub "З", "Z" # З
78
+ sub "И", "Y" # И
79
+ sub "І", "I" # І
80
+ sub "Ї", "Yi" # Ї
81
+ sub "Й", "Y" # Й
82
+ sub "К", "K" # К
83
+ sub "Л", "L" # Л
84
+ sub "М", "M" # М
85
+ sub "Н", "N" # Н
86
+ sub "О", "O" # О
87
+ sub "П", "P" # П
88
+ sub "Р", "R" # Р
89
+ sub "С", "S" # С
90
+ sub "Т", "T" # Т
91
+ sub "У", "U" # У
92
+ sub "Ф", "F" # Ф
93
+ sub "Х", "Kh" # Х
94
+ sub "Ц", "Ts" # Ц
95
+ sub "Ч", "Ch" # Ч
96
+ sub "Ш", "Sh" # Ш
97
+ sub "Щ", "Shch" # Щ
98
+ sub "Ю", "Yu" # Ю
99
+ sub "Я", "Ya" # Я
100
+ sub "Ь", "" # Ь
101
+ sub "а", "a" # а
102
+ sub "б", "b" # б
103
+ sub "в", "v" # в
104
+ sub "г", "h" # г
105
+ sub "ґ", "g" # ґ
106
+ sub "д", "d" # д
107
+ sub "е", "e" # е
108
+ sub "є", "ye" # є
109
+ sub "ж", "zh" # ж
110
+ sub "з", "z" # з
111
+ sub "и", "y" # и
112
+ sub "і", "i" # і
113
+ sub "ї", "yi" # ї
114
+ sub "й", "y" # й
115
+ sub "к", "k" # к
116
+ sub "л", "l" # л
117
+ sub "м", "m" # м
118
+ sub "н", "n" # н
119
+ sub "о", "o" # о
120
+ sub "п", "p" # п
121
+ sub "р", "r" # р
122
+ sub "с", "s" # с
123
+ sub "т", "t" # т
124
+ sub "у", "u" # у
125
+ sub "ф", "f" # ф
126
+ sub "х", "kh" # х
127
+ sub "ц", "ts" # ц
128
+ sub "ч", "ch" # ч
129
+ sub "ш", "sh" # ш
130
+ sub "щ", "shch" # щ
131
+ sub "ю", "yu" # ю
132
+ sub "я", "ya" # я
133
+ sub "ь", "" # ь
134
+ }
135
+
136
+ }
@@ -0,0 +1,220 @@
1
+ metadata {
2
+ authority_id: odni
3
+ id: 2015
4
+ language: iso-639-2:urd
5
+ source_script: Arab
6
+ destination_script: Latn
7
+ name: Office of the Director Of National Intelligence Hindi Urdu Personal Names 2015 System, ICS-630-01 Annex F
8
+
9
+ #url:
10
+ creation_date: 2015
11
+ confirmation_date: 2015
12
+ description: |
13
+ This system is the Intelligence Community (IC) standard for the transliteration of names
14
+ from Hindi and Urdu that will be applied to all final written reports and products for IC
15
+ consumers. It is not intended to eliminate variations of a name that can contribute
16
+ forensic information. Rather, it is to provide an IC standard Romanized (English)
17
+ transliteration from standard Hindi and Urdu that can then be linked to forensic
18
+ information in ways that will help identify the referent of the name.
19
+
20
+ There are typically a number of ways that names can be Romanized from either
21
+ Devanagari (Hindi) or modified Arabic (Urdu) scripts. Ambiguities can result from the
22
+ Romanization of Hindi and Urdu names for several reasons, including the fact that some
23
+ sounds in South Asian languages (e.g., retroflex consonants, voiced aspirates) have no
24
+ equivalent in English or other European languages. In the case of Urdu, as in the original
25
+ Arabic source of many Islamic names, short vowel markings, double consonant marks
26
+ and other diacritics that would clearly distinguish the name are almost always omitted
27
+ from standard written texts. And many Islamic names of Arabic or Persian origin reflect
28
+ spelling distinctions from those languages that are lost in modern Urdu pronunciation
29
+ (e.g., three distinct Arabic letters all represent the identical sound [s] for Urdu speakers);
30
+ transliterations might either maintain those spelling distinctions or ignore them entirely.
31
+ And, as in the Arabic source, names containing the Arabic definite article ‘al’ (‘ul’) show
32
+ anticipatory assimilation in pronunciation (e.g., Shams al Din > Shamsuddin);
33
+ transliterations may either reflect spelling or pronunciation in such cases.
34
+
35
+ Because Hindi and Urdu overlap so extensively, it is desirable to correlate Hindi and
36
+ Urdu transliterations as much as possible. In the area of names, this can become
37
+ problematic when the Urdu spelling accurately reflects original Arabic spelling while the
38
+ Hindi spelling was phonetically-based, in essence, already a transliteration. This would
39
+ argue for ignoring Arabic/Urdu spelling distinctions not reflected in pronunciation in
40
+ either Urdu or Hindi (e.g., letter sin versus letter sad) while maintaining Arabic/Urdu
41
+ spelling distinctions that Hindi also maintains (e.g., qaf as in Qutubbin versus kaf).
42
+ However, this is not always possible (see Hindi va versus Urdu wau).
43
+
44
+ In cases where an individual’s name has already been transliterated, that is to be indicated
45
+ – as found – in parentheses immediately following its rendition in the transliteration
46
+ standard (e.g., Muhammad Khulud (Mohamed Khulood)). In addition, if the original
47
+ Devanagari or Arabic-script spelling is known, that spelling should also appear in
48
+ parentheses following the name, if possible, following best practices of the issuing
49
+ organization and taking into consideration information system capabilities. This
50
+ convention is designed to ensure that vital forensic information is not lost.
51
+
52
+ For names of persons who are known to not be part of the Hindi- or Urdu-speaking
53
+ community, use the relevant IC transliteration standard for names from that language
54
+ (e.g., Mikhail, Yitzhak). A translator’s note may be used to clarify the known origin of
55
+ the person. Spell names of individuals from languages that are written in Roman letters as
56
+ they are spelled in those languages (e.g., George Clooney, Jorge Garcia, Georges
57
+ Pompidou).
58
+
59
+ In the case of active senior government officials in the on-line CIA World Factbook and
60
+ the on-line directory of Chiefs of State and Cabinet Members of Foreign Governments,
61
+ the spellings given in these on-line reference works should be used in place of the IC
62
+ Standard. For any individual who has at one time been listed in the Factbook or Chiefs of
63
+ State directory but who no longer appears in those resources (i.e. is no longer a
64
+ government official), the IC Standard spelling should appear first, with the spelling, if
65
+ known, as it previously appeared in those resources listed within parentheses at the first
66
+ usage.
67
+
68
+ The primary goal of this system is to produce a consistent Romanized transcription of the
69
+ name that is readable to the non-specialist. The system uses the 26 letters of the standard
70
+ (English) Roman alphabet. Some ambiguities in the Romanized form will occur without
71
+ the use of diacritics. However, within the context of a report, where additional
72
+ information about the individual is provided, the referent will be clearly identified.
73
+ Additionally, this system will be used in conjunction with on-line tools, name dictionaries
74
+ and lists containing conventional spellings of names of well-known individuals.
75
+
76
+ notes:
77
+
78
+ - |
79
+ Long/Short Vowels: Long and short vowels are not distinguished in the system:
80
+ The borrowed Arabic name Samir could represent two distinct names, one with a
81
+ long /a/ (Saamir) and one with a long /i/ (Samiir). One solution would be to use
82
+ /ee/ to stand for the long /i/, as is often done (Sameer). The IC Standard will not
83
+ distinguish between these.
84
+
85
+ - |
86
+ No distinction is made between: retroflex and non-retroflex consonants; and
87
+ nasalized vowels and vowels followed by /n/.
88
+ - |
89
+ No distinction is made between the several Arabic letters with the same phonetic
90
+ value in Urdu: e.g., letters sin/svad, zal/ze/zoe.
91
+ - |
92
+ A distinction is drawn between Urdu letters qaf and kaf (and correspondingly,
93
+ Hindi qa and ka).
94
+ - |
95
+ A distinction is drawn between nonaspirated (e.g., /d/) and aspirated consonants
96
+ (e.g., /dh/), with the exception of ch/chh, both represented by /ch/.
97
+ - |
98
+ Double consonants: Double consonants represented by the tashdid (shaddah) are
99
+ shown in most cases (e.g., Hassan, Muhammad). Exceptions: consonants
100
+ represented by digraphs are not doubled (e.g., Mubashir [not Mubashshir]).
101
+ - |
102
+ Hamzah (glottal stop) and ayn: Unlike in the Arabic IC Standard, these are not
103
+ represented in the IC standard.
104
+ - |
105
+ Digraphs: No distinction is made between digraphs such as /sh/ and single
106
+ contiguous letters such as /s/ followed by /h/.
107
+ - |
108
+ Arabic definite article “al” (‘the’): Shows sun letter assimilation in the
109
+ Romanized form (e.g., Abdur Rahman rather than Abdal Rahman or the
110
+ Arabic IC standard 'Abd al-Rahman).
111
+ - |
112
+ Special Rules
113
+ - |
114
+ Hyphens: Hyphens (-) are NOT used to connect name elements within a name:
115
+ Abdur Rahman. The single exception to this is the izafat (i.e., linking vowel in
116
+ noun-link-modifier construction of Persian origin), which does show a hyphen
117
+ before the /e/ and a following space: Koh-e Nur (‘mountain of light’), “Jaish-e
118
+ xx” (‘Army of xx’ construction).
119
+ - |
120
+ Names incorporating “din” are written as one unit: Azermuddin, Badruddin,
121
+ Faizuddin, Salahuddin.
122
+ - |
123
+ Names that incorporate Allah as part of the name show the Arabic grammatical
124
+ marker /u/ rather than the /a/ of Allah: Abdullah (not Abdallah).
125
+ - |
126
+ Inherent short vowel /a/ in Devanagari is represented with an /a/ in Roman. Final
127
+ consonants are assumed not to have a short /a/ (e.g., masc. name Ram Lal, not
128
+ Rama Lala).
129
+ - |
130
+ As a general rule, Devanagari va is transcribed as a /v/: Vijay, Vishal, etc.
131
+ Exception: /sw/ combination: Saraswati, Krishnaswami. Urdu wau, however, is
132
+ transcribed as /w/: Wasim, Walid.
133
+ }
134
+
135
+ tests { # Each entry pairs an Urdu-script input with a Latin string. NOTE(review): the Latin strings mirror the current substitution table (e.g. U+0648 yields i, U+06BE yields s) — confirm them against the standard before relying on them.
136
+ test "وشال ٹھاکر", "ishal tsakr"
137
+ test "حسن محمود", "hasn mhamid"
138
+ test "یوسف خان", "iisf khan"
139
+ test "معین خان", "mein khan"
140
+ test "سعید اجمل", "seid ajml"
141
+ test "انضمام الحق", "anzmam alhaq"
142
+ test "فرہاد رضا", "frahad rza"
143
+ test "وسیم اکرام", "isim akram"
144
+ test "شکیب الحسن", "shkib alhasn"
145
+ test "حسن عبد اللہ", "hasn ebd allah"
146
+ }
147
+
148
+
149
+ stage {
150
+
151
+ # CHARACTERS: substitutions from Arabic-script code points (and a few two-code-point sequences) to Latin strings
152
+ parallel {
153
+
154
+
155
+ sub "\u0622", "a" # ARABIC LETTER ALEF WITH MADDA ABOVE
156
+ sub "\u0627", "a" # or u ARABIC ALEF
157
+ sub "\u06cc", "i" # or ai or u ARABIC LETTER FARSI YEH
158
+ sub "\u0648", "i" # or o,au ARABIC LETTER WAW — NOTE(review): i looks wrong for WAW, but the tests in this file expect it; confirm
159
+ sub "\u06d2", "e" # ARABIC LETTER YEH BARREE
160
+ sub "\u0650", "e" # ARABIC KASRA
161
+ sub "\u0639", "e" # ARABIC LETTER AIN
162
+ sub "\u06c1", "ah" # ARABIC LETTER HEH GOAL
163
+ sub "\u062d", "ha" # ARABIC LETTER HAH
164
+ sub "\u0648\u0670", "a" # ARABIC LETTER WAW + ARABIC LETTER SUPERSCRIPT ALEF — NOTE(review): the earlier comment named FARSI YEH (U+06CC); confirm which letter is intended
165
+ sub "\u0670", "a" # ARABIC LETTER SUPERSCRIPT ALEF
166
+ sub "\u0627\u0650", "i" # ARABIC ALEF + ARABIC KASRA
167
+ sub "\u0639\u0650", "i" # ARABIC LETTER AIN + ARABIC KASRA
168
+ sub "\u064f", "i" # ARABIC DAMMA — NOTE(review): damma usually marks a short u; confirm that i is intended
169
+ sub "\u06d3", "i" # ARABIC LETTER YEH BARREE WITH HAMZA ABOVE
170
+ sub "\u06c2", "-e" # ARABIC LETTER HEH GOAL WITH HAMZA ABOVE
171
+ sub "\u06c1\u0650", "o" # ARABIC LETTER HEH GOAL + ARABIC KASRA — NOTE(review): the earlier comment named YEH WITH HAMZA ABOVE (U+0626); confirm the intended source sequence
172
+ sub "\u0624", "au" # ARABIC LETTER WAW WITH HAMZA ABOVE
173
+
174
+
175
+
176
+ sub "\u06a9", "k" # ARABIC LETTER KEHEH
177
+ sub "\u0642", "q" # ARABIC LETTER QAF
178
+ sub "\u062e", "kh" # ARABIC LETTER KHAH
179
+ sub "\u06af", "g" # ARABIC LETTER GAF
180
+ sub "\u063a", "gh" # ARABIC LETTER GHAIN
181
+ sub "\u0686", "ch" # ARABIC LETTER TCHEH
182
+ sub "\u062c", "j" # ARABIC LETTER JEEM
183
+
184
+ sub "\u0632", "z" # Arabic Letter ZAIN
185
+ sub "\u0630", "z" # Arabic Letter THAL
186
+ sub "\u0636", "z" # Arabic Letter DAD
187
+ sub "\u0638", "z" # Arabic Letter ZAH
188
+ sub "\u0698", "zh" # Arabic Letter JEH
189
+
190
+
191
+ sub "\u0679", "t" # ARABIC LETTER TTEH
192
+ sub "\u0688", "d" # Arabic Letter DDAL
193
+ sub "\u062f", "d" # Arabic Letter DAL
194
+ sub "\u0691", "r" # Arabic Letter RREH
195
+ sub "\u062a", "t" # Arabic Letter TEH
196
+ sub "\u0637", "t" # Arabic Letter TAH
197
+ sub "\u0646", "n" # Arabic Letter NOON
198
+ sub "\u06ba", "n" # Arabic Letter NOON GHUNNA
199
+
200
+
201
+ sub "\u067e", "p" # Arabic Letter PEH
202
+ sub "\u0641", "f" # Arabic Letter FEH
203
+ sub "\u0628", "b" # Arabic Letter BEH
204
+ sub "\u0645", "m" # Arabic Letter MEEM
205
+ sub "\u0631", "r" # Arabic Letter REH
206
+ sub "\u0644", "l" # Arabic Letter LAM
207
+ sub "\u0634", "sh" # Arabic Letter SHEEN
208
+ sub "\u0633", "s" # Arabic Letter SEEN
209
+ sub "\u062b", "s" # Arabic Letter THEH
210
+ sub "\u0635", "s" # Arabic Letter SAD
211
+ sub "\u0621", "" # Arabic Letter HAMZA (replaced by the empty string)
212
+ sub "\u06be", "s" # Arabic Letter HEH DOACHASHMEE — NOTE(review): mapped to s rather than h; the tests in this file expect s, confirm
213
+ sub "\u064b", "n" # Arabic FATHATAN
214
+ sub "\u064e", "n" # Arabic FATHA — NOTE(review): the earlier comment said FATHATAN; n for FATHA looks copied from the entry above, confirm
215
+ sub "\u0652", "" # Arabic SUKUN (replaced by the empty string)
216
+ sub "\u0651", "" # Arabic SHADDA (replaced by the empty string)
217
+ }
218
+
219
+ }
220
+