interscript 0.1.2 → 0.1.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (261) hide show
  1. checksums.yaml +4 -4
  2. data/README.adoc +250 -17
  3. data/lib/g2pwrapper.py +34 -0
  4. data/lib/interscript.rb +142 -20
  5. data/lib/interscript/command.rb +28 -0
  6. data/lib/interscript/fs.rb +69 -0
  7. data/lib/interscript/mapping.rb +142 -0
  8. data/lib/interscript/opal.rb +57 -0
  9. data/lib/interscript/opal/entrypoint.rb +12 -0
  10. data/lib/interscript/opal/map_translate.rb +7 -0
  11. data/lib/interscript/opal/maps.js.erb +10 -0
  12. data/lib/interscript/version.rb +1 -1
  13. data/lib/model-7 +0 -0
  14. data/lib/tha-pt-b-7 +0 -0
  15. data/maps/acadsin-zho-Hani-Latn-2002.yaml +38916 -0
  16. data/maps/alalc-amh-Ethi-Latn-1997.yaml +513 -0
  17. data/maps/alalc-amh-Ethi-Latn-2011.yaml +138 -0
  18. data/maps/alalc-ara-Arab-Latn-1997.yaml +1287 -0
  19. data/maps/alalc-asm-Deva-Latn-1997.yaml +165 -0
  20. data/maps/alalc-asm-Deva-Latn-2012.yaml +40 -0
  21. data/maps/alalc-aze-Cyrl-Latn-1997.yaml +145 -0
  22. data/maps/alalc-bel-Cyrl-Latn-1997.yaml +129 -0
  23. data/maps/alalc-ben-Beng-Latn-2017.yaml +130 -0
  24. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +98 -0
  25. data/maps/alalc-ell-Grek-Latn-1997.yaml +628 -0
  26. data/maps/alalc-ell-Grek-Latn-2010.yaml +626 -0
  27. data/maps/alalc-guj-Gujr-Latn-1997.yaml +266 -0
  28. data/maps/alalc-guj-Gujr-Latn-2011.yaml +64 -0
  29. data/maps/alalc-hin-Deva-Latn-1997.yaml +211 -0
  30. data/maps/alalc-hin-Deva-Latn-2011.yaml +47 -0
  31. data/maps/alalc-kat-Geok-Latn-1997.yaml +111 -0
  32. data/maps/alalc-kat-Geor-Latn-1997.yaml +150 -0
  33. data/maps/alalc-kor-Hang-Latn-1997.yaml +98 -0
  34. data/maps/alalc-mal-Mlym-Latn-1997.yaml +303 -0
  35. data/maps/alalc-mal-Mlym-Latn-2012.yaml +73 -0
  36. data/maps/alalc-mar-Deva-Latn-1997.yaml +189 -0
  37. data/maps/alalc-mar-Deva-Latn-2011.yaml +45 -0
  38. data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +114 -0
  39. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +103 -0
  40. data/maps/alalc-mon-Cyrl-Latn-1997.yaml +220 -0
  41. data/maps/alalc-pan-Guru-Latn-1997.yaml +256 -0
  42. data/maps/alalc-pan-Guru-Latn-2011.yaml +78 -0
  43. data/maps/alalc-per-Arab-Latn-1997.yaml +375 -0
  44. data/maps/alalc-pli-Deva-Latn-2012.yaml +144 -0
  45. data/maps/alalc-pra-Deva-Latn-2012.yaml +47 -0
  46. data/maps/alalc-rus-Cyrl-Latn-1997.yaml +225 -0
  47. data/maps/alalc-rus-Cyrl-Latn-2012.yaml +162 -0
  48. data/maps/alalc-san-Deva-Latn-2012.yaml +172 -0
  49. data/maps/alalc-sin-Sinh-Latn-1997.yaml +292 -0
  50. data/maps/alalc-sin-Sinh-Latn-2011.yaml +71 -0
  51. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +118 -0
  52. data/maps/alalc-srp-Cyrl-Latn-2013.yaml +135 -0
  53. data/maps/alalc-tam-Taml-Latn-1997.yaml +62 -0
  54. data/maps/alalc-tam-Taml-Latn-2011.yaml +58 -0
  55. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +145 -0
  56. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +16 -0
  57. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +283 -0
  58. data/maps/{bas-rus-Cyrl-Latn-bss.yaml → bas-rus-Cyrl-Latn-2017-bss.yaml} +58 -33
  59. data/maps/{bas-rus-Cyrl-Latn-oss.yaml → bas-rus-Cyrl-Latn-2017-oss.yaml} +55 -35
  60. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +292 -0
  61. data/maps/bgn-kor-Hang-Latn-1943.yaml +35 -0
  62. data/maps/bgn-kor-Kore-Latn-1943.yaml +31 -0
  63. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +208 -0
  64. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +208 -0
  65. data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +532 -0
  66. data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +596 -0
  67. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +2 -3
  68. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +104 -0
  69. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +188 -0
  70. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +289 -0
  71. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +119 -0
  72. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +15 -65
  73. data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +184 -0
  74. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +705 -0
  75. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +23 -0
  76. data/maps/{bgnpcgn-per-Arab-Latn-1956.yaml → bgnpcgn-fas-Arab-Latn-1956.yaml} +5 -2
  77. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +257 -0
  78. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +131 -0
  79. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +42 -0
  80. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +253 -0
  81. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +48 -0
  82. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +48 -0
  83. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +163 -0
  84. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +190 -0
  85. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +223 -0
  86. data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +230 -0
  87. data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +336 -0
  88. data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +639 -0
  89. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +459 -0
  90. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +168 -0
  91. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +150 -65
  92. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +170 -0
  93. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +220 -0
  94. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +240 -0
  95. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +80 -4
  96. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +119 -0
  97. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +127 -0
  98. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +82 -0
  99. data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +7456 -0
  100. data/maps/bis-asm-Beng-Latn-13194-1991.yaml +159 -0
  101. data/maps/bis-ben-Beng-Latn-13194-1991.yaml +156 -0
  102. data/maps/bis-dev-Deva-Latn-13194-1991.yaml +184 -0
  103. data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +181 -0
  104. data/maps/bis-knd-Knda-Latn-13194-1991.yaml +173 -0
  105. data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +176 -0
  106. data/maps/bis-ori-Orya-Latn-13194-1991.yaml +160 -0
  107. data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +175 -0
  108. data/maps/bis-tel-Telu-Latn-13194-1991.yaml +170 -0
  109. data/maps/bis-tml-Taml-Latn-13194-1991.yaml +155 -0
  110. data/maps/by-bel-Cyrl-Latn-1998.yaml +172 -0
  111. data/maps/by-bel-Cyrl-Latn-2007.yaml +115 -0
  112. data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +899 -0
  113. data/maps/din-hin-Deva-Latn-33904-2018.yaml +100 -0
  114. data/maps/din-kat-Geor-Latn-32707-2010.yaml +145 -0
  115. data/maps/din-mar-Deva-Latn-33904-2018.yaml +84 -0
  116. data/maps/din-nep-Deva-Latn-33904-2018.yaml +119 -0
  117. data/maps/din-pli-Deva-Latn-33904-2018.yaml +75 -0
  118. data/maps/din-pra-Deva-Latn-33904-2018.yaml +63 -0
  119. data/maps/din-san-Deva-Latn-33904-2018.yaml +338 -0
  120. data/maps/din-tam-Taml-Latn-33903-2016.yaml +213 -0
  121. data/maps/dos-nep-Deva-Latn-1997.yaml +47 -0
  122. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +684 -0
  123. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +680 -0
  124. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +19 -0
  125. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +31 -0
  126. data/maps/ggg-kat-Geor-Latn-2002.yaml +92 -0
  127. data/maps/gki-bel-Cyrl-Latn-1992.yaml +33 -0
  128. data/maps/gki-bel-Cyrl-Latn-2000.yaml +201 -0
  129. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +190 -0
  130. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +157 -0
  131. data/maps/hk-yue-Hani-Latn-1888.yaml +38497 -0
  132. data/maps/icao-bel-Cyrl-Latn-9303.yaml +109 -98
  133. data/maps/icao-bul-Cyrl-Latn-9303.yaml +2 -7
  134. data/maps/{icao-per-Arab-Latn-9303.yaml → icao-fas-Arab-Latn-9303.yaml} +6 -8
  135. data/maps/icao-heb-Hebr-Latn-9303.yaml +119 -125
  136. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +2 -3
  137. data/maps/icao-rus-Cyrl-Latn-9303.yaml +2 -4
  138. data/maps/icao-srp-Cyrl-Latn-9303.yaml +2 -3
  139. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +2 -4
  140. data/maps/iso-ara-Arab-Latn-233-1984.yaml +323 -0
  141. data/maps/iso-asm-Beng-Latn-15919-2001.yaml +75 -0
  142. data/maps/iso-ben-Beng-Latn-15919-2001.yaml +175 -0
  143. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +613 -0
  144. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +44 -0
  145. data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +220 -0
  146. data/maps/iso-hin-Deva-Latn-15919-2001.yaml +87 -0
  147. data/maps/iso-inc-Deva-Latn-15919-2001.yaml +61 -0
  148. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +66 -0
  149. data/maps/iso-kan-Knda-Latn-15919-2001.yaml +220 -0
  150. data/maps/iso-kat-Geor-Latn-9984-1996.yaml +145 -0
  151. data/maps/iso-kor-Hang-Latn-1996-method1.yaml +240 -0
  152. data/maps/iso-kor-Hang-Latn-1996-method2.yaml +226 -0
  153. data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +281 -0
  154. data/maps/iso-mar-Deva-Latn-15919-2001.yaml +75 -0
  155. data/maps/iso-nep-Deva-Latn-15919-2001.yaml +87 -0
  156. data/maps/iso-ori-Orya-Latn-15919-2001.yaml +193 -0
  157. data/maps/iso-pan-Guru-Latn-15919-2001.yaml +222 -0
  158. data/maps/iso-pli-Beng-Latn-15919-2001.yaml +73 -0
  159. data/maps/iso-pli-Deva-Latn-15919-2001.yaml +74 -0
  160. data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +219 -0
  161. data/maps/iso-pli-Thai-Latn-15919-2001.yaml +55 -0
  162. data/maps/iso-pra-Deva-Latn-15919-2001.yaml +59 -0
  163. data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +366 -0
  164. data/maps/{iso-rus-Cyrl-Latn-iso9.yaml → iso-rus-Cyrl-Latn-9-1995.yaml} +4 -6
  165. data/maps/iso-san-Deva-Latn-15919-2001.yaml +220 -0
  166. data/maps/iso-tam-Taml-Latn-15919-2001.yaml +159 -0
  167. data/maps/iso-tel-Telu-Latn-15919-2001.yaml +220 -0
  168. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +109 -0
  169. data/maps/kp-kor-Hang-Latn-2002.yaml +909 -0
  170. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +44820 -0
  171. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +411 -0
  172. data/maps/mns-mon-Cyrl-Latn-5217-2012.yaml +163 -0
  173. data/maps/mns-mon-Latn-Cyrl-5217-2012.yaml +200 -0
  174. data/maps/moct-kor-Hang-Latn-2000.yaml +807 -0
  175. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +541 -0
  176. data/maps/mvd-bel-Cyrl-Latn-2008.yaml +225 -0
  177. data/maps/mvd-bel-Cyrl-Latn-2010.yaml +63 -0
  178. data/maps/mvd-rus-Cyrl-Latn-2008.yaml +109 -0
  179. data/maps/mvd-rus-Cyrl-Latn-2010.yaml +37 -0
  180. data/maps/odni-ara-Arab-Latn-2015.yaml +425 -0
  181. data/maps/odni-aze-Cyrl-Latn-2015.yaml +144 -0
  182. data/maps/odni-bel-Cyrl-Latn-2015.yaml +148 -0
  183. data/maps/odni-bul-Cyrl-Latn-2015.yaml +96 -0
  184. data/maps/odni-che-Cyrl-Latn-2015.yaml +169 -0
  185. data/maps/odni-fas-Arab-Latn-2015.yaml +406 -0
  186. data/maps/odni-hin-Deva-Latn-2015.yaml +258 -0
  187. data/maps/odni-kat-Geor-Latn-2015.yaml +87 -0
  188. data/maps/odni-kaz-Cyrl-Latn-2015.yaml +148 -0
  189. data/maps/odni-kir-Cyrl-Latn-2015.yaml +136 -0
  190. data/maps/odni-kor-Hang-Latn-2015.yaml +375 -0
  191. data/maps/odni-mkd-Cyrl-Latn-2015.yaml +122 -0
  192. data/maps/odni-per-Arab-Latn-2015.yaml +228 -0
  193. data/maps/odni-rus-Cyrl-Latn-2015.yaml +77 -0
  194. data/maps/odni-srp-Cyrl-Latn-2015.yaml +129 -0
  195. data/maps/odni-tat-Cyrl-Latn-2015.yaml +142 -0
  196. data/maps/odni-tgk-Cyrl-Latn-2015.yaml +148 -0
  197. data/maps/odni-uig-Cyrl-Latn-2015.yaml +138 -0
  198. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +157 -0
  199. data/maps/odni-urd-Arab-Latn-2015.yaml +221 -0
  200. data/maps/odni-uzb-Cyrl-Latn-2015.yaml +166 -0
  201. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +90 -0
  202. data/maps/royin-tha-Thai-Latn-1968.yaml +183 -0
  203. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +180 -0
  204. data/maps/royin-tha-Thai-Latn-1999.yaml +80 -0
  205. data/maps/{cn-chn-Hans-Latn-pinyin.yaml → sac-zho-Hans-Latn-1979.yaml} +11 -8
  206. data/maps/sasm-mon-Mong-Latn-general-1978.yaml +389 -0
  207. data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +354 -0
  208. data/maps/ses-ara-Arab-Latn-1930.yaml +283 -0
  209. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +222 -0
  210. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +197 -0
  211. data/maps/ua-ukr-Cyrl-Latn-2007.yaml +75 -0
  212. data/maps/ua-ukr-Cyrl-Latn-2010.yaml +192 -0
  213. data/maps/un-amh-Ethi-Latn-2016.yaml +602 -0
  214. data/maps/un-ara-Arab-Latn-1971.yaml +139 -0
  215. data/maps/un-ara-Arab-Latn-1972.yaml +159 -0
  216. data/maps/un-ara-Arab-Latn-2017.yaml +420 -0
  217. data/maps/un-bel-Cyrl-Latn-2007.yaml +114 -0
  218. data/maps/un-ben-Beng-Latn-2016.yaml +534 -0
  219. data/maps/un-ell-Grek-Latn-1987-phonetic.yaml +780 -0
  220. data/maps/un-ell-Grek-Latn-1987-tl.yaml +31 -0
  221. data/maps/un-ell-Grek-Latn-1987-ts.yaml +19 -0
  222. data/maps/un-hin-Deva-Latn-2016.yaml +222 -0
  223. data/maps/un-mar-Deva-Latn-2016.yaml +91 -0
  224. data/maps/un-mon-Mong-Latn-general-2013.yaml +264 -0
  225. data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +264 -0
  226. data/maps/un-nep-Deva-Latn-1972.yaml +350 -0
  227. data/maps/un-nep-Deva-Latn-2013.yaml +74 -0
  228. data/maps/un-rus-Cyrl-Latn-1987.yaml +166 -0
  229. data/maps/un-ukr-Cyrl-Latn-1998.yaml +53 -0
  230. data/maps/un-ukr-Cyrl-Latn-2012.yaml +162 -0
  231. data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +221 -0
  232. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +406 -0
  233. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +386 -0
  234. data/maps/var-kor-Hang-Hang-jamo.yaml +11193 -0
  235. data/maps/var-kor-Hang-Latn-mr-1939.yaml +1054 -0
  236. data/maps/var-kor-Kore-Hang-2013.yaml +59754 -0
  237. data/maps/var-kor-Kore-Latn-mr-1939.yaml +36 -0
  238. data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +43 -0
  239. data/maps/var-mon-Mong-Latn-1930.yaml +102 -0
  240. data/maps/var-mon-Mong-Latn-lessing.yaml +272 -0
  241. data/maps/var-mon-Mong-Latn-vpmc.yaml +274 -0
  242. data/maps/var-pra-Deva-Latn-iast-1912.yaml +30 -0
  243. data/maps/var-san-Deva-Latn-iast-1912.yaml +149 -0
  244. data/maps/var-tha-Thai-Thai-phonemic.yaml +59 -0
  245. data/maps/var-tha-Thai-Zsym-ipa.yaml +301 -0
  246. data/maps/var-zho-Hani-Latn-wd-1979.yaml +38912 -0
  247. data/spec/interscript/filenames_spec.rb +384 -0
  248. data/spec/interscript/mapping_spec.rb +42 -0
  249. data/spec/interscript_spec.rb +23 -5
  250. data/spec/spec_helper.rb +3 -1
  251. metadata +364 -34
  252. data/bin/interscript +0 -20
  253. data/bin/rspec +0 -29
  254. data/maps/bgnpcgn-chn-Hans-Latn-pinyin.yaml +0 -7503
  255. data/maps/historic-jpn-Hrkt-Latn-hepburn.yaml +0 -336
  256. data/maps/icao-gre-Grek-Latn-9303.yaml +0 -101
  257. data/maps/mext-jpn-Hrkt-Latn-hepburn.yaml +0 -330
  258. data/maps/mext-jpn-Hrkt-Latn-kunrei.yaml +0 -308
  259. data/maps/un-jpn-Hrkt-Latn-hepburn.yaml +0 -313
  260. data/maps/un-jpn-Hrkt-Latn-kunrei.yaml +0 -354
  261. data/maps/un-mon-Mong-Latn-2013.yaml +0 -80
@@ -0,0 +1,274 @@
1
+ ---
2
+ authority_id: var
3
+ id: VPMC
4
+ language: iso-639-2:mon
5
+ source_script: Mong
6
+ destination_script: Latn
7
+ name: Transliteration Systems for Uyghur-Mongolian or Vertical or Old Script
8
+ url: https://collab.its.virginia.edu/wiki/tibetan-script/Transliteration%20Schemes%20for%20Mongolian%20Vertical%20Script.html
9
+ creation_date:
10
+ description: |
11
+ The only system for the Mongolian vertical script which is used commonly throughout
12
+ Mongolian studies worldwide is the Vladimirtsov-Mostaert system (V-M). The only
13
+ dictionary using this system is in an appendix to Antoine Mostaert’s Dictionnaire
14
+ ordos. Thus the Harvard Journal of Asiatic Studies specifies, “please use the written
15
+ Mongolian appendix to Antoine Mostaert’s Dictionnaire ordos.” However, the V-M system
16
+ has many difficult diacriticals and non-Latin characters that constitute a significant
17
+ problem for editors and thus is difficult to recommend.
18
+
19
+ notes:
20
+ - A separated final form of vowels a or e is common, and can appear at the end
21
+ of a word, word stem, or suffix. This form requires a final-shaped preceding
22
+ consonant and an inter-word gap in between. The vowels themselves appear as ᠎ᠠ,
23
+ and with consonants as ‍ᠬ᠎ᠠ q‑a, ‍ᠷ᠎ᠠ r‑a/r‑e, etc. This gap can be transliterated
24
+ with a hyphen. In digital typesetting, these forms are triggered by inserting
25
+ a U+180E ᠎ MONGOLIAN VOWEL SEPARATOR (HTML ᠎ · MVS) between the consonant
26
+ and vowel.
27
+ - All case suffixes, as well as any plural suffixes consisting of one or two
28
+ syllables are likewise separated by a preceding and hyphen-transliterated gap.
29
+ In digital typesetting, this gap is represented by a U+202F   NARROW NO-BREAK SPACE
30
+ (HTML   · NNBSP). A maximum of two case suffixes can be added to a stem.
31
+ Single-letter vowel suffixes appear with the final-shaped forms of a/e, i, or u/ü,
32
+ as in ᠭᠠᠵᠠᠷ ᠠ γaǰar‑a 'to the country' and ᠡᠳᠦᠷ ᠡ edür‑e 'on the day', or ᠤᠯᠤᠰ ᠢ ulus‑i
33
+ 'the state' etc. Multi-letter suffixes most often start with an initial- (consonants),
34
+ medial- (vowels), or variant-shaped form.
35
+
36
+ tests:
37
+ - source: ᠬ᠎ᠠ
38
+ expected: q-a
39
+ - source: ᠷ᠎ᠠ
40
+ expected: r-a
41
+ - source: ᠭᠠᠵᠠᠷ ᠠ
42
+ expected: γaǰar-a
43
+ - source: ᠡᠳᠦᠷ ᠡ
44
+ expected: edür-e
45
+ - source: ᠤᠯᠤᠰ ᠢ
46
+ expected: ulus-i
47
+ - source: ᠬᠥᠬᠡᠬᠣᠲᠠ # Хөх хот
48
+ expected: kökeqota
49
+ - source: ᠣᠷᠳᠣᠰ ᠬᠣᠲᠠ # Ордос хот
50
+ expected: ordos qota
51
+ - source: ᠪᠠᠶᠠᠨᠨᠠᠭᠤᠷ ᠬᠣᠲᠠ # Баяннуур хот
52
+ expected: bayannaγur qota
53
+ - source: ᠤᠯᠠᠭᠠᠨᠬᠣᠲᠠ # Улаан хот
54
+ expected: ulaγanqota
55
+ - source: ᠬᠣᠣᠯᠢᠠ ᠭᠣᠤᠯ ᠬᠣᠲᠠ # Хоолингол хот
56
+ expected: qoolia γoul qota
57
+ - source: ᠡᠷᠢᠶᠡᠨ ᠬᠣᠲᠠ # Эрээн хот
58
+ expected: eriyen qota
59
+ - source: ᠷᠠᠰᠢᠶᠠᠨ ᠬᠣᠲᠠ # Рашаан хот
60
+ expected: rasiyan qota
61
+ - source: ᠪᠠᠭᠠᠷᠢᠨ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # Баарин баруун хошуу
62
+ expected: baγarin baraγun qosiγu
63
+ - source: ᠪᠠᠭᠠᠷᠢᠨ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # Баарин зүүн хошуу
64
+ expected: baγarin ǰegün qosiγu
65
+ - source: ᠲᠦᠩᠯᠢᠶᠣᠤ ᠬᠣᠲᠠ # Байшинт хот
66
+ expected: tüngliyou qota
67
+ - source: ᠰᠢᠯᠢ ᠶᠢᠨ ᠬᠣᠲᠠ # Шилийн хот
68
+ expected: sili-yin qota
69
+ - source: ᠬᠣᠷᠢᠨ ᠭᠡᠷ ᠰᠢᠶᠠᠨ # Horinger County
70
+ expected: qorin ger siyan
71
+ - source: ᠤᠳᠠ ᠲᠣᠭᠣᠷᠢᠭ # Уда тойрог
72
+ expected: uda toγoriγ
73
+ - source: ᠦᠬᠠᠢ ᠬᠣᠲᠠ # Үхай хот
74
+ expected: üqai qota
75
+ - source: ᠬᠠᠶᠢᠨᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Hainan District
76
+ expected: qayinan toγoriγ
77
+ - source: ᠬᠠᠶᠢᠷᠤᠪ ᠤᠨ ᠲᠣᠬᠣᠢ ᠲᠣᠭᠣᠷᠢᠭ # Haibowan District
78
+ expected: qayirub-un toqoi toγoriγ
79
+ - source: ᠤᠯᠠᠭᠠᠨᠴᠠᠪ ᠬᠣᠲᠠ # Улаанцав хот
80
+ expected: ulaγančab qota
81
+ - source: ᠵᠢᠨᠢᠩ ᠲᠣᠭᠣᠷᠢᠭ # Жинин тойрог
82
+ expected: ǰining toγoriγ
83
+ - source: ᠹᠸᠩᠵᠸᠡ ᠬᠣᠲᠠ # Фенжень хот
84
+ expected: fvngǰve qota
85
+ - source: ᠱᠠᠩᠳᠤ ᠰᠢᠶᠠᠨ # Шанду шянь
86
+ expected: šangdu siyan
87
+ - source: ᠯᠢᠶᠠᠩᠴᠠᠩ ᠰᠢᠶᠠᠨ # Liangcheng County
88
+ expected: liyangčang siyan
89
+ - source: ᠴᠠᠬᠠᠷ ᠪᠠᠷᠠᠭᠤᠨ ᠭᠠᠷᠤᠨ ᠡᠮᠦᠨᠡᠳᠦ ᠬᠣᠰᠢᠭᠤ # Цахар баруун гарын өмнөд хошуу
90
+ expected: čaqar baraγun γarun emünedü qosiγu
91
+ - source: ᠴᠠᠬᠠᠷ ᠪᠠᠷᠠᠭᠤᠨ ᠭᠠᠷᠤᠨ ᠳᠤᠮᠳᠠᠳᠤ ᠬᠣᠰᠢᠭᠤ # Цахар баруун гарын дундад хошуу
92
+ expected: čaqar baraγun γarun dumdadu qosiγu
93
+ - source: ᠴᠠᠬᠠᠷ ᠪᠠᠷᠠᠭᠤᠨ ᠭᠠᠷᠤᠨ ᠬᠣᠶᠢᠲᠤ ᠬᠣᠰᠢᠭᠤ # Цахар баруун гарын хойд хошуу
94
+ expected: čaqar baraγun γarun qoyitu qosiγu
95
+ - source: ᠳᠥᠷᠪᠡᠳ ᠬᠣᠰᠢᠭᠤ # Дөрвөд хошуу
96
+ expected: dörbed qosiγu
97
+ - source: ᠪᠤᠭᠤᠲᠤ ᠬᠣᠲᠠ # Бугaт хот
98
+ expected: buγutu qota
99
+ - source: ᠬᠥᠨᠳᠡᠯᠡᠨ ᠲᠣᠭᠣᠷᠢᠭ # Hondlon District
100
+ expected: köndelen toγoriγ
101
+ - source: ᠴᠢᠩᠱᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Qingshan District
102
+ expected: čingšan toγoriγ
103
+ - source: ᠰᠢᠭᠤᠶᠢᠲᠤ ᠲᠣᠭᠣᠷᠢᠭ # Шигуай тойрог
104
+ expected: siγuyitu toγoriγ
105
+ - source: ᠵᠢᠦ ᠶᠤᠸᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Jiuyuan District
106
+ expected: ǰiü yuvan toγoriγ
107
+ - source: ᠭᠦᠶᠠᠩ ᠰᠢᠶᠠᠨ # Guyang County
108
+ expected: güyang siyan
109
+ - source: ᠲᠦᠮᠡᠳ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # Түмэд Зүүн хошуу
110
+ expected: tümed ǰegün qosiγu
111
+ - source: ᠲᠦᠮᠡᠳ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # Түмэд Баруун хошуу
112
+ expected: tümed baraγun qosiγu
113
+ - source: ᠳᠠᠷᠬᠠᠨ ᠮᠤᠤᠮᠢᠩᠭ᠋ᠠᠨ ᠬᠣᠯᠪᠣᠭᠠᠲᠤ ᠬᠣᠰᠢᠭᠤ # Darhan Muminggan United Banner
114
+ expected: darqan muumingγ᠋an qolboγatu qosiγu
115
+ - source: ᠬᠡᠰᠢᠭᠲᠡᠨ ᠬᠣᠰᠢᠭᠤ # Hexigten Banner
116
+ expected: kesiγten qosiγu
117
+ - source: ᠰᠢᠨ᠎ᠡ ᠪᠠᠷᠭᠤ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # New Barag Left Banner
118
+ expected: sin-e barγu ǰegün qosiγu
119
+ - source: ᠰᠢᠨ᠎ᠡ ᠪᠠᠷᠭᠤ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # New Barag Right Banner
120
+ expected: sin-e barγu baraγun qosiγu
121
+ - source: ᠣᠲᠣᠭ ᠬᠣᠰᠢᠭᠤ # Otog Banner
122
+ expected: otoγ qosiγu
123
+ - source: ᠳᠠᠯᠠᠳ ᠬᠣᠰᠢᠭᠤ # Dalad Banner
124
+ expected: dalad qosiγu
125
+ - source: ᠵᠡᠭᠦᠨᠭᠠᠷ ᠬᠣᠰᠢᠭᠤ # Jungar Banner
126
+ expected: ǰegünγar qosiγu
127
+ - source: ᠣᠲᠣᠭ ᠤᠨ ᠡᠮᠦᠨᠡᠳᠦ ᠬᠣᠰᠢᠭᠤ # Otog Front Banner
128
+ expected: otoγ-un emünedü qosiγu
129
+ - source: ᠬᠠᠩᠭᠢᠨ ᠬᠣᠰᠢᠭᠤ # Hanggin Banner
130
+ expected: qangγin qosiγu
131
+ - source: ᠦᠦᠰᠢᠨ ᠬᠣᠰᠢᠭᠤ # Uxin Banner
132
+ expected: üüsin qosiγu
133
+ - source: ᠡᠵᠢᠨ ᠬᠣᠷᠣᠭ᠎ᠠ ᠬᠣᠰᠢᠭᠤ # Эзэн Хороо хошуу
134
+ expected: eǰin qoroγ-a qosiγu
135
+ - source: ᠵᠠᠯᠠᠨ ᠠᠢ᠌ᠯ ᠬᠣᠲᠠ # Жалан-Айл хот
136
+ expected: ǰalan ai᠌l qota
137
+ - source: ᠶᠠᠭᠰᠢ ᠬᠣᠲᠠ # Ягши хот
138
+ expected: yaγsi qota
139
+ - source: ᠮᠠᠨᠵᠤᠤᠷ ᠬᠣᠲᠠ # Манжуур хот
140
+ expected: manǰuur qota
141
+ - source: ᠬᠠᠶᠢᠯᠠᠷ ᠲᠣᠭᠣᠷᠢᠭ # Хайлаар тойрог
142
+ expected: qayilar toγoriγ
143
+ - source: ᠬᠣᠷᠴᠢᠨ ᠲᠣᠭᠣᠷᠢᠭ # Horqin District
144
+ expected: qorčin toγoriγ
145
+ - source: ᠺᠠᠶᠢᠯᠦ ᠰᠢᠶᠠᠨ # Kailu County
146
+ expected: kayilü siyan
147
+ - source: ᠬᠦᠷᠢᠶ᠎ᠡ ᠬᠣᠰᠢᠭᠤ # Hure Banner
148
+ expected: küriy-e qosiγu
149
+ - source: ᠨᠠᠢᠮᠠᠨ ᠬᠣᠰᠢᠭᠤ # Naiman Banner
150
+ expected: naiman qosiγu
151
+ - source: ᠵᠠᠷᠤᠳ ᠬᠣᠰᠢᠭᠤ # Jarud Banner
152
+ expected: ǰarud qosiγu
153
+ - source: ᠬᠣᠷᠴᠢᠨ ᠪᠠᠷᠠᠭᠤᠨ ᠭᠠᠷᠤᠨ ᠳᠤᠮᠳᠠᠳᠤ ᠬᠣᠰᠢᠭᠤ # Хорчин Баруун Гарын Дундад Хошуу
154
+ expected: qorčin baraγun γarun dumdadu qosiγu
155
+ - source: ᠬᠣᠷᠴᠢᠨ ᠵᠡᠭᠦᠨ ᠭᠠᠷᠤᠨ ᠳᠤᠮᠳᠠᠳᠤ ᠬᠣᠰᠢᠭᠤ # Horqin Left Middle Banner
156
+ expected: qorčin ǰegün γarun dumdadu qosiγu
157
+ - source: ᠬᠣᠷᠴᠢᠨ ᠵᠡᠭᠦᠨ ᠭᠠᠷᠤᠨ ᠬᠣᠶᠢᠲᠤ ᠬᠣᠰᠢᠭᠤ # Horqin Left Rear Banner
158
+ expected: qorčin ǰegün γarun qoyitu qosiγu
159
+ - source: ᠤᠯᠠᠭᠠᠨᠬᠠᠳᠠ ᠬᠣᠲᠠ # Улаанхад хот
160
+ expected: ulaγanqada qota
161
+ - source: ᠰᠡᠷᠡᠴᠢ # Salaqi
162
+ expected: sereči
163
+ - source: ᠭᠡᠭᠡᠨ ᠭᠣᠤᠯ ᠬᠣᠲᠠ # Гэгээнгол хот
164
+ expected: gegen γoul qota
165
+ - source: ᠠᠯᠠᠱᠠ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # Alxa Left Banner
166
+ expected: alaša ǰegün qosiγu
167
+ - source: ᠠᠯᠠᠱᠠ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # Alxa Right Banner
168
+ expected: alaša baraγun qosiγu # Alaša Baraγun qosiγu
169
+ - source: ᠡᠵᠡᠨ᠎ᠡ ᠬᠣᠰᠢᠭᠤ # Ejin Banner
170
+ expected: eǰen-e qosiγu
171
+ - source: ᠬᠥᠪᠡᠭᠡᠲᠦ ᠰᠢᠷ᠎ᠠ ᠬᠣᠰᠢᠭᠤ # Хөвөөт Шар хошуу
172
+ expected: köbegetü sir-a qosiγu
173
+ - source: ᠦᠶᠤᠸᠠᠨ ᠰᠢᠶᠠᠨ # Үюань шянь
174
+ expected: üyuvan siyan
175
+ - source: ᠦᠴᠤᠸᠠᠨ ᠰᠢᠶᠠᠨ # Wuchuan County
176
+ expected: üčuvan siyan
177
+ - source: ᠲᠦᠴᠢᠤᠸᠠᠨ ᠰᠢᠶᠠᠨ # Тучуань шянь
178
+ expected: tüčiuvan siyan
179
+ - source: ᠯᠢᠨᠰᠢ ᠰᠢᠶᠠᠨ # Linxi County
180
+ expected: linsi siyan
181
+ - source: ᠬᠠᠷᠠᠴᠢᠨ ᠬᠣᠰᠢᠭᠤ # Harqin Banner
182
+ expected: qaračin qosiγu
183
+ - source: ᠠᠤᠬᠠᠨ ᠬᠣᠰᠢᠭᠤ # Aohan Banner
184
+ expected: auqan qosiγu
185
+ - source: ᠬᠣᠳᠣᠩ ᠠᠷᠠᠳ ᠤᠨ ᠲᠣᠭᠣᠷᠢᠭ # Huimin District
186
+ expected: qodong arad-un toγoriγ
187
+ - source: ᠰᠠᠶᠢᠬᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Saihan District
188
+ expected: sayiqan toγoriγ
189
+ - source: ᠰᠢᠨ᠎ᠡ ᠬᠣᠲᠠ ᠲᠣᠭᠣᠷᠢᠭ # Xincheng District
190
+ expected: sin-e qota toγoriγ
191
+ - source: ᠬᠠᠶᠢᠷᠤᠪ ᠤᠨ ᠲᠣᠬᠣᠢ ᠲᠣᠭᠣᠷᠢᠭ # Haibowan (Hairibin Tohoi) District
192
+ expected: qayirub-un toqoi toγoriγ
193
+ - source: ᠰᠦᠩ ᠱᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Songshan District
194
+ expected: süng šan toγoriγ
195
+ - source: ᠬᠦᠩ ᠱᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Hongshan District
196
+ expected: küng šan toγoriγ
197
+ - source: ᠠᠷᠤᠨ ᠬᠣᠰᠢᠭᠤ # Арун хошуу
198
+ expected: arun qosiγu
199
+ - source: ᠶᠤᠸᠠᠨ ᠪᠣᠣ ᠱᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Юаньбаошань тойрог
200
+ expected: yuvan boo šan toγoriγ
201
+ - source: ᠰᠢᠯᠤᠭᠤᠨ ᠬᠥᠪᠡᠭᠡᠲᠦ ᠴᠠᠭᠠᠨ ᠬᠣᠰᠢᠭᠤ # Шулуун Хөвөөт Цагаан хошуу
202
+ expected: siluγun köbegetü čaγan qosiγu
203
+ - source: ᠰᠢᠯᠤᠭᠤᠨ ᠬᠥᠬᠡ ᠬᠣᠰᠢᠭᠤ # Шулуун хөх хошуу
204
+ expected: siluγun köke qosiγu
205
+ - source: ᠤᠷᠠᠳ ᠤᠨ ᠳᠤᠮᠳᠠᠳᠤ ᠬᠣᠰᠢᠭᠤ # Урадын Дундад Хошуу
206
+ expected: urad-un dumdadu qosiγu
207
+ - source: ᠤᠷᠠᠳ ᠤᠨ ᠡᠮᠦᠨᠡᠳᠦ ᠬᠣᠰᠢᠭᠤ # Урадын Өмнөд Хошуу
208
+ expected: urad-un emünedü qosiγu
209
+ - source: ᠲᠣᠭᠲᠠᠬᠤ ᠰᠢᠶᠠᠨ # Тогтох шянь
210
+ expected: toγtaqu siyan
211
+ - source: ᠰᠥᠨᠡᠳ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # Sonid Left Banner
212
+ expected: söned ǰegün qosiγu
213
+ - source: ᠰᠥᠨᠡᠳ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # Sonid Right Banner
214
+ expected: söned baraγun qosiγu
215
+ - source: ᠣᠩᠨᠢᠭᠤᠳ ᠬᠣᠰᠢᠭᠤ # Ongniud Banner
216
+ expected: ongniγud qosiγu
217
+ - source: ᠵᠠᠯᠠᠢᠳ ᠬᠣᠰᠢᠭᠤ # Jalaid Banner
218
+ expected: ǰalaid qosiγu
219
+ - source: ᠬᠠᠩᠭᠢᠨ ᠬᠣᠶᠢᠲᠤ ᠬᠣᠰᠢᠭᠤ # Hanggin Rear Banner
220
+ expected: qangγin qoyitu qosiγu
221
+ - source: ᠵᠡᠭᠦᠨ ᠤᠵᠤᠮᠤᠴᠢᠨ ᠬᠣᠰᠢᠭᠤ # East Ujimqin Banner
222
+ expected: ǰegün uǰumučin qosiγu
223
+ - source: ᠠᠷᠤ ᠬᠣᠷᠴᠢᠨ ᠬᠣᠰᠢᠭᠤ # Ar Horqin Banner
224
+ expected: aru qorčin qosiγu
225
+ - source: ᠠᠪᠠᠭ᠎ᠠ ᠬᠣᠰᠢᠭᠤ # Abag Banner
226
+ expected: abaγ-a qosiγu
227
+ - source: ᠪᠤᠷᠢᠶᠠᠳ
228
+ expected: buriyad # Буриад
229
+ - source: ᠤᠯᠠᠭᠠᠨᠪᠠᠭᠠᠲᠤᠷ # Улаанбаатар
230
+ expected: ulaγanbaγatur
231
+ - source: ᠴᠢᠩᠭᠢᠰ ᠬᠠᠭᠠᠨ # Чингис Хаан
232
+ expected: čingγis qaγan
233
+
234
+ map:
235
+ rules:
236
+ - pattern: \u182c(\u1821|u1822|\u1825|\u1826)
237
+ result: "k\\1"
238
+ - pattern: \u182d(\u1821|u1822|\u1825|\u1826)
239
+ result: "g\\1"
240
+
241
+ characters:
242
+ "ᠠ": "a" # \u1820
243
+ "ᠡ": "e" # \u1821
244
+ "ᠢ": "i" # \u1822
245
+ "ᠣ": "o" # \u1823
246
+ "ᠤ": "u" # \u1824
247
+ "ᠥ": "ö" # \u1825
248
+ "ᠦ": "ü" # \u1826
249
+ "ᠨ": "n" # \u1828
250
+ "ᠩ": "ng" # \u1829
251
+ "ᠬ": "q" # \u182c
252
+ "ᠭ": "γ" # \u182d
253
+ "ᠪ": "b" # \u182a
254
+ "ᠫ": "p" # \u182b
255
+ "ᠹ": "f" # \u1839
256
+ "ᠰ": "s" # \u1830
257
+ "ᠱ": "š" # \u1831
258
+ "ᠲ": "t" # \u1832
259
+ "ᠳ": "d" # \u1833
260
+ "ᠯ": "l" # \u182f
261
+ "ᠮ": "m" # \u182e
262
+ "ᠴ": "č" # \u1834
263
+ "ᠵ": "ǰ" # \u1835
264
+ "ᠶ": "y" # \u1836
265
+ "ᠺ": "k" # \u183a
266
+ "ᠷ": "r" # \u1837
267
+ "ᠸ": "v" # \u1838
268
+ "ᠾ": "h" # \u183e
269
+ "᠁": "..." # \u1801
270
+ "᠂": "," # \u1802
271
+ "᠃": "." # \u1803
272
+ "᠄": ":" # \u1804
273
+ "\u180e": "-" # MVS
274
+ "\u202f": "-" # NNBSP
@@ -0,0 +1,30 @@
1
+ ---
2
+ authority_id: var
3
+ id: 1912
4
+ language: iso-639-2:pra
5
+ source_script: Deva
6
+ destination_script: Latn
7
+ name: IAST Sanskrit Devanagari System
8
+ url: https://www.ashtangayoga.info/philosophy/sanskrit-and-devanagari/transliteration/pronunciation-transliterations/
9
+ creation_date: 1912
10
+ description:
11
+ The International Alphabet of Sanskrit Transliteration (IAST) is the academic standard for the romanisation
12
+ of Sanskrit. IAST is the de facto standard used in printed publications, like books, magazines, and electronic
13
+ texts with Unicode fonts. It is based on a standard established by the Congress of Orientalists at Athens in 1912.
14
+
15
+ The International Alphabet of Sanskrit Transliteration (IAST) is a transliteration scheme that allows the lossless
16
+ romanisation of Indic scripts[citation needed] as employed by Sanskrit and related Indic languages. It is based on a
17
+ scheme that emerged during the nineteenth century from suggestions by Charles Trevelyan, William Jones, Monier
18
+ Monier-Williams and other scholars, and formalised by the Transliteration Committee of the Geneva Oriental Congress,
19
+ in September 1894. IAST makes it possible for the reader to read the Indic text unambiguously, exactly as if it were
20
+ in the original Indic script. It is this faithfulness to the original scripts that accounts for its continuing popularity
21
+ amongst scholars.
22
+
23
+ notes:
24
+
25
+ tests:
26
+ - source: "नित्यः सर्वगतः स्थाणुरचलोऽयं सनातनः"
27
+ expected: "naitayaḥ saravagataḥ sathaāṇauracalao’yaṃ sanaātanaḥ"
28
+
29
+ map:
30
+ inherit: 'var-san-Deva-Latn-iast-1912'
@@ -0,0 +1,149 @@
1
+ ---
2
+ authority_id: var
3
+ id: 1912
4
+ language: iso-639-2:san
5
+ source_script: Deva
6
+ destination_script: Latn
7
+ name: IAST Sanskrit Devanagari System
8
+ url: https://www.ashtangayoga.info/philosophy/sanskrit-and-devanagari/transliteration/pronunciation-transliterations/
9
+ creation_date: 1912
10
+ description:
11
+ The International Alphabet of Sanskrit Transliteration (IAST) is the academic standard for the romanisation
12
+ of Sanskrit. IAST is the de facto standard used in printed publications, like books, magazines, and electronic
13
+ texts with Unicode fonts. It is based on a standard established by the Congress of Orientalists at Athens in 1912.
14
+
15
+ The International Alphabet of Sanskrit Transliteration (IAST) is a transliteration scheme that allows the lossless
16
+ romanisation of Indic scripts[citation needed] as employed by Sanskrit and related Indic languages. It is based on a
17
+ scheme that emerged during the nineteenth century from suggestions by Charles Trevelyan, William Jones, Monier
18
+ Monier-Williams and other scholars, and formalised by the Transliteration Committee of the Geneva Oriental Congress,
19
+ in September 1894. IAST makes it possible for the reader to read the Indic text unambiguously, exactly as if it were
20
+ in the original Indic script. It is this faithfulness to the original scripts that accounts for its continuing popularity
21
+ amongst scholars.
22
+
23
+ notes:
24
+
25
+ tests:
26
+ - source: "पूर्णमदः पूर्णमिदं पूर्णात् पूर्ण्मुदच्यते"
27
+ expected: "paūraṇamadaḥ paūraṇamaidaṃ paūraṇaāta paūraṇamaudacayatae"
28
+ - source: "पूर्णस्य पूर्णमादाय पूर्णमेवावशिष्यते"
29
+ expected: "paūraṇasaya paūraṇamaādaāya paūraṇamaevaāvaśaiṣayatae"
30
+ - source: "यथा चतुर्भिः कनकं परीक्ष्यते निर्घषणच्छेदन तापताडनैः"
31
+ expected: "yathaā cataurabhaiḥ kanakaṃ paraīkaṣayatae nairaghaṣaṇacachaedana taāpataāḍanaaiḥ"
32
+ - source: "तथा चतुर्भिः पुरुषः परीक्ष्यते त्यागेन शीलेन गुणेन कर्मणा"
33
+ expected: "tathaā cataurabhaiḥ paurauṣaḥ paraīkaṣayatae tayaāgaena śaīlaena gauṇaena karamaṇaā"
34
+ - source: "यो न हृष्यति न द्वेष्टि न शोचति न काङ्‍क्षति"
35
+ expected: "yao na haṛṣayatai na davaeṣaṭai na śaocatai na kaāṅakaṣatai"
36
+ - source: "शुभाशुभपरित्यागी भक्तिमान्यः स मे प्रियः"
37
+ expected: "śaubhaāśaubhaparaitayaāgaī bhakataimaānayaḥ sa mae paraiyaḥ"
38
+ - source: "सत्य -सत्यमेवेश्वरो लोके सत्ये धर्मः सदाश्रितः"
39
+ expected: "sataya -satayamaevaeśavarao laokae satayae dharamaḥ sadaāśaraitaḥ"
40
+ - source: "सत्यमूलनि सर्वाणि सत्यान्नास्ति परं पदम्"
41
+ expected: "satayamaūlanai saravaāṇai satayaānanaāsatai paraṃ padama"
42
+ - source: "पिता माताग्निरात्मा च गुरुश्च भरतर्षभ"
43
+ expected: "paitaā maātaāganairaātamaā ca gaurauśaca bharataraṣabha"
44
+ - source: "अच्छेद्योऽयमदाह्योऽयमक्लेद्योऽशोष्य एव च "
45
+ expected: "acachaedayao’yamadaāhayao’yamakalaedayao’śaoṣaya eva ca "
46
+
47
+ map:
48
+
49
+ characters:
50
+
51
+ # I. Vowels and Diphthongs (see Note 1)
52
+
53
+ 'अ': 'a'
54
+ 'आ': 'ā'
55
+ 'इ': 'i'
56
+ 'ई': 'ī'
57
+ 'उ': 'u'
58
+ 'ऊ': 'ū'
59
+ 'ऋ': 'ṛ'
60
+ 'ॠ': 'ṝ'
61
+ 'ऌ': 'ḷ'
62
+ 'ॡ': 'ḹ'
63
+ 'ए': 'e'
64
+ 'ऐ': 'ai'
65
+ 'ओ': 'o'
66
+ 'औ': 'au'
67
+
68
+ # II. Consonants (see Note 2)
69
+ # Gutturals
70
+ 'क': 'ka'
71
+ 'ख': 'kha'
72
+ 'ग': 'ga'
73
+ 'घ': 'gha'
74
+ 'ङ': 'ṅa'
75
+
76
+ # Palatals
77
+ 'च': 'ca'
78
+ 'छ': 'cha'
79
+ 'ज': 'ja'
80
+ 'झ': 'jha'
81
+ 'ञ': 'ña'
82
+
83
+ # Cerebrals
84
+ 'ट': 'ṭa'
85
+ 'ठ': 'ṭha'
86
+ 'ड': 'ḍa'
87
+ 'ढ': 'ḍha'
88
+ 'ण': 'ṇa'
89
+
90
+ # Dentals
91
+ 'त': 'ta'
92
+ 'थ': 'tha'
93
+ 'द': 'da'
94
+ 'ध': 'dha'
95
+ 'न': 'na'
96
+
97
+ # Labials
98
+ 'प': 'pa'
99
+ 'फ': 'pha'
100
+ 'ब': 'ba'
101
+ 'भ': 'bha'
102
+ 'म': 'ma'
103
+
104
+ # Semivowels
105
+ 'य': 'ya'
106
+ 'र': 'ra'
107
+ 'ल': 'la'
108
+ 'व': 'va'
109
+
110
+ # Sibilants
111
+ 'श': 'śa'
112
+ 'ष': 'ṣa'
113
+ 'स': 'sa'
114
+
115
+ # Aspirate
116
+ 'ह': 'ha'
117
+
118
+ # Anusvāra
119
+ 'ं': 'ṃ'
120
+ 'अं': 'ṃ'
121
+
122
+ # Visarga
123
+ 'ः': 'ḥ'
124
+ 'अः': 'ḥ'
125
+
126
+ # Anunāsika
127
+ 'ँ': 'm̐'
128
+ 'अँ': 'm̐'
129
+
130
+ # Avagraha
131
+ 'ऽ': '’' # (apostrophe)
132
+
133
+
134
+ # Medials # Needed for connecting consonants
135
+ 'ा': "ā"
136
+ 'ि': "i"
137
+ 'ी': "ī"
138
+ 'ु': "u"
139
+ 'ू': "ū"
140
+ 'ृ': "ṛ"
141
+ 'ॄ': "ṝ"
142
+ 'ॢ': "ḷ"
143
+ 'ॣ': "ḹ"
144
+ 'े': "e"
145
+ 'ै': "ai"
146
+ 'ो': "o"
147
+ 'ौ': "au"
148
+ '्': ""
149
+ '‍': ''# Used for joining