interscript 0.1.2 → 0.1.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (261) hide show
  1. checksums.yaml +4 -4
  2. data/README.adoc +250 -17
  3. data/lib/g2pwrapper.py +34 -0
  4. data/lib/interscript.rb +142 -20
  5. data/lib/interscript/command.rb +28 -0
  6. data/lib/interscript/fs.rb +69 -0
  7. data/lib/interscript/mapping.rb +142 -0
  8. data/lib/interscript/opal.rb +57 -0
  9. data/lib/interscript/opal/entrypoint.rb +12 -0
  10. data/lib/interscript/opal/map_translate.rb +7 -0
  11. data/lib/interscript/opal/maps.js.erb +10 -0
  12. data/lib/interscript/version.rb +1 -1
  13. data/lib/model-7 +0 -0
  14. data/lib/tha-pt-b-7 +0 -0
  15. data/maps/acadsin-zho-Hani-Latn-2002.yaml +38916 -0
  16. data/maps/alalc-amh-Ethi-Latn-1997.yaml +513 -0
  17. data/maps/alalc-amh-Ethi-Latn-2011.yaml +138 -0
  18. data/maps/alalc-ara-Arab-Latn-1997.yaml +1287 -0
  19. data/maps/alalc-asm-Deva-Latn-1997.yaml +165 -0
  20. data/maps/alalc-asm-Deva-Latn-2012.yaml +40 -0
  21. data/maps/alalc-aze-Cyrl-Latn-1997.yaml +145 -0
  22. data/maps/alalc-bel-Cyrl-Latn-1997.yaml +129 -0
  23. data/maps/alalc-ben-Beng-Latn-2017.yaml +130 -0
  24. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +98 -0
  25. data/maps/alalc-ell-Grek-Latn-1997.yaml +628 -0
  26. data/maps/alalc-ell-Grek-Latn-2010.yaml +626 -0
  27. data/maps/alalc-guj-Gujr-Latn-1997.yaml +266 -0
  28. data/maps/alalc-guj-Gujr-Latn-2011.yaml +64 -0
  29. data/maps/alalc-hin-Deva-Latn-1997.yaml +211 -0
  30. data/maps/alalc-hin-Deva-Latn-2011.yaml +47 -0
  31. data/maps/alalc-kat-Geok-Latn-1997.yaml +111 -0
  32. data/maps/alalc-kat-Geor-Latn-1997.yaml +150 -0
  33. data/maps/alalc-kor-Hang-Latn-1997.yaml +98 -0
  34. data/maps/alalc-mal-Mlym-Latn-1997.yaml +303 -0
  35. data/maps/alalc-mal-Mlym-Latn-2012.yaml +73 -0
  36. data/maps/alalc-mar-Deva-Latn-1997.yaml +189 -0
  37. data/maps/alalc-mar-Deva-Latn-2011.yaml +45 -0
  38. data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +114 -0
  39. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +103 -0
  40. data/maps/alalc-mon-Cyrl-Latn-1997.yaml +220 -0
  41. data/maps/alalc-pan-Guru-Latn-1997.yaml +256 -0
  42. data/maps/alalc-pan-Guru-Latn-2011.yaml +78 -0
  43. data/maps/alalc-per-Arab-Latn-1997.yaml +375 -0
  44. data/maps/alalc-pli-Deva-Latn-2012.yaml +144 -0
  45. data/maps/alalc-pra-Deva-Latn-2012.yaml +47 -0
  46. data/maps/alalc-rus-Cyrl-Latn-1997.yaml +225 -0
  47. data/maps/alalc-rus-Cyrl-Latn-2012.yaml +162 -0
  48. data/maps/alalc-san-Deva-Latn-2012.yaml +172 -0
  49. data/maps/alalc-sin-Sinh-Latn-1997.yaml +292 -0
  50. data/maps/alalc-sin-Sinh-Latn-2011.yaml +71 -0
  51. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +118 -0
  52. data/maps/alalc-srp-Cyrl-Latn-2013.yaml +135 -0
  53. data/maps/alalc-tam-Taml-Latn-1997.yaml +62 -0
  54. data/maps/alalc-tam-Taml-Latn-2011.yaml +58 -0
  55. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +145 -0
  56. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +16 -0
  57. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +283 -0
  58. data/maps/{bas-rus-Cyrl-Latn-bss.yaml → bas-rus-Cyrl-Latn-2017-bss.yaml} +58 -33
  59. data/maps/{bas-rus-Cyrl-Latn-oss.yaml → bas-rus-Cyrl-Latn-2017-oss.yaml} +55 -35
  60. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +292 -0
  61. data/maps/bgn-kor-Hang-Latn-1943.yaml +35 -0
  62. data/maps/bgn-kor-Kore-Latn-1943.yaml +31 -0
  63. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +208 -0
  64. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +208 -0
  65. data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +532 -0
  66. data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +596 -0
  67. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +2 -3
  68. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +104 -0
  69. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +188 -0
  70. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +289 -0
  71. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +119 -0
  72. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +15 -65
  73. data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +184 -0
  74. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +705 -0
  75. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +23 -0
  76. data/maps/{bgnpcgn-per-Arab-Latn-1956.yaml → bgnpcgn-fas-Arab-Latn-1956.yaml} +5 -2
  77. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +257 -0
  78. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +131 -0
  79. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +42 -0
  80. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +253 -0
  81. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +48 -0
  82. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +48 -0
  83. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +163 -0
  84. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +190 -0
  85. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +223 -0
  86. data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +230 -0
  87. data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +336 -0
  88. data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +639 -0
  89. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +459 -0
  90. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +168 -0
  91. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +150 -65
  92. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +170 -0
  93. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +220 -0
  94. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +240 -0
  95. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +80 -4
  96. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +119 -0
  97. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +127 -0
  98. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +82 -0
  99. data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +7456 -0
  100. data/maps/bis-asm-Beng-Latn-13194-1991.yaml +159 -0
  101. data/maps/bis-ben-Beng-Latn-13194-1991.yaml +156 -0
  102. data/maps/bis-dev-Deva-Latn-13194-1991.yaml +184 -0
  103. data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +181 -0
  104. data/maps/bis-knd-Knda-Latn-13194-1991.yaml +173 -0
  105. data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +176 -0
  106. data/maps/bis-ori-Orya-Latn-13194-1991.yaml +160 -0
  107. data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +175 -0
  108. data/maps/bis-tel-Telu-Latn-13194-1991.yaml +170 -0
  109. data/maps/bis-tml-Taml-Latn-13194-1991.yaml +155 -0
  110. data/maps/by-bel-Cyrl-Latn-1998.yaml +172 -0
  111. data/maps/by-bel-Cyrl-Latn-2007.yaml +115 -0
  112. data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +899 -0
  113. data/maps/din-hin-Deva-Latn-33904-2018.yaml +100 -0
  114. data/maps/din-kat-Geor-Latn-32707-2010.yaml +145 -0
  115. data/maps/din-mar-Deva-Latn-33904-2018.yaml +84 -0
  116. data/maps/din-nep-Deva-Latn-33904-2018.yaml +119 -0
  117. data/maps/din-pli-Deva-Latn-33904-2018.yaml +75 -0
  118. data/maps/din-pra-Deva-Latn-33904-2018.yaml +63 -0
  119. data/maps/din-san-Deva-Latn-33904-2018.yaml +338 -0
  120. data/maps/din-tam-Taml-Latn-33903-2016.yaml +213 -0
  121. data/maps/dos-nep-Deva-Latn-1997.yaml +47 -0
  122. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +684 -0
  123. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +680 -0
  124. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +19 -0
  125. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +31 -0
  126. data/maps/ggg-kat-Geor-Latn-2002.yaml +92 -0
  127. data/maps/gki-bel-Cyrl-Latn-1992.yaml +33 -0
  128. data/maps/gki-bel-Cyrl-Latn-2000.yaml +201 -0
  129. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +190 -0
  130. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +157 -0
  131. data/maps/hk-yue-Hani-Latn-1888.yaml +38497 -0
  132. data/maps/icao-bel-Cyrl-Latn-9303.yaml +109 -98
  133. data/maps/icao-bul-Cyrl-Latn-9303.yaml +2 -7
  134. data/maps/{icao-per-Arab-Latn-9303.yaml → icao-fas-Arab-Latn-9303.yaml} +6 -8
  135. data/maps/icao-heb-Hebr-Latn-9303.yaml +119 -125
  136. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +2 -3
  137. data/maps/icao-rus-Cyrl-Latn-9303.yaml +2 -4
  138. data/maps/icao-srp-Cyrl-Latn-9303.yaml +2 -3
  139. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +2 -4
  140. data/maps/iso-ara-Arab-Latn-233-1984.yaml +323 -0
  141. data/maps/iso-asm-Beng-Latn-15919-2001.yaml +75 -0
  142. data/maps/iso-ben-Beng-Latn-15919-2001.yaml +175 -0
  143. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +613 -0
  144. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +44 -0
  145. data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +220 -0
  146. data/maps/iso-hin-Deva-Latn-15919-2001.yaml +87 -0
  147. data/maps/iso-inc-Deva-Latn-15919-2001.yaml +61 -0
  148. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +66 -0
  149. data/maps/iso-kan-Knda-Latn-15919-2001.yaml +220 -0
  150. data/maps/iso-kat-Geor-Latn-9984-1996.yaml +145 -0
  151. data/maps/iso-kor-Hang-Latn-1996-method1.yaml +240 -0
  152. data/maps/iso-kor-Hang-Latn-1996-method2.yaml +226 -0
  153. data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +281 -0
  154. data/maps/iso-mar-Deva-Latn-15919-2001.yaml +75 -0
  155. data/maps/iso-nep-Deva-Latn-15919-2001.yaml +87 -0
  156. data/maps/iso-ori-Orya-Latn-15919-2001.yaml +193 -0
  157. data/maps/iso-pan-Guru-Latn-15919-2001.yaml +222 -0
  158. data/maps/iso-pli-Beng-Latn-15919-2001.yaml +73 -0
  159. data/maps/iso-pli-Deva-Latn-15919-2001.yaml +74 -0
  160. data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +219 -0
  161. data/maps/iso-pli-Thai-Latn-15919-2001.yaml +55 -0
  162. data/maps/iso-pra-Deva-Latn-15919-2001.yaml +59 -0
  163. data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +366 -0
  164. data/maps/{iso-rus-Cyrl-Latn-iso9.yaml → iso-rus-Cyrl-Latn-9-1995.yaml} +4 -6
  165. data/maps/iso-san-Deva-Latn-15919-2001.yaml +220 -0
  166. data/maps/iso-tam-Taml-Latn-15919-2001.yaml +159 -0
  167. data/maps/iso-tel-Telu-Latn-15919-2001.yaml +220 -0
  168. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +109 -0
  169. data/maps/kp-kor-Hang-Latn-2002.yaml +909 -0
  170. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +44820 -0
  171. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +411 -0
  172. data/maps/mns-mon-Cyrl-Latn-5217-2012.yaml +163 -0
  173. data/maps/mns-mon-Latn-Cyrl-5217-2012.yaml +200 -0
  174. data/maps/moct-kor-Hang-Latn-2000.yaml +807 -0
  175. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +541 -0
  176. data/maps/mvd-bel-Cyrl-Latn-2008.yaml +225 -0
  177. data/maps/mvd-bel-Cyrl-Latn-2010.yaml +63 -0
  178. data/maps/mvd-rus-Cyrl-Latn-2008.yaml +109 -0
  179. data/maps/mvd-rus-Cyrl-Latn-2010.yaml +37 -0
  180. data/maps/odni-ara-Arab-Latn-2015.yaml +425 -0
  181. data/maps/odni-aze-Cyrl-Latn-2015.yaml +144 -0
  182. data/maps/odni-bel-Cyrl-Latn-2015.yaml +148 -0
  183. data/maps/odni-bul-Cyrl-Latn-2015.yaml +96 -0
  184. data/maps/odni-che-Cyrl-Latn-2015.yaml +169 -0
  185. data/maps/odni-fas-Arab-Latn-2015.yaml +406 -0
  186. data/maps/odni-hin-Deva-Latn-2015.yaml +258 -0
  187. data/maps/odni-kat-Geor-Latn-2015.yaml +87 -0
  188. data/maps/odni-kaz-Cyrl-Latn-2015.yaml +148 -0
  189. data/maps/odni-kir-Cyrl-Latn-2015.yaml +136 -0
  190. data/maps/odni-kor-Hang-Latn-2015.yaml +375 -0
  191. data/maps/odni-mkd-Cyrl-Latn-2015.yaml +122 -0
  192. data/maps/odni-per-Arab-Latn-2015.yaml +228 -0
  193. data/maps/odni-rus-Cyrl-Latn-2015.yaml +77 -0
  194. data/maps/odni-srp-Cyrl-Latn-2015.yaml +129 -0
  195. data/maps/odni-tat-Cyrl-Latn-2015.yaml +142 -0
  196. data/maps/odni-tgk-Cyrl-Latn-2015.yaml +148 -0
  197. data/maps/odni-uig-Cyrl-Latn-2015.yaml +138 -0
  198. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +157 -0
  199. data/maps/odni-urd-Arab-Latn-2015.yaml +221 -0
  200. data/maps/odni-uzb-Cyrl-Latn-2015.yaml +166 -0
  201. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +90 -0
  202. data/maps/royin-tha-Thai-Latn-1968.yaml +183 -0
  203. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +180 -0
  204. data/maps/royin-tha-Thai-Latn-1999.yaml +80 -0
  205. data/maps/{cn-chn-Hans-Latn-pinyin.yaml → sac-zho-Hans-Latn-1979.yaml} +11 -8
  206. data/maps/sasm-mon-Mong-Latn-general-1978.yaml +389 -0
  207. data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +354 -0
  208. data/maps/ses-ara-Arab-Latn-1930.yaml +283 -0
  209. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +222 -0
  210. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +197 -0
  211. data/maps/ua-ukr-Cyrl-Latn-2007.yaml +75 -0
  212. data/maps/ua-ukr-Cyrl-Latn-2010.yaml +192 -0
  213. data/maps/un-amh-Ethi-Latn-2016.yaml +602 -0
  214. data/maps/un-ara-Arab-Latn-1971.yaml +139 -0
  215. data/maps/un-ara-Arab-Latn-1972.yaml +159 -0
  216. data/maps/un-ara-Arab-Latn-2017.yaml +420 -0
  217. data/maps/un-bel-Cyrl-Latn-2007.yaml +114 -0
  218. data/maps/un-ben-Beng-Latn-2016.yaml +534 -0
  219. data/maps/un-ell-Grek-Latn-1987-phonetic.yaml +780 -0
  220. data/maps/un-ell-Grek-Latn-1987-tl.yaml +31 -0
  221. data/maps/un-ell-Grek-Latn-1987-ts.yaml +19 -0
  222. data/maps/un-hin-Deva-Latn-2016.yaml +222 -0
  223. data/maps/un-mar-Deva-Latn-2016.yaml +91 -0
  224. data/maps/un-mon-Mong-Latn-general-2013.yaml +264 -0
  225. data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +264 -0
  226. data/maps/un-nep-Deva-Latn-1972.yaml +350 -0
  227. data/maps/un-nep-Deva-Latn-2013.yaml +74 -0
  228. data/maps/un-rus-Cyrl-Latn-1987.yaml +166 -0
  229. data/maps/un-ukr-Cyrl-Latn-1998.yaml +53 -0
  230. data/maps/un-ukr-Cyrl-Latn-2012.yaml +162 -0
  231. data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +221 -0
  232. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +406 -0
  233. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +386 -0
  234. data/maps/var-kor-Hang-Hang-jamo.yaml +11193 -0
  235. data/maps/var-kor-Hang-Latn-mr-1939.yaml +1054 -0
  236. data/maps/var-kor-Kore-Hang-2013.yaml +59754 -0
  237. data/maps/var-kor-Kore-Latn-mr-1939.yaml +36 -0
  238. data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +43 -0
  239. data/maps/var-mon-Mong-Latn-1930.yaml +102 -0
  240. data/maps/var-mon-Mong-Latn-lessing.yaml +272 -0
  241. data/maps/var-mon-Mong-Latn-vpmc.yaml +274 -0
  242. data/maps/var-pra-Deva-Latn-iast-1912.yaml +30 -0
  243. data/maps/var-san-Deva-Latn-iast-1912.yaml +149 -0
  244. data/maps/var-tha-Thai-Thai-phonemic.yaml +59 -0
  245. data/maps/var-tha-Thai-Zsym-ipa.yaml +301 -0
  246. data/maps/var-zho-Hani-Latn-wd-1979.yaml +38912 -0
  247. data/spec/interscript/filenames_spec.rb +384 -0
  248. data/spec/interscript/mapping_spec.rb +42 -0
  249. data/spec/interscript_spec.rb +23 -5
  250. data/spec/spec_helper.rb +3 -1
  251. metadata +364 -34
  252. data/bin/interscript +0 -20
  253. data/bin/rspec +0 -29
  254. data/maps/bgnpcgn-chn-Hans-Latn-pinyin.yaml +0 -7503
  255. data/maps/historic-jpn-Hrkt-Latn-hepburn.yaml +0 -336
  256. data/maps/icao-gre-Grek-Latn-9303.yaml +0 -101
  257. data/maps/mext-jpn-Hrkt-Latn-hepburn.yaml +0 -330
  258. data/maps/mext-jpn-Hrkt-Latn-kunrei.yaml +0 -308
  259. data/maps/un-jpn-Hrkt-Latn-hepburn.yaml +0 -313
  260. data/maps/un-jpn-Hrkt-Latn-kunrei.yaml +0 -354
  261. data/maps/un-mon-Mong-Latn-2013.yaml +0 -80
@@ -0,0 +1,264 @@
1
+ ---
2
+ authority_id: un
3
+ id: phonetic-2013
4
+ language: iso-639-2:mon
5
+ source_script: Mong
6
+ destination_script: Latn
7
+ name: Mongolian Romanization in China, Version 4.0 (phonetic)
8
+ url: http://www.eki.ee/wgrs/rom1_mnc.htm
9
+ creation_date: 2013-09
10
+ description: |
11
+ The United Nations resolution III/8 in 1977 recognized the Scheme for
12
+ a Chinese Phonetic Alphabet (Pinyin) as China’s official Roman alphabet
13
+ scheme and recommended the alphabet as the international system for the
14
+ romanization of Chinese geographical names. In China Mongolian
15
+ geographical names are transcribed directly from the Mongolian script
16
+ into Pinyin. The scheme was published in Toponymic Guidelines for Map
17
+ and Other Editors: China, 1982.
18
+
19
+ The system is used in China and in international cartographic
20
+ products.
21
+
22
+ Mongolian uses a vertical script. Transcription of Mongolian names is
23
+ made from their proper pronunciation based on the written form of the
24
+ Mongolian language and Qahar vernacular, with Zhenglan as its
25
+ representative pronunciation. Due to the complex nature of the script
26
+ the romanization scheme is not reversible, e.g. the name of the city
27
+ Hohhot is written ᠬᠥᠬᠡᠬᠣᠲᠠ but may be transliterated as kökeqota.
28
+
29
+ notes:
30
+ - The long and short Mongolian vowels are not distinguished in the
31
+ spelling for general use, but in recording the pronunciation of
32
+ place-names, the long vowel is represented by duplication.
33
+ - Where two Roman equivalents are given, the second (in brackets) is
34
+ used for recording the pronunciation of place-names while the first
35
+ form is for general use.
36
+ - In the table only word-initial character variants are shown.
37
+ Depending on the position in the word many variants of the characters
38
+ are used as well as some ligatures. These features are not covered here.
39
+ - For technical reasons the characters of the Mongolian script are
40
+ turned 90° anti-clockwise.
41
+
42
+ implementation_notes:
43
+ - A separated final form of vowels a or e is common, and can appear at the end
44
+ of a word, word stem, or suffix. This form requires a final-shaped preceding
45
+ consonant and an inter-word gap in between. The vowels themselves appear as ᠎ᠠ,
46
+ and with consonants as ‍ᠬ᠎ᠠ q‑a, ‍ᠷ᠎ᠠ r‑a/r‑e, etc. This gap can be transliterated
47
+ with a hyphen. In digital typesetting, these forms are triggered by inserting
48
+ a U+180E ᠎ MONGOLIAN VOWEL SEPARATOR (HTML &#6158; · MVS) between the consonant
49
+ and vowel.
50
+ - All case suffixes, as well as any plural suffixes consisting of one or two
51
+ syllables, are likewise separated by a preceding and hyphen-transliterated gap.
52
+ In digital typesetting, this gap is represented by a U+202F   NARROW NO-BREAK SPACE
53
+ (HTML &#8239; · NNBSP). A maximum of two case suffixes can be added to a stem.
54
+ Single-letter vowel suffixes appear with the final-shaped forms of a/e, i, or u/ü,
55
+ as in ᠭᠠᠵᠠᠷ ᠠ γaǰar‑a 'to the country' and ᠡᠳᠦᠷ ᠡ edür‑e 'on the day', or ᠤᠯᠤᠰ ᠢ ulus‑i
56
+ 'the state' etc. Multi-letter suffixes most often start with an initial- (consonants),
57
+ medial- (vowels), or variant-shaped form.
58
+
59
+ tests:
60
+ - source: ᠣᠷᠳᠣᠰ ᠬᠣᠲᠠ # Ордос хот
61
+ expected: ôrdôs hôta
62
+ - source: ᠪᠠᠶᠠᠨᠨᠠᠭᠤᠷ ᠬᠣᠲᠠ # Баяннуур хот
63
+ expected: bayannagûr hôta
64
+ - source: ᠤᠯᠠᠭᠠᠨᠬᠣᠲᠠ # Улаан хот
65
+ expected: ûlaganhôta
66
+ - source: ᠬᠣᠣᠯᠢᠠ ᠭᠣᠤᠯ ᠬᠣᠲᠠ # Хоолингол хот
67
+ expected: hôôlia gôûl hôta
68
+ - source: ᠡᠷᠢᠶᠡᠨ ᠬᠣᠲᠠ # Эрээн хот
69
+ expected: eriyen hôta
70
+ - source: ᠷᠠᠰᠢᠶᠠᠨ ᠬᠣᠲᠠ # Рашаан хот
71
+ expected: rasiyan hôta
72
+ - source: ᠪᠠᠭᠠᠷᠢᠨ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # Баарин баруун хошуу
73
+ expected: bagarin baragûn hôsigû
74
+ - source: ᠪᠠᠭᠠᠷᠢᠨ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # Баарин зүүн хошуу
75
+ expected: bagarin jegun hôsigû
76
+ - source: ᠲᠦᠩᠯᠢᠶᠣᠤ ᠬᠣᠲᠠ # Байшинт хот
77
+ expected: tungliyôû hôta
78
+ - source: ᠰᠢᠯᠢ ᠶᠢᠨ ᠬᠣᠲᠠ # Шилийн хот
79
+ expected: sili-yin hôta
80
+ - source: ᠬᠣᠷᠢᠨ ᠭᠡᠷ ᠰᠢᠶᠠᠨ # Horinger County
81
+ expected: hôrin ger siyan
82
+ - source: ᠤᠳᠠ ᠲᠣᠭᠣᠷᠢᠭ # Уда тойрог
83
+ expected: ûda tôgôrig
84
+ - source: ᠦᠬᠠᠢ ᠬᠣᠲᠠ # Үхай хот
85
+ expected: uhai hôta
86
+ - source: ᠬᠠᠶᠢᠨᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Hainan District
87
+ expected: hayinan tôgôrig
88
+ - source: ᠬᠠᠶᠢᠷᠤᠪ ᠤᠨ ᠲᠣᠬᠣᠢ ᠲᠣᠭᠣᠷᠢᠭ # Haibowan District
89
+ expected: hayirûb-ûn tôhôi tôgôrig
90
+ - source: ᠤᠯᠠᠭᠠᠨᠴᠠᠪ ᠬᠣᠲᠠ # Улаанцав хот
91
+ expected: ûlaganqab hôta
92
+ - source: ᠵᠢᠨᠢᠩ ᠲᠣᠭᠣᠷᠢᠭ # Жинин тойрог
93
+ expected: jining tôgôrig
94
+ - source: ᠹᠸᠩᠵᠸᠡ ᠬᠣᠲᠠ # Фенжень хот
95
+ expected: fwngjwe hôta
96
+ - source: ᠵᠦᠸᠧᠽᠢ ᠰᠢᠶᠠᠨ # Zhuozi County
97
+ expected: juwezi siyan
98
+ - source: ᠬᠤᠸᠠᠳᠧ ᠰᠢᠶᠠᠨ # Huade County
99
+ expected: hûwade siyan
100
+ - source: ᠱᠠᠩᠳᠤ ᠰᠢᠶᠠᠨ # Шанду шянь
101
+ expected: xangdû siyan
102
+ - source: ᠰᠢᠩᠾᠧ ᠰᠢᠶᠠᠨ # Шинхэ шянь
103
+ expected: singhe siyan
104
+ - source: ᠯᠢᠶᠠᠩᠴᠠᠩ ᠰᠢᠶᠠᠨ # Liangcheng County
105
+ expected: liyangqang siyan
106
+ - source: ᠴᠠᠬᠠᠷ ᠪᠠᠷᠠᠭᠤᠨ ᠭᠠᠷᠤᠨ ᠡᠮᠦᠨᠡᠳᠦ ᠬᠣᠰᠢᠭᠤ # Цахар баруун гарын өмнөд хошуу
107
+ expected: qahar baragûn garûn emunedu hôsigû
108
+ - source: ᠴᠠᠬᠠᠷ ᠪᠠᠷᠠᠭᠤᠨ ᠭᠠᠷᠤᠨ ᠳᠤᠮᠳᠠᠳᠤ ᠬᠣᠰᠢᠭᠤ # Цахар баруун гарын дундад хошуу
109
+ expected: qahar baragûn garûn dûmdadû hôsigû
110
+ - source: ᠴᠠᠬᠠᠷ ᠪᠠᠷᠠᠭᠤᠨ ᠭᠠᠷᠤᠨ ᠬᠣᠶᠢᠲᠤ ᠬᠣᠰᠢᠭᠤ # Цахар баруун гарын хойд хошуу
111
+ expected: qahar baragûn garûn hôyitû hôsigû
112
+ - source: ᠳᠥᠷᠪᠡᠳ ᠬᠣᠰᠢᠭᠤ # Дөрвөд хошуу
113
+ expected: dorbed hôsigû
114
+ - source: ᠪᠤᠭᠤᠲᠤ ᠬᠣᠲᠠ # Бугaт хот
115
+ expected: bûgûtû hôta
116
+ - source: ᠬᠥᠨᠳᠡᠯᠡᠨ ᠲᠣᠭᠣᠷᠢᠭ # Hondlon District
117
+ expected: hondelen tôgôrig
118
+ - source: ᠳᠦᠩᠾᠧ ᠲᠣᠭᠣᠷᠢᠭ # Donghe District
119
+ expected: dunghe tôgôrig
120
+ - source: ᠴᠢᠩᠱᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Qingshan District
121
+ expected: qingxan tôgôrig
122
+ - source: ᠰᠢᠭᠤᠶᠢᠲᠤ ᠲᠣᠭᠣᠷᠢᠭ # Шигуай тойрог
123
+ expected: sigûyitû tôgôrig
124
+ - source: ᠵᠢᠦ ᠶᠤᠸᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Jiuyuan District
125
+ expected: jiu yûwan tôgôrig
126
+ - source: ᠭᠦᠶᠠᠩ ᠰᠢᠶᠠᠨ # Guyang County
127
+ expected: guyang siyan
128
+ - source: ᠲᠦᠮᠡᠳ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # Түмэд Зүүн хошуу
129
+ expected: tumed jegun hôsigû
130
+ - source: ᠲᠦᠮᠡᠳ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # Түмэд Баруун хошуу
131
+ expected: tumed baragûn hôsigû
132
+ - source: ᠳᠠᠷᠬᠠᠨ ᠮᠤᠤᠮᠢᠩᠭ᠋ᠠᠨ ᠬᠣᠯᠪᠣᠭᠠᠲᠤ ᠬᠣᠰᠢᠭᠤ # Darhan Muminggan United Banner
133
+ expected: darhan mûûmingg᠋an hôlbôgatû hôsigû
134
+ - source: ᠬᠡᠰᠢᠭᠲᠡᠨ ᠬᠣᠰᠢᠭᠤ # Hexigten Banner
135
+ expected: hesigten hôsigû
136
+ - source: ᠰᠢᠨ᠎ᠡ ᠪᠠᠷᠭᠤ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # New Barag Left Banner
137
+ expected: sin-e bargû jegun hôsigû
138
+ - source: ᠰᠢᠨ᠎ᠡ ᠪᠠᠷᠭᠤ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # New Barag Right Banner
139
+ expected: sin-e bargû baragûn hôsigû
140
+ - source: ᠣᠲᠣᠭ ᠬᠣᠰᠢᠭᠤ # Otog Banner
141
+ expected: ôtôg hôsigû
142
+ - source: ᠳ᠋ᠦᠩᠱᠧᠩ ᠲᠣᠭᠣᠷᠢᠭ # Dongsheng District
143
+ expected: d᠋ungxeng tôgôrig
144
+ - source: ᠳᠠᠯᠠᠳ ᠬᠣᠰᠢᠭᠤ # Dalad Banner
145
+ expected: dalad hôsigû
146
+ - source: ᠵᠡᠭᠦᠨᠭᠠᠷ ᠬᠣᠰᠢᠭᠤ # Jungar Banner
147
+ expected: jegungar hôsigû
148
+ - source: ᠣᠲᠣᠭ ᠤᠨ ᠡᠮᠦᠨᠡᠳᠦ ᠬᠣᠰᠢᠭᠤ # Otog Front Banner
149
+ expected: ôtôg-ûn emunedu hôsigû
150
+ - source: ᠬᠠᠩᠭᠢᠨ ᠬᠣᠰᠢᠭᠤ # Hanggin Banner
151
+ expected: hanggin hôsigû
152
+ - source: ᠦᠦᠰᠢᠨ ᠬᠣᠰᠢᠭᠤ # Uxin Banner
153
+ expected: uusin hôsigû
154
+ - source: ᠡᠵᠢᠨ ᠬᠣᠷᠣᠭ᠎ᠠ ᠬᠣᠰᠢᠭᠤ # Эзэн Хороо хошуу
155
+ expected: ejin hôrôg-a hôsigû
156
+ - source: ᠵᠠᠯᠠᠨ ᠠᠢ᠌ᠯ ᠬᠣᠲᠠ # Жалан-Айл хот
157
+ expected: jalan ai᠌l hôta
158
+ - source: ᠶᠠᠭᠰᠢ ᠬᠣᠲᠠ # Ягши хот
159
+ expected: yagsi hôta
160
+ - source: ᠮᠠᠨᠵᠤᠤᠷ ᠬᠣᠲᠠ # Манжуур хот
161
+ expected: manjûûr hôta
162
+ - source: ᠬᠠᠶᠢᠯᠠᠷ ᠲᠣᠭᠣᠷᠢᠭ # Хайлаар тойрог
163
+ expected: hayilar tôgôrig
164
+ - source: ᠬᠣᠷᠴᠢᠨ ᠲᠣᠭᠣᠷᠢᠭ # Horqin District
165
+ expected: hôrqin tôgôrig
166
+ - source: ᠺᠠᠶᠢᠯᠦ ᠰᠢᠶᠠᠨ # Kailu County
167
+ expected: kayilu siyan
168
+ - source: ᠬᠦᠷᠢᠶ᠎ᠡ ᠬᠣᠰᠢᠭᠤ # Hure Banner
169
+ expected: huriy-e hôsigû
170
+ - source: ᠨᠠᠢᠮᠠᠨ ᠬᠣᠰᠢᠭᠤ # Naiman Banner
171
+ expected: naiman hôsigû
172
+ - source: ᠵᠠᠷᠤᠳ ᠬᠣᠰᠢᠭᠤ # Jarud Banner
173
+ expected: jarûd hôsigû
174
+ - source: ᠬᠣᠷᠴᠢᠨ ᠪᠠᠷᠠᠭᠤᠨ ᠭᠠᠷᠤᠨ ᠳᠤᠮᠳᠠᠳᠤ ᠬᠣᠰᠢᠭᠤ # Хорчин Баруун Гарын Дундад Хошуу
175
+ expected: hôrqin baragûn garûn dûmdadû hôsigû
176
+ - source: ᠬᠣᠷᠴᠢᠨ ᠵᠡᠭᠦᠨ ᠭᠠᠷᠤᠨ ᠳᠤᠮᠳᠠᠳᠤ ᠬᠣᠰᠢᠭᠤ # Horqin Left Middle Banner
177
+ expected: hôrqin jegun garûn dûmdadû hôsigû
178
+ - source: ᠬᠣᠷᠴᠢᠨ ᠵᠡᠭᠦᠨ ᠭᠠᠷᠤᠨ ᠬᠣᠶᠢᠲᠤ ᠬᠣᠰᠢᠭᠤ # Horqin Left Rear Banner
179
+ expected: hôrqin jegun garûn hôyitû hôsigû
180
+ - source: ᠤᠯᠠᠭᠠᠨᠬᠠᠳᠠ ᠬᠣᠲᠠ # Улаанхад хот
181
+ expected: ûlaganhada hôta
182
+ - source: ᠰᠡᠷᠡᠴᠢ # Salaqi
183
+ expected: sereqi
184
+ - source: ᠭᠡᠭᠡᠨ ᠭᠣᠤᠯ ᠬᠣᠲᠠ # Гэгээнгол хот
185
+ expected: gegen gôûl hôta
186
+ - source: ᠠᠯᠠᠱᠠ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # Alxa Left Banner
187
+ expected: alaxa jegun hôsigû
188
+ - source: ᠠᠯᠠᠱᠠ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # Alxa Right Banner
189
+ expected: alaxa baragûn hôsigû
190
+ - source: ᠡᠵᠡᠨ᠎ᠡ ᠬᠣᠰᠢᠭᠤ # Ejin Banner
191
+ expected: ejen-e hôsigû
192
+ - source: ᠬᠥᠪᠡᠭᠡᠲᠦ ᠰᠢᠷ᠎ᠠ ᠬᠣᠰᠢᠭᠤ # Хөвөөт Шар хошуу
193
+ expected: hobegetu sir-a hôsigû
194
+ - source: ᠦᠶᠤᠸᠠᠨ ᠰᠢᠶᠠᠨ # Үюань шянь
195
+ expected: uyûwan siyan
196
+ - source: ᠦᠴᠤᠸᠠᠨ ᠰᠢᠶᠠᠨ # Wuchuan County
197
+ expected: uqûwan siyan
198
+ - source: ᠲᠦᠴᠢᠤᠸᠠᠨ ᠰᠢᠶᠠᠨ # Тучуань шянь
199
+ expected: tuqiûwan siyan
200
+ - source: ᠨᠢᠩᠴᠧᠩ ᠰᠢᠶᠠᠨ # Ningcheng County
201
+ expected: ningqeng siyan
202
+ - source: ᠯᠢᠨᠰᠢ ᠰᠢᠶᠠᠨ # Linxi County
203
+ expected: linsi siyan
204
+ - source: ᠯᠢᠨᠾᠧ ᠲᠣᠭᠣᠷᠢᠭ # Linhe
205
+ expected: linhe tôgôrig
206
+ - source: ᠬᠠᠷᠠᠴᠢᠨ ᠬᠣᠰᠢᠭᠤ # Harqin Banner
207
+ expected: haraqin hôsigû
208
+ - source: ᠳ᠋ᠧᠩᠺᠧᠦ ᠰᠢᠶᠠᠨ # Dengkou County
209
+ expected: d᠋engkeu siyan
210
+ - source: ᠠᠤᠬᠠᠨ ᠬᠣᠰᠢᠭᠤ # Aohan Banner
211
+ expected: aûhan hôsigû
212
+ - source: ᠴᠢᠩ ᠱᠦᠢ ᠾᠧ ᠰᠢᠶᠠᠨ # Qingshuihe County
213
+ expected: qing xui he siyan
214
+ - source: ᠬᠣᠳᠣᠩ ᠠᠷᠠᠳ ᠤᠨ ᠲᠣᠭᠣᠷᠢᠭ # Huimin District
215
+ expected: hôdông arad-ûn tôgôrig
216
+ - source: ᠰᠠᠶᠢᠬᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Saihan District
217
+ expected: sayihan tôgôrig
218
+ - source: ᠰᠢᠨ᠎ᠡ ᠬᠣᠲᠠ ᠲᠣᠭᠣᠷᠢᠭ # Xincheng District
219
+ expected: sin-e hôta tôgôrig
220
+ - source: ᠬᠠᠶᠢᠷᠤᠪ ᠤᠨ ᠲᠣᠬᠣᠢ ᠲᠣᠭᠣᠷᠢᠭ # Haibowan (Hairibin Tohoi) District
221
+ expected: hayirûb-ûn tôhôi tôgôrig
222
+ - source: ᠰᠦᠩ ᠱᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Songshan District
223
+ expected: sung xan tôgôrig
224
+ - source: ᠬᠦᠩ ᠱᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Hongshan District
225
+ expected: hung xan tôgôrig
226
+ - source: ᠠᠷᠤᠨ ᠬᠣᠰᠢᠭᠤ # Арун хошуу
227
+ expected: arûn hôsigû
228
+ - source: ᠶᠤᠸᠠᠨ ᠪᠣᠣ ᠱᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Юаньбаошань тойрог
229
+ expected: yûwan bôô xan tôgôrig
230
+ - source: ᠰᠢᠯᠤᠭᠤᠨ ᠬᠥᠪᠡᠭᠡᠲᠦ ᠴᠠᠭᠠᠨ ᠬᠣᠰᠢᠭᠤ # Шулуун Хөвөөт Цагаан хошуу
231
+ expected: silûgûn hobegetu qagan hôsigû
232
+ - source: ᠰᠢᠯᠤᠭᠤᠨ ᠬᠥᠬᠡ ᠬᠣᠰᠢᠭᠤ # Шулуун хөх хошуу
233
+ expected: silûgûn hohe hôsigû
234
+ - source: ᠤᠷᠠᠳ ᠤᠨ ᠳᠤᠮᠳᠠᠳᠤ ᠬᠣᠰᠢᠭᠤ # Урадын Дундад Хошуу
235
+ expected: ûrad-ûn dûmdadû hôsigû
236
+ - source: ᠤᠷᠠᠳ ᠤᠨ ᠡᠮᠦᠨᠡᠳᠦ ᠬᠣᠰᠢᠭᠤ # Урадын Өмнөд Хошуу
237
+ expected: ûrad-ûn emunedu hôsigû
238
+ - source: ᠲᠣᠭᠲᠠᠬᠤ ᠰᠢᠶᠠᠨ # Тогтох шянь
239
+ expected: tôgtahû siyan
240
+ - source: ᠲᠠᠶᠢᠫᠤᠰᠧ ᠬᠣᠰᠢᠭᠤ # Тайвас хошуу
241
+ expected: tayipûse hôsigû
242
+ - source: ᠰᠥᠨᠡᠳ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # Sonid Left Banner
243
+ expected: soned jegun hôsigû
244
+ - source: ᠰᠥᠨᠡᠳ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # Sonid Right Banner
245
+ expected: soned baragûn hôsigû
246
+ - source: ᠣᠩᠨᠢᠭᠤᠳ ᠬᠣᠰᠢᠭᠤ # Ongniud Banner
247
+ expected: ôngnigûd hôsigû
248
+ - source: ᠵᠠᠯᠠᠢᠳ ᠬᠣᠰᠢᠭᠤ # Jalaid Banner
249
+ expected: jalaid hôsigû
250
+ - source: ᠬᠠᠩᠭᠢᠨ ᠬᠣᠶᠢᠲᠤ ᠬᠣᠰᠢᠭᠤ # Hanggin Rear Banner
251
+ expected: hanggin hôyitû hôsigû
252
+ - source: ᠵᠡᠭᠦᠨ ᠤᠵᠤᠮᠤᠴᠢᠨ ᠬᠣᠰᠢᠭᠤ # East Ujimqin Banner
253
+ expected: jegun ûjûmûqin hôsigû
254
+ - source: ᠠᠷᠤ ᠬᠣᠷᠴᠢᠨ ᠬᠣᠰᠢᠭᠤ # Ar Horqin Banner
255
+ expected: arû hôrqin hôsigû
256
+ - source: ᠠᠪᠠᠭ᠎ᠠ ᠬᠣᠰᠢᠭᠤ # Abag Banner
257
+ expected: abag-a hôsigû
258
+ - source: ᠪᠤᠷᠢᠶᠠᠳ # Буриад
259
+ expected: bûriyad
260
+ - source: ᠤᠯᠠᠭᠠᠨᠪᠠᠭᠠᠲᠤᠷ # Улаанбаатар
261
+ expected: ûlaganbagatûr
262
+
263
+ map:
264
+ inherit: sasm-mon-Mong-Latn-phonetic-1978
@@ -0,0 +1,350 @@
1
+ ---
2
+ authority_id: ungegn
3
+ id: 1972
4
+ language: iso-639-2:nep
5
+ source_script: Deva
6
+ destination_script: Latn
7
+ name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Nepali Romanization, 1972
8
+ url: https://www.eki.ee/wgrs/v3_0/rom1_ne.pdf
9
+ creation_date: 1972
10
+ confirmation_date: 2010
11
+ description: |
12
+ The United Nations recommended system was approved in 1972 (II/11), based on a report
13
+ prepared by D. N. Sharma. The note on the system was published in volume II of the
14
+ conference report.
15
+
16
+ There is no evidence of the use of the system either in Nepal or in international cartographic
17
+ products. The resolution IV/17 (1982) recommended association, inter alia, with Nepal in
18
+ carrying out further studies on the system. In Nepal a system of romanization is employed by
19
+ the Nepal Survey Department (NSD). This system has been applied to names appearing on
20
+ national mapping, and it is also used in the Geographic Information Infrastructure Programme
21
+ (NGIIP).
22
+
23
+ Nepali (Nepālī) uses the alphasyllabic script Devanāgarī.
24
+
25
+ notes:
26
+
27
+ - In normal spelling ṙ and ṙh are not marked, instead dotless ड ḍa, ढ ḍha are used to denote these sounds.
28
+ - |
29
+ Ligatures may be formed with r as the first component: ~ह rha.
30
+
31
+ ######################################## Additional Note ############################################################
32
+ # It is recommended that the vowel अ (a) should always be romanized except when it ends a #
33
+ # name. This scheme is not yet able to detect names. Analysing the language patterns and the examples, #
34
+ # we found that when a word ends with a consonant, it should be transliterated without the inherent vowel. #
35
+ # So we apply this rule: if a word ends with a consonant, we remove the trailing 'a'. #
36
+ #####################################################################################################################
37
+
38
+
39
+ tests:
40
+ - source: "नेपाल"
41
+ expected: "nepāl"
42
+ - source: "नेपाल काठ्माडौं"
43
+ expected: "nepāl kāṭhmāḍauṁ"
44
+ - source: "लेखन"
45
+ expected: "lekhan"
46
+ - source: "मुद्रा"
47
+ expected: "mudrā"
48
+ - source: "प्रशंसा"
49
+ expected: "prashaṁsā"
50
+ - source: "अंक"
51
+ expected: "aṁk"
52
+ - source: "नेकपाले स्थगित स्थायी कमिटीको बैठक भदौ गते बोलाउने भएको"
53
+ expected: "nekapāle sthagit sthāyī kamiṭīko baiṭhak bhadau gate bolāune bhaeko"
54
+ - source: "न घर रह्यो, न परिवार"
55
+ expected: "n ghar rahyo, n parivār"
56
+ - source: "ढोरपाटनमा भुजीखोला बाढीपहिरोले अभिभावक गुमाएका बालबालिकाको बिचल्ली"
57
+ expected: "ḍhorapāṭanamā bhujīkholā bāḍhīpahirole abhibhāvak gumāekā bālabālikāko bichallī"
58
+ - source: "सुस्मिताका काका हेमबहादुर र काकीलाई पनि पहिरोले बगायो"
59
+ expected: "susmitākā kākā hemabahādur r kākīlāī pani pahirole bagāyo"
60
+ - source: "संविधान जारी भएसँगै सार्वजनिक प्रशासनमा नयाँ उत्साह आउने अपेक्षा थियो"
61
+ expected: "saṁvidhān jārī bhaesam̐gai sārvajanik prashāsanamā nayām̐ utsāh āune apekṣhā thiyo"
62
+ - source: "देशमा कोरोना संक्रमित र मृतकको संख्या हरेक दिन बढ्दो छ"
63
+ expected: "deshamā koronā saṁkramit r mṛtakako saṁkhyā harek din baḍhdo chh"
64
+ - source: "गाउँपालिकाका अध्यक्ष टिका गुरुङका अनुसार विष्णुदासलाई राजुले सुत्नका लागि बेलुका साथी लगेका थिए"
65
+ expected: "gāum̐pālikākā adhyakṣh ṭikā guruṅakā anusār viṣhṇudāsalāī rājule sutnakā lāgi belukā sāthī lagekā thie"
66
+ - source: "यो आयोजना गाउँपालिकाको केन्द्र तेल्लोकमा पर्छ"
67
+ expected: "yo āyojanā gāum̐pālikāko kendr tellokamā parchh"
68
+ - source: "सुस्मिताका काका हेमबहादुर र काकीलाई पनि पहिरोले बगायो"
69
+ expected: "susmitākā kākā hemabahādur r kākīlāī pani pahirole bagāyo"
70
+ - source: "चैत पहिलो साता घर आएका उनी लकडाउन भएपछि यतै रोकिए"
71
+ expected: "chait pahilo sātā ghar āekā unī lakaḍāun bhaepachhi yatai rokie"
72
+ - source: "काम गर्न जानेको हकमा रोजगारदाता कम्पनीको पत्रसँगै वडा र जिल्ला प्रशासनको सिफारिस अनिवार्य गरिएको छ"
73
+ expected: "kām garn jāneko hakamā rojagāradātā kampanīko patrasam̐gai vaḍā r jillā prashāsanako siphāris anivāry garieko chh"
74
+ - source: "ऋण"
75
+ expected: "ṛṇ"
76
+ - source: "अर्पित"
77
+ expected: "arpit"
78
+ - source: "अरार्यते"
79
+ expected: "arāryate"
80
+ - source: "श्रीमान्"
81
+ expected: "shrīmān"
82
+ - source: "खाँचो बिरुवा बैंकको"
83
+ expected: "khām̐cho biruvā baiṁkako"
84
+
85
+
86
+ map:
87
+
88
+ rules:
89
+ - pattern: ([क]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
90
+ result: 'k'
91
+ - pattern: ([ख]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
92
+ result: 'kh'
93
+ - pattern: ([ग]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
94
+ result: 'g'
95
+ - pattern: ([घ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
96
+ result: 'gh'
97
+ - pattern: ([ङ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
98
+ result: 'ṅ'
99
+ - pattern: ([च]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
100
+ result: 'ch'
101
+ - pattern: ([छ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
102
+ result: 'chh'
103
+ - pattern: ([ज]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
104
+ result: 'j'
105
+ - pattern: ([झ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
106
+ result: 'jh'
107
+ - pattern: ([ञ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
108
+ result: 'ñ'
109
+ - pattern: ([ट]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
110
+ result: 'ṭ'
111
+ - pattern: ([ठ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
112
+ result: 'ṭh'
113
+ - pattern: ([ड]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
114
+ result: 'ḍ'
115
+ - pattern: ([ढ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
116
+ result: 'ḍh'
117
+ - pattern: ([ण]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
118
+ result: 'ṇ'
119
+ - pattern: ([त]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
120
+ result: 't'
121
+ - pattern: ([थ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
122
+ result: 'th'
123
+ - pattern: ([द]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
124
+ result: 'd'
125
+ - pattern: ([ध]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
126
+ result: 'dh'
127
+ - pattern: ([न]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
128
+ result: 'n'
129
+ - pattern: ([प]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
130
+ result: 'p'
131
+ - pattern: ([फ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
132
+ result: 'ph'
133
+ - pattern: ([ब]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
134
+ result: 'b'
135
+ - pattern: ([भ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
136
+ result: 'bh'
137
+ - pattern: ([म]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
138
+ result: 'm'
139
+ - pattern: ([य]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
140
+ result: 'y'
141
+ - pattern: ([र]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
142
+ result: 'r'
143
+ - pattern: ([ल]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
144
+ result: 'l'
145
+ - pattern: ([व]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
146
+ result: 'v'
147
+ - pattern: ([श]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
148
+ result: 'sh'
149
+ - pattern: ([ष]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
150
+ result: 'ṣh'
151
+ - pattern: ([स]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
152
+ result: 's'
153
+ - pattern: ([क़]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
154
+ result: 'q'
155
+ - pattern: ([ख़]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
156
+ result: 'ḳh'
157
+ - pattern: ([ग़]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
158
+ result: 'g'
159
+ - pattern: ([ज़]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
160
+ result: 'z'
161
+ - pattern: ([ड़]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
162
+ result: 'ṙ'
163
+ - pattern: ([ढ़]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
164
+ result: 'ṙh'
165
+ - pattern: ([फ़]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
166
+ result: 'f'
167
+ - pattern: ([ह]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
168
+ result: 'h'
169
+
170
+
171
+ - pattern: ([क])(?=\b)
172
+ result: 'k'
173
+ - pattern: ([ख])(?=\b)
174
+ result: 'kh'
175
+ - pattern: ([ग])(?=\b)
176
+ result: 'g'
177
+ - pattern: ([घ])(?=\b)
178
+ result: 'gh'
179
+ - pattern: ([ङ])(?=\b)
180
+ result: 'ṅ'
181
+ - pattern: ([च])(?=\b)
182
+ result: 'ch'
183
+ - pattern: ([छ])(?=\b)
184
+ result: 'chh'
185
+ - pattern: ([ज])(?=\b)
186
+ result: 'j'
187
+ - pattern: ([झ])(?=\b)
188
+ result: 'jh'
189
+ - pattern: ([ञ])(?=\b)
190
+ result: 'ñ'
191
+ - pattern: ([ट])(?=\b)
192
+ result: 'ṭ'
193
+ - pattern: ([ठ])(?=\b)
194
+ result: 'ṭh'
195
+ - pattern: ([ड])(?=\b)
196
+ result: 'ḍ'
197
+ - pattern: ([ढ])(?=\b)
198
+ result: 'ḍh'
199
+ - pattern: ([ण])(?=\b)
200
+ result: 'ṇ'
201
+ - pattern: ([त])(?=\b)
202
+ result: 't'
203
+ - pattern: ([थ])(?=\b)
204
+ result: 'th'
205
+ - pattern: ([द])(?=\b)
206
+ result: 'd'
207
+ - pattern: ([ध])(?=\b)
208
+ result: 'dh'
209
+ - pattern: ([न])(?=\b)
210
+ result: 'n'
211
+ - pattern: ([प])(?=\b)
212
+ result: 'p'
213
+ - pattern: ([फ])(?=\b)
214
+ result: 'ph'
215
+ - pattern: ([ब])(?=\b)
216
+ result: 'b'
217
+ - pattern: ([भ])(?=\b)
218
+ result: 'bh'
219
+ - pattern: ([म])(?=\b)
220
+ result: 'm'
221
+ - pattern: ([य])(?=\b)
222
+ result: 'y'
223
+ - pattern: ([र])(?=\b)
224
+ result: 'r'
225
+ - pattern: ([ल])(?=\b)
226
+ result: 'l'
227
+ - pattern: ([व])(?=\b)
228
+ result: 'v'
229
+ - pattern: ([श])(?=\b)
230
+ result: 'sh'
231
+ - pattern: ([ष])(?=\b)
232
+ result: 'ṣh'
233
+ - pattern: ([स])(?=\b)
234
+ result: 's'
235
+ - pattern: ([क़])(?=\b)
236
+ result: 'q'
237
+ - pattern: ([ख़])(?=\b)
238
+ result: 'ḳh'
239
+ - pattern: ([ग़])(?=\b)
240
+ result: 'g'
241
+ - pattern: ([ज़])(?=\b)
242
+ result: 'z'
243
+ - pattern: ([ड़])(?=\b)
244
+ result: 'ṙ'
245
+ - pattern: ([ढ़])(?=\b)
246
+ result: 'ṙh'
247
+ - pattern: ([फ़])(?=\b)
248
+ result: 'f'
249
+ - pattern: ([ह])(?=\b)
250
+ result: 'h'
251
+
252
+ characters:
253
+
254
+ # Vowels and Diphthongs
255
+ 'अ': 'a'
256
+ 'आ': 'ā'
257
+ 'इ': 'i'
258
+ 'ई': 'ī'
259
+ 'उ': 'u'
260
+ 'ऊ': 'ū'
261
+ 'ऋ': 'ṛ'
262
+ 'ॠ': 'ṝ'
263
+ 'ऌ': 'l̤'
264
+ 'ए': 'e'
265
+ 'ऐ': 'ai'
266
+ 'ओ': 'o'
267
+ 'औ': 'au'
268
+
269
+ # Medials # Needed for connecting consonants
270
+
271
+ 'ा': "ā"
272
+ 'ि': "i"
273
+ 'ी': "ī"
274
+ 'ु': "u"
275
+ 'ू': "ū"
276
+ 'ृ': "ṛ"
277
+ 'े': "e"
278
+ 'ै': "ai"
279
+ 'ो': "o"
280
+ 'ौ': "au"
281
+
282
+ # Consonants (see Note 1)
283
+
284
+ # Gutturals
285
+ 'क': 'ka'
286
+ 'ख': 'kha'
287
+ 'ग': 'ga'
288
+ 'घ': 'gha'
289
+ 'ङ': 'ṅa'
290
+
291
+ # Palatals
292
+ 'च': 'cha'
293
+ 'छ': 'chha'
294
+ 'ज': 'ja'
295
+ 'झ': 'jha'
296
+ 'ञ': 'ña'
297
+
298
+ # Cerebrals
299
+ 'ट': 'ṭa'
300
+ 'ठ': 'ṭha'
301
+ 'ड': 'ḍa'
302
+ 'ढ': 'ḍha'
303
+ 'ण': 'ṇa'
304
+
305
+ # Dentals
306
+ 'त': 'ta'
307
+ 'थ': 'tha'
308
+ 'द': 'da'
309
+ 'ध': 'dha'
310
+ 'न': 'na'
311
+
312
+ # Labials
313
+ 'प': 'pa'
314
+ 'फ': 'pha'
315
+ 'ब': 'ba'
316
+ 'भ': 'bha'
317
+ 'म': 'ma'
318
+
319
+ # Semivowels
320
+ 'य': 'ya'
321
+ 'र': 'ra'
322
+ 'ल': 'la'
323
+ 'व': 'va' # or wa [Note#3]
324
+
325
+ # Sibilants
326
+ 'श': 'sha'
327
+ 'ष': 'ṣha'
328
+ 'स': 'sa'
329
+
330
+ # Dotted variants
331
+ 'क़': qa
332
+ 'ख़': ḳha
333
+ 'ग़': ga
334
+ 'ज़': za
335
+ 'ड़': ṙa
336
+ 'ढ़': ṙha
337
+ 'फ़': fa
338
+
339
+
340
+ # Aspirate
341
+ 'ह': 'ha'
342
+
343
+ # Anusvāra
344
+ 'ं': 'ṁ'
345
+
346
+ # Anunāsika
347
+ 'ँ': 'm̐'
348
+
349
+ # halanta
350
+ '्': ''