interscript 0.1.2 → 0.1.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (261) hide show
  1. checksums.yaml +4 -4
  2. data/README.adoc +250 -17
  3. data/lib/g2pwrapper.py +34 -0
  4. data/lib/interscript.rb +142 -20
  5. data/lib/interscript/command.rb +28 -0
  6. data/lib/interscript/fs.rb +69 -0
  7. data/lib/interscript/mapping.rb +142 -0
  8. data/lib/interscript/opal.rb +57 -0
  9. data/lib/interscript/opal/entrypoint.rb +12 -0
  10. data/lib/interscript/opal/map_translate.rb +7 -0
  11. data/lib/interscript/opal/maps.js.erb +10 -0
  12. data/lib/interscript/version.rb +1 -1
  13. data/lib/model-7 +0 -0
  14. data/lib/tha-pt-b-7 +0 -0
  15. data/maps/acadsin-zho-Hani-Latn-2002.yaml +38916 -0
  16. data/maps/alalc-amh-Ethi-Latn-1997.yaml +513 -0
  17. data/maps/alalc-amh-Ethi-Latn-2011.yaml +138 -0
  18. data/maps/alalc-ara-Arab-Latn-1997.yaml +1287 -0
  19. data/maps/alalc-asm-Deva-Latn-1997.yaml +165 -0
  20. data/maps/alalc-asm-Deva-Latn-2012.yaml +40 -0
  21. data/maps/alalc-aze-Cyrl-Latn-1997.yaml +145 -0
  22. data/maps/alalc-bel-Cyrl-Latn-1997.yaml +129 -0
  23. data/maps/alalc-ben-Beng-Latn-2017.yaml +130 -0
  24. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +98 -0
  25. data/maps/alalc-ell-Grek-Latn-1997.yaml +628 -0
  26. data/maps/alalc-ell-Grek-Latn-2010.yaml +626 -0
  27. data/maps/alalc-guj-Gujr-Latn-1997.yaml +266 -0
  28. data/maps/alalc-guj-Gujr-Latn-2011.yaml +64 -0
  29. data/maps/alalc-hin-Deva-Latn-1997.yaml +211 -0
  30. data/maps/alalc-hin-Deva-Latn-2011.yaml +47 -0
  31. data/maps/alalc-kat-Geok-Latn-1997.yaml +111 -0
  32. data/maps/alalc-kat-Geor-Latn-1997.yaml +150 -0
  33. data/maps/alalc-kor-Hang-Latn-1997.yaml +98 -0
  34. data/maps/alalc-mal-Mlym-Latn-1997.yaml +303 -0
  35. data/maps/alalc-mal-Mlym-Latn-2012.yaml +73 -0
  36. data/maps/alalc-mar-Deva-Latn-1997.yaml +189 -0
  37. data/maps/alalc-mar-Deva-Latn-2011.yaml +45 -0
  38. data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +114 -0
  39. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +103 -0
  40. data/maps/alalc-mon-Cyrl-Latn-1997.yaml +220 -0
  41. data/maps/alalc-pan-Guru-Latn-1997.yaml +256 -0
  42. data/maps/alalc-pan-Guru-Latn-2011.yaml +78 -0
  43. data/maps/alalc-per-Arab-Latn-1997.yaml +375 -0
  44. data/maps/alalc-pli-Deva-Latn-2012.yaml +144 -0
  45. data/maps/alalc-pra-Deva-Latn-2012.yaml +47 -0
  46. data/maps/alalc-rus-Cyrl-Latn-1997.yaml +225 -0
  47. data/maps/alalc-rus-Cyrl-Latn-2012.yaml +162 -0
  48. data/maps/alalc-san-Deva-Latn-2012.yaml +172 -0
  49. data/maps/alalc-sin-Sinh-Latn-1997.yaml +292 -0
  50. data/maps/alalc-sin-Sinh-Latn-2011.yaml +71 -0
  51. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +118 -0
  52. data/maps/alalc-srp-Cyrl-Latn-2013.yaml +135 -0
  53. data/maps/alalc-tam-Taml-Latn-1997.yaml +62 -0
  54. data/maps/alalc-tam-Taml-Latn-2011.yaml +58 -0
  55. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +145 -0
  56. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +16 -0
  57. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +283 -0
  58. data/maps/{bas-rus-Cyrl-Latn-bss.yaml → bas-rus-Cyrl-Latn-2017-bss.yaml} +58 -33
  59. data/maps/{bas-rus-Cyrl-Latn-oss.yaml → bas-rus-Cyrl-Latn-2017-oss.yaml} +55 -35
  60. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +292 -0
  61. data/maps/bgn-kor-Hang-Latn-1943.yaml +35 -0
  62. data/maps/bgn-kor-Kore-Latn-1943.yaml +31 -0
  63. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +208 -0
  64. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +208 -0
  65. data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +532 -0
  66. data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +596 -0
  67. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +2 -3
  68. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +104 -0
  69. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +188 -0
  70. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +289 -0
  71. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +119 -0
  72. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +15 -65
  73. data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +184 -0
  74. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +705 -0
  75. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +23 -0
  76. data/maps/{bgnpcgn-per-Arab-Latn-1956.yaml → bgnpcgn-fas-Arab-Latn-1956.yaml} +5 -2
  77. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +257 -0
  78. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +131 -0
  79. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +42 -0
  80. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +253 -0
  81. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +48 -0
  82. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +48 -0
  83. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +163 -0
  84. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +190 -0
  85. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +223 -0
  86. data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +230 -0
  87. data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +336 -0
  88. data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +639 -0
  89. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +459 -0
  90. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +168 -0
  91. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +150 -65
  92. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +170 -0
  93. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +220 -0
  94. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +240 -0
  95. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +80 -4
  96. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +119 -0
  97. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +127 -0
  98. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +82 -0
  99. data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +7456 -0
  100. data/maps/bis-asm-Beng-Latn-13194-1991.yaml +159 -0
  101. data/maps/bis-ben-Beng-Latn-13194-1991.yaml +156 -0
  102. data/maps/bis-dev-Deva-Latn-13194-1991.yaml +184 -0
  103. data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +181 -0
  104. data/maps/bis-knd-Knda-Latn-13194-1991.yaml +173 -0
  105. data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +176 -0
  106. data/maps/bis-ori-Orya-Latn-13194-1991.yaml +160 -0
  107. data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +175 -0
  108. data/maps/bis-tel-Telu-Latn-13194-1991.yaml +170 -0
  109. data/maps/bis-tml-Taml-Latn-13194-1991.yaml +155 -0
  110. data/maps/by-bel-Cyrl-Latn-1998.yaml +172 -0
  111. data/maps/by-bel-Cyrl-Latn-2007.yaml +115 -0
  112. data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +899 -0
  113. data/maps/din-hin-Deva-Latn-33904-2018.yaml +100 -0
  114. data/maps/din-kat-Geor-Latn-32707-2010.yaml +145 -0
  115. data/maps/din-mar-Deva-Latn-33904-2018.yaml +84 -0
  116. data/maps/din-nep-Deva-Latn-33904-2018.yaml +119 -0
  117. data/maps/din-pli-Deva-Latn-33904-2018.yaml +75 -0
  118. data/maps/din-pra-Deva-Latn-33904-2018.yaml +63 -0
  119. data/maps/din-san-Deva-Latn-33904-2018.yaml +338 -0
  120. data/maps/din-tam-Taml-Latn-33903-2016.yaml +213 -0
  121. data/maps/dos-nep-Deva-Latn-1997.yaml +47 -0
  122. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +684 -0
  123. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +680 -0
  124. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +19 -0
  125. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +31 -0
  126. data/maps/ggg-kat-Geor-Latn-2002.yaml +92 -0
  127. data/maps/gki-bel-Cyrl-Latn-1992.yaml +33 -0
  128. data/maps/gki-bel-Cyrl-Latn-2000.yaml +201 -0
  129. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +190 -0
  130. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +157 -0
  131. data/maps/hk-yue-Hani-Latn-1888.yaml +38497 -0
  132. data/maps/icao-bel-Cyrl-Latn-9303.yaml +109 -98
  133. data/maps/icao-bul-Cyrl-Latn-9303.yaml +2 -7
  134. data/maps/{icao-per-Arab-Latn-9303.yaml → icao-fas-Arab-Latn-9303.yaml} +6 -8
  135. data/maps/icao-heb-Hebr-Latn-9303.yaml +119 -125
  136. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +2 -3
  137. data/maps/icao-rus-Cyrl-Latn-9303.yaml +2 -4
  138. data/maps/icao-srp-Cyrl-Latn-9303.yaml +2 -3
  139. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +2 -4
  140. data/maps/iso-ara-Arab-Latn-233-1984.yaml +323 -0
  141. data/maps/iso-asm-Beng-Latn-15919-2001.yaml +75 -0
  142. data/maps/iso-ben-Beng-Latn-15919-2001.yaml +175 -0
  143. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +613 -0
  144. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +44 -0
  145. data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +220 -0
  146. data/maps/iso-hin-Deva-Latn-15919-2001.yaml +87 -0
  147. data/maps/iso-inc-Deva-Latn-15919-2001.yaml +61 -0
  148. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +66 -0
  149. data/maps/iso-kan-Knda-Latn-15919-2001.yaml +220 -0
  150. data/maps/iso-kat-Geor-Latn-9984-1996.yaml +145 -0
  151. data/maps/iso-kor-Hang-Latn-1996-method1.yaml +240 -0
  152. data/maps/iso-kor-Hang-Latn-1996-method2.yaml +226 -0
  153. data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +281 -0
  154. data/maps/iso-mar-Deva-Latn-15919-2001.yaml +75 -0
  155. data/maps/iso-nep-Deva-Latn-15919-2001.yaml +87 -0
  156. data/maps/iso-ori-Orya-Latn-15919-2001.yaml +193 -0
  157. data/maps/iso-pan-Guru-Latn-15919-2001.yaml +222 -0
  158. data/maps/iso-pli-Beng-Latn-15919-2001.yaml +73 -0
  159. data/maps/iso-pli-Deva-Latn-15919-2001.yaml +74 -0
  160. data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +219 -0
  161. data/maps/iso-pli-Thai-Latn-15919-2001.yaml +55 -0
  162. data/maps/iso-pra-Deva-Latn-15919-2001.yaml +59 -0
  163. data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +366 -0
  164. data/maps/{iso-rus-Cyrl-Latn-iso9.yaml → iso-rus-Cyrl-Latn-9-1995.yaml} +4 -6
  165. data/maps/iso-san-Deva-Latn-15919-2001.yaml +220 -0
  166. data/maps/iso-tam-Taml-Latn-15919-2001.yaml +159 -0
  167. data/maps/iso-tel-Telu-Latn-15919-2001.yaml +220 -0
  168. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +109 -0
  169. data/maps/kp-kor-Hang-Latn-2002.yaml +909 -0
  170. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +44820 -0
  171. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +411 -0
  172. data/maps/mns-mon-Cyrl-Latn-5217-2012.yaml +163 -0
  173. data/maps/mns-mon-Latn-Cyrl-5217-2012.yaml +200 -0
  174. data/maps/moct-kor-Hang-Latn-2000.yaml +807 -0
  175. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +541 -0
  176. data/maps/mvd-bel-Cyrl-Latn-2008.yaml +225 -0
  177. data/maps/mvd-bel-Cyrl-Latn-2010.yaml +63 -0
  178. data/maps/mvd-rus-Cyrl-Latn-2008.yaml +109 -0
  179. data/maps/mvd-rus-Cyrl-Latn-2010.yaml +37 -0
  180. data/maps/odni-ara-Arab-Latn-2015.yaml +425 -0
  181. data/maps/odni-aze-Cyrl-Latn-2015.yaml +144 -0
  182. data/maps/odni-bel-Cyrl-Latn-2015.yaml +148 -0
  183. data/maps/odni-bul-Cyrl-Latn-2015.yaml +96 -0
  184. data/maps/odni-che-Cyrl-Latn-2015.yaml +169 -0
  185. data/maps/odni-fas-Arab-Latn-2015.yaml +406 -0
  186. data/maps/odni-hin-Deva-Latn-2015.yaml +258 -0
  187. data/maps/odni-kat-Geor-Latn-2015.yaml +87 -0
  188. data/maps/odni-kaz-Cyrl-Latn-2015.yaml +148 -0
  189. data/maps/odni-kir-Cyrl-Latn-2015.yaml +136 -0
  190. data/maps/odni-kor-Hang-Latn-2015.yaml +375 -0
  191. data/maps/odni-mkd-Cyrl-Latn-2015.yaml +122 -0
  192. data/maps/odni-per-Arab-Latn-2015.yaml +228 -0
  193. data/maps/odni-rus-Cyrl-Latn-2015.yaml +77 -0
  194. data/maps/odni-srp-Cyrl-Latn-2015.yaml +129 -0
  195. data/maps/odni-tat-Cyrl-Latn-2015.yaml +142 -0
  196. data/maps/odni-tgk-Cyrl-Latn-2015.yaml +148 -0
  197. data/maps/odni-uig-Cyrl-Latn-2015.yaml +138 -0
  198. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +157 -0
  199. data/maps/odni-urd-Arab-Latn-2015.yaml +221 -0
  200. data/maps/odni-uzb-Cyrl-Latn-2015.yaml +166 -0
  201. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +90 -0
  202. data/maps/royin-tha-Thai-Latn-1968.yaml +183 -0
  203. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +180 -0
  204. data/maps/royin-tha-Thai-Latn-1999.yaml +80 -0
  205. data/maps/{cn-chn-Hans-Latn-pinyin.yaml → sac-zho-Hans-Latn-1979.yaml} +11 -8
  206. data/maps/sasm-mon-Mong-Latn-general-1978.yaml +389 -0
  207. data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +354 -0
  208. data/maps/ses-ara-Arab-Latn-1930.yaml +283 -0
  209. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +222 -0
  210. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +197 -0
  211. data/maps/ua-ukr-Cyrl-Latn-2007.yaml +75 -0
  212. data/maps/ua-ukr-Cyrl-Latn-2010.yaml +192 -0
  213. data/maps/un-amh-Ethi-Latn-2016.yaml +602 -0
  214. data/maps/un-ara-Arab-Latn-1971.yaml +139 -0
  215. data/maps/un-ara-Arab-Latn-1972.yaml +159 -0
  216. data/maps/un-ara-Arab-Latn-2017.yaml +420 -0
  217. data/maps/un-bel-Cyrl-Latn-2007.yaml +114 -0
  218. data/maps/un-ben-Beng-Latn-2016.yaml +534 -0
  219. data/maps/un-ell-Grek-Latn-1987-phonetic.yaml +780 -0
  220. data/maps/un-ell-Grek-Latn-1987-tl.yaml +31 -0
  221. data/maps/un-ell-Grek-Latn-1987-ts.yaml +19 -0
  222. data/maps/un-hin-Deva-Latn-2016.yaml +222 -0
  223. data/maps/un-mar-Deva-Latn-2016.yaml +91 -0
  224. data/maps/un-mon-Mong-Latn-general-2013.yaml +264 -0
  225. data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +264 -0
  226. data/maps/un-nep-Deva-Latn-1972.yaml +350 -0
  227. data/maps/un-nep-Deva-Latn-2013.yaml +74 -0
  228. data/maps/un-rus-Cyrl-Latn-1987.yaml +166 -0
  229. data/maps/un-ukr-Cyrl-Latn-1998.yaml +53 -0
  230. data/maps/un-ukr-Cyrl-Latn-2012.yaml +162 -0
  231. data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +221 -0
  232. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +406 -0
  233. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +386 -0
  234. data/maps/var-kor-Hang-Hang-jamo.yaml +11193 -0
  235. data/maps/var-kor-Hang-Latn-mr-1939.yaml +1054 -0
  236. data/maps/var-kor-Kore-Hang-2013.yaml +59754 -0
  237. data/maps/var-kor-Kore-Latn-mr-1939.yaml +36 -0
  238. data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +43 -0
  239. data/maps/var-mon-Mong-Latn-1930.yaml +102 -0
  240. data/maps/var-mon-Mong-Latn-lessing.yaml +272 -0
  241. data/maps/var-mon-Mong-Latn-vpmc.yaml +274 -0
  242. data/maps/var-pra-Deva-Latn-iast-1912.yaml +30 -0
  243. data/maps/var-san-Deva-Latn-iast-1912.yaml +149 -0
  244. data/maps/var-tha-Thai-Thai-phonemic.yaml +59 -0
  245. data/maps/var-tha-Thai-Zsym-ipa.yaml +301 -0
  246. data/maps/var-zho-Hani-Latn-wd-1979.yaml +38912 -0
  247. data/spec/interscript/filenames_spec.rb +384 -0
  248. data/spec/interscript/mapping_spec.rb +42 -0
  249. data/spec/interscript_spec.rb +23 -5
  250. data/spec/spec_helper.rb +3 -1
  251. metadata +364 -34
  252. data/bin/interscript +0 -20
  253. data/bin/rspec +0 -29
  254. data/maps/bgnpcgn-chn-Hans-Latn-pinyin.yaml +0 -7503
  255. data/maps/historic-jpn-Hrkt-Latn-hepburn.yaml +0 -336
  256. data/maps/icao-gre-Grek-Latn-9303.yaml +0 -101
  257. data/maps/mext-jpn-Hrkt-Latn-hepburn.yaml +0 -330
  258. data/maps/mext-jpn-Hrkt-Latn-kunrei.yaml +0 -308
  259. data/maps/un-jpn-Hrkt-Latn-hepburn.yaml +0 -313
  260. data/maps/un-jpn-Hrkt-Latn-kunrei.yaml +0 -354
  261. data/maps/un-mon-Mong-Latn-2013.yaml +0 -80
@@ -0,0 +1,190 @@
1
+ ---
2
+ authority_id: bgnpcgn
3
+ id: 2013
4
+ language: iso-639-2:mkd
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: Macedonian Romanization, BGN/PCGN 2013 System
8
+ url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/811514/ROMANIZATION_OF_MACEDONIAN.pdf
9
+ creation_date: 2013
10
+ description: |
11
+ Macedonian was officially established as a written language in Yugoslavia during
12
+ World War II and is now the official language of North Macedonia.
13
+ This romanization system replaces the BGN/PCGN 1981 agreement and adheres
14
+ to the most widely-accepted standardization of Macedonian orthography.
15
+
16
+ notes:
17
+ - The Macedonian Cyrillic lowercase italic Д may sometimes be seen as g.
18
+ There is no specific Unicode encoding for this variant form so a comparable character
19
+ has been used here for illustrative purposes.
20
+ - The Macedonian Cyrillic lowercase italic Ѓ may sometimes be seen as ī.
21
+ There is no specific Unicode encoding for this variant form so a comparable character
22
+ has been used here for illustrative purposes.
23
+ - The Macedonian Cyrillic lowercase italic П may sometimes be seen as ū.
24
+ There is no specific Unicode encoding for this variant form so a comparable character
25
+ has been used here for illustrative purposes.
26
+ - The Macedonian Cyrillic lowercase italic Т may sometimes be seen as w̄.
27
+ There is no specific Unicode encoding for this variant form so a comparable character
28
+ has been used here for illustrative purposes.
29
+ - |
30
+ An inventory of letter-diacritic combinations, with their Unicode encoding,
31
+ in addition to the unmodified letters of the basic Roman script is:
32
+ | Ǵ (U+01F4) | ǵ (U+01F5) |
33
+ | Ž (U+017D) | ž (U+017E) |
34
+ | Dz (U+01F2)* | dz (U+01F3)* |
35
+ | Lj (U+01C8)* | lj (U+01C9)* |
36
+ | Nj (U+01CB)* | nj (U+01CC)* |
37
+ | Ḱ (U+1E30) | ḱ (U+1E31) |
38
+ | Č (U+010C) | č (U+010D) |
39
+ | Dž (U+01C5)* | dž (U+01C6)* |
40
+ | Š (U+0160) | š (U+0161) |
41
+ * Note that these characters can also be reproduced with individual letters (e.g. l+j).
42
+ - The Romanization column shows only lowercase forms but, when romanizing,
43
+ uppercase and lowercase Roman letters as appropriate should be used.
44
+
45
+ tests:
46
+ - source: Ѓенови Ливаѓе
47
+ expected: Ǵenovi Livaǵe
48
+ - source: ЛУЃЕ луѓе
49
+ expected: LUǴE luǵe
50
+ - source: ЅВЕЗДА ѕвезда Ѕвезда
51
+ expected: DZVEZDA dzvezda Dzvezda
52
+ - source: Јабежица
53
+ expected: Jabežica
54
+ - source: Љиќен и Бард
55
+ expected: Ljiḱen i Bard
56
+ - source: Ќамилов Чукар
57
+ expected: Ḱamilov Čukar
58
+ - source: Џавидин Кајнак
59
+ expected: Džavidin Kajnak
60
+ - source: Џамалџи
61
+ expected: Džamaldži
62
+ - source: Џибра Гури и Зи
63
+ expected: Džibra Guri i Zi
64
+ - source: Абазова Куќарица
65
+ expected: Abazova Kuḱarica
66
+ - source: Баба Анѓина Маала
67
+ expected: Baba Anǵina Maala
68
+ - source: Ваљановец
69
+ expected: Valjanovec
70
+ - source: Галал Једи Дереш
71
+ expected: Galal Jedi Dereš
72
+ - source: Дванаесет Клајнци
73
+ expected: Dvanaeset Klajnci
74
+ - source: Електродистрибуција Струга
75
+ expected: Elektrodistribucija Struga
76
+ - source: Железничка Станица Рајко Жинзифов
77
+ expected: Železnička Stanica Rajko Žinzifov
78
+ - source: Заедничко Речиште
79
+ expected: Zaedničko Rečište
80
+ - source: Испраена Плоча
81
+ expected: Ispraena Ploča
82
+ - source: Казнено-Поправна Установа Идризово
83
+ expected: Kazneno-Popravna Ustanova Idrizovo
84
+ - source: Лази и Зејнелит
85
+ expected: Lazi i Zejnelit
86
+ - source: Мавровско Езеро
87
+ expected: Mavrovsko Ezero
88
+ - source: Национален Парк Галичица
89
+ expected: Nacionalen Park Galičica
90
+ - source: Одморалиште Свети Стефан
91
+ expected: Odmoralište Sveti Stefan
92
+ - source: Планинарски Дом Караџица
93
+ expected: Planinarski Dom Karadžica
94
+ - source: Раса е Лисењит
95
+ expected: Rasa e Lisenjit
96
+ - source: Скочивирска Клисура
97
+ expected: Skočivirska Klisura
98
+ - source: Термо-електроцентрала Неготино
99
+ expected: Termo-elektrocentrala Negotino
100
+ - source: Узуновско Бресје
101
+ expected: Uzunovsko Bresje
102
+ - source: Фабрика Југохром
103
+ expected: Fabrika Jugohrom
104
+ - source: Хидроелектрана Сапунџица
105
+ expected: Hidroelektrana Sapundžica
106
+ - source: Цветковско Рамниште
107
+ expected: Cvetkovsko Ramnište
108
+ - source: Чалтанова Пештера
109
+ expected: Čaltanova Peštera
110
+ - source: Шкемби Вишнејц
111
+ expected: Škembi Višnejc
112
+
113
+ map:
114
+ postrules:
115
+ # DZ
116
+ - pattern: "((?<=[[:upper:]])Dz(?=[[:upper:]])?|(?<=[[:upper:]])?Dz(?=[[:upper:]]))"
117
+ result: "DZ"
118
+ #LJ
119
+ - pattern: "((?<=[[:upper:]])Lj(?=[[:upper:]])?|(?<=[[:upper:]])?Lj(?=[[:upper:]]))"
120
+ result: "LJ"
121
+ #NJ
122
+ - pattern: "((?<=[[:upper:]])Nj(?=[[:upper:]])?|(?<=[[:upper:]])?Nj(?=[[:upper:]]))"
123
+ result: "NJ"
124
+ #DŽ
125
+ - pattern: "((?<=[[:upper:]])Dž(?=[[:upper:]])?|(?<=[[:upper:]])?Dž(?=[[:upper:]]))"
126
+ result: "DŽ"
127
+
128
+ characters:
129
+ "\u0410": "A"
130
+ "\u0411": "B"
131
+ "\u0412": "V"
132
+ "\u0413": "G"
133
+ "\u0414": "D"
134
+ "\u0403": "\u01F4" # Ǵ
135
+ "\u0415": "E"
136
+ "\u0416": "\u005a\u030c" # Ž
137
+ "\u0417": "Z"
138
+ "\u0405": "Dz"
139
+ "\u0418": "I"
140
+ "\u0408": "J"
141
+ "\u041A": "K"
142
+ "\u041B": "L"
143
+ "\u0409": "Lj"
144
+ "\u041C": "M"
145
+ "\u041D": "N"
146
+ "\u040A": "Nj"
147
+ "\u041E": "O"
148
+ "\u041F": "P"
149
+ "\u0420": "R"
150
+ "\u0421": "S"
151
+ "\u0422": "T"
152
+ "\u040C": "\u004b\u0301" # Ḱ
153
+ "\u0423": "U"
154
+ "\u0424": "F"
155
+ "\u0425": "H"
156
+ "\u0426": "C"
157
+ "\u0427": "\u0043\u030c" # Č
158
+ "\u040F": "D\u007a\u030c" # Dž
159
+ "\u0428": "\u0053\u030c" # Š
160
+ "\u0430": "a"
161
+ "\u0431": "b"
162
+ "\u0432": "v"
163
+ "\u0433": "g"
164
+ "\u0434": "d"
165
+ "\u0453": "\u01F5" # ǵ
166
+ "\u0435": "e"
167
+ "\u0436": "\u007a\u030c" # ž
168
+ "\u0437": "z"
169
+ "\u0455": "dz"
170
+ "\u0438": "i"
171
+ "\u0458": "j"
172
+ "\u043A": "k"
173
+ "\u043B": "l"
174
+ "\u0459": "lj"
175
+ "\u043C": "m"
176
+ "\u043D": "n"
177
+ "\u045A": "nj"
178
+ "\u043E": "o"
179
+ "\u043F": "p"
180
+ "\u0440": "r"
181
+ "\u0441": "s"
182
+ "\u0442": "t"
183
+ "\u045C": "\u1E31" # ḱ
184
+ "\u0443": "u"
185
+ "\u0444": "f"
186
+ "\u0445": "h"
187
+ "\u0446": "c"
188
+ "\u0447": "\u0063\u030c" # č
189
+ "\u045F": "d\u007a\u030c" # dž
190
+ "\u0448": "\u0073\u030c" # š
@@ -0,0 +1,223 @@
1
+ ---
2
+ authority_id: bgnpcgn
3
+ id: 1964
4
+ language: iso-639-2:mon
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: BGN/PCGN 1964 System
8
+ alias:
9
+ ogc11122:
10
+ code: mon_Cyrl2Latn_BGN_1964
11
+ description: Mongolian US Board on Geographic Names(BGN)/Permanent Committee on Geographical Names for British Official Use(PCGN) 1964 System
12
+ url: https://github.com/interscript/interscript/files/5180767/BGN_Romanization_Guide_1964_mongolian_1964.pdf
13
+ creation_date:
14
+ confirmation_date:
15
+ description: |
16
+ This system was originated by the PCGN in 1957 and adopted as a
17
+ BGN/PCGN System in 1964. It is intended for use in the romanization of
18
+ geographic names in the "Mongolian People's Republic" but not to romanize
19
+ Mongolian names in adjacent parts of China and the U.S.S.R.
20
+
21
+ notes: |
22
+ - b occurs initially and after л, м, and б.
23
+ - v occurs medially in Mongolian words and initially in foreign words.
24
+ - y occurs only as the second element of diphthongs.
25
+ - k, p, f, and shch occur in foreign words only.
26
+ - "\u2019" occurs only in Russian words.
27
+ - ï occurs only in suffixes to words containing back vowels (a, o, and u).
28
+ - In monosyllables yu or yü depending on pronunciation; in polysyllables yu when followed by a, o, or u, but yü when followed by i, e, ö, or ü.
29
+
30
+ tests:
31
+ - source: Эрдэнэт Сум
32
+ expected: Erdenet Sum
33
+ - source: Эрдэнэт
34
+ expected: Erdenet
35
+ - source: Эрдэнэ
36
+ expected: Erdene
37
+ - source: Шивээговь Сум
38
+ expected: Shiveegovĭ Sum
39
+ - source: Шивээговь
40
+ expected: Shiveegovĭ
41
+ - source: Шарынгол Сум
42
+ expected: Sharïngol Sum
43
+ - source: Шарынгол
44
+ expected: Sharïngol
45
+ - source: Цагааннуур
46
+ expected: Tsagaannuur
47
+ - source: Хонгор Сум
48
+ expected: Hongor Sum
49
+ - source: Хонгор
50
+ expected: Hongor
51
+ - source: Хайлаастай
52
+ expected: Haylaastay
53
+ - source: Түнэл Сум
54
+ expected: Tünel Sum
55
+ - source: Түнэл
56
+ expected: Tünel
57
+ - source: Сүхбаатар
58
+ expected: Sühbaatar
59
+ - source: Сүмбэр Сум
60
+ expected: Sümber Sum
61
+ - source: Сүмбэр
62
+ expected: Sümber
63
+ - source: Сайншанд Сум
64
+ expected: Saynshand Sum
65
+ - source: Сайншанд
66
+ expected: Saynshand
67
+ - source: Орхон Сум
68
+ expected: Orhon Sum
69
+ - source: Орхон
70
+ expected: Orhon
71
+ - source: Нарст
72
+ expected: Narst
73
+ - source: Мөрөн Сум
74
+ expected: Mörön Sum
75
+ - source: Мөрөн
76
+ expected: Mörön
77
+ - source: Зүүнхөвөө
78
+ expected: Dzüünhövöö
79
+ - source: Жаргалант Сум
80
+ expected: Jargalant Sum
81
+ - source: Жаргалант
82
+ expected: Jargalant
83
+ - source: Дархан Сум
84
+ expected: Darhan Sum
85
+ - source: Даланзадгад Сум
86
+ expected: Dalandzadgad Sum
87
+ - source: Даланзадгад
88
+ expected: Dalandzadgad
89
+ - source: Давст Сум
90
+ expected: Davst Sum
91
+ - source: Давст
92
+ expected: Davst
93
+ - source: Говьсүмбэр Сум
94
+ expected: Govĭsümber Sum
95
+ - source: Говь
96
+ expected: Govĭ
97
+ - source: Буга
98
+ expected: Buga
99
+ - source: Бор-Өндөр Сум
100
+ expected: Bor-Öndör Sum
101
+ - source: Бор-Өндөр
102
+ expected: Bor-Öndör
103
+ - source: Баянхонгор
104
+ expected: Bayanhongor
105
+ - source: Баянтал
106
+ expected: Bayantal
107
+ - source: Баяндэлгэр Сум
108
+ expected: Bayandelger Sum
109
+ - source: Баяндэлгэр
110
+ expected: Bayandelger
111
+ - source: Баян-Өндөр Сум
112
+ expected: Bayan-Öndör Sum
113
+ - source: Баруун-Урт Сум
114
+ expected: Baruun-Urt Sum
115
+ - source: Баруун-Урт
116
+ expected: Baruun-Urt
117
+ - source: Архуст
118
+ expected: Arhust
119
+ - source: Арвайхээр Сум
120
+ expected: Arvayheer Sum
121
+ - source: Арвайхээр
122
+ expected: Arvayheer
123
+ - source: Есөнбулаг Сум
124
+ expected: Yösönbulag Sum
125
+ - source: Ерөө Сум
126
+ expected: Yöröö Sum
127
+ - source: Есөнзүйл Сум
128
+ expected: Yösöndzüyl Sum
129
+ - source: Ноён Сум
130
+ expected: Noyon Sum
131
+ - source: Родник Балянгийн-Булак
132
+ expected: Rodnik Balyangiyn-Bulak
133
+ - source: Замын-Үүд Сум
134
+ expected: Dzamïn-Üüd Sum
135
+ - source: Адаацаг Сум
136
+ expected: Adaatsag Sum
137
+ - source: Чандмань Сум
138
+ expected: Chandmanĭ Sum
139
+ - source: Хяргас Сум
140
+ expected: Hyargas Sum
141
+
142
+ map:
143
+ rules:
144
+ - pattern: \u042e(?=[АаОоУу]) # Ю before а, о, or у
145
+ result: "Yu"
146
+ - pattern: \u044e(?=[АаОоУу]) # ю before а, о, or у
147
+ result: "yu"
148
+ - pattern: \u042e(?=[ИиЭэӨөҮү]) # Ю before и, э, ө, or ү
149
+ result: "Yü"
150
+ - pattern: \u044e(?=[ИиЭэӨөҮү]) # ю before и, э, ө, or ү
151
+ result: "yü"
152
+
153
+ characters:
154
+ "А": "A" # \u0410
155
+ "Б": "B" # \u0411
156
+ "В": "V" # \u0412
157
+ "Г": "G" # \u0413
158
+ "Д": "D" # \u0414
159
+ "Е": "Yö" # \u0415
160
+ "Ё": "Yo" # \u0401
161
+ "Ж": "J" # \u0416
162
+ "З": "Dz" # \u0417
163
+ "И": "I" # \u0418
164
+ "Й": "Y" # \u0419
165
+ "К": "K" # \u041a
166
+ "Л": "L" # \u041b
167
+ "М": "M" # \u041c
168
+ "Н": "N" # \u041d
169
+ "О": "O" # \u041e
170
+ "Ө": "Ö" # \u04e8
171
+ "П": "P" # \u041f
172
+ "Р": "R" # \u0420
173
+ "С": "S" # \u0421
174
+ "Т": "T" # \u0422
175
+ "У": "U" # \u0423
176
+ "Ү": "Ü" # \u04ae
177
+ "Ф": "F" # \u0424
178
+ "Х": "H" # \u0425
179
+ "Ц": "Ts" # \u0426
180
+ "Ч": "Ch" # \u0427
181
+ "Ш": "Sh" # \u0428
182
+ "Щ": "Shch" # \u0429
183
+ "Ъ": "\u2019" # \u042a
184
+ "Ы": "Ï" # \u042b
185
+ "Ь": "Ĭ" # \u042c
186
+ "Э": "E" # \u042d
187
+ "Ю": "Yu" # \u042e
188
+ "Я": "Ya" # \u042f
189
+ "а": "a" # \u0430
190
+ "б": "b" # \u0431
191
+ "в": "v" # \u0432
192
+ "г": "g" # \u0433
193
+ "д": "d" # \u0434
194
+ "е": "yö" # \u0435
195
+ "ё": "yo" # \u0451
196
+ "ж": "j" # \u0436
197
+ "з": "dz" # \u0437
198
+ "и": "i" # \u0438
199
+ "й": "y" # \u0439
200
+ "к": "k" # \u043a
201
+ "л": "l" # \u043b
202
+ "м": "m" # \u043c
203
+ "н": "n" # \u043d
204
+ "о": "o" # \u043e
205
+ "ө": "ö" # \u04e9
206
+ "п": "p" # \u043f
207
+ "р": "r" # \u0440
208
+ "с": "s" # \u0441
209
+ "т": "t" # \u0442
210
+ "у": "u" # \u0443
211
+ "ү": "ü" # \u04af
212
+ "ф": "f" # \u0444
213
+ "х": "h" # \u0445
214
+ "ц": "ts" # \u0446
215
+ "ч": "ch" # \u0447
216
+ "ш": "sh" # \u0448
217
+ "щ": "shch" # \u0449
218
+ "ъ": "\u2019" # \u044a
219
+ "ы": "ï" # \u044b
220
+ "ь": "ĭ" # \u044c
221
+ "э": "e" # \u044d
222
+ "ю": "yu" # \u044e
223
+ "я": "ya" # \u044f
@@ -0,0 +1,230 @@
1
+ ---
2
+ authority_id: bgnpcgn
3
+ id: 2020
4
+ language: iso-639-2:nep
5
+ source_script: Deva
6
+ destination_script: Latn
7
+ name: Nepali Romanization, 2020
8
+ url: https://geonames.nga.mil/gns/html/Romanization/ROMANIZATION%20OF%20NEPALI.pdf
9
+ creation_date: 1964
10
+ description: |
11
+ BGN/PCGN 2011 Agreement Romanization of Nepali
12
+ The BGN and the PCGN have adopted the Nepal Survey Department (NSD) system for the
13
+ romanization of Nepali names. This system, below, should be applied to Nepali names for which
14
+ Roman‐script spellings in materials produced by the government of Nepal are not available.
15
+
16
+ notes:
17
+
18
+ - Only the isolated forms of the characters are given in the consonant table. See any grammar of Nepali
19
+ (or other language using the Devanagari alphabet) for variant forms used in conjunct characters.
20
+ - The consonant characters ड and ढ sometimes appear to represent ṛ (cerebral r), e.g., पहाड → pahāṛ
21
+ instead of pahāḍ. At one time they were written with dots below, i.e., as ड़ and ढ़, though this is no
22
+ longer normal practice in Nepali. The romanizations ṛ and ṛh, respectively, are optional for
23
+ documentary purposes if such dots appear in Nepali writing.
24
+ - व , can be romanized as either v or w. This character is primarily
25
+ romanized as v in consonant initial, medial, and final position; however, initial, medial, and final w
26
+ romanizations can occur. The w romanization is a special case which is believed to be dependent on
27
+ dialect, pronunciation, or stress.
28
+ - |
29
+ An inventory of letter‐diacritic combinations, with their Unicode encoding, in addition to the unmodified letters of the basic Roman script is:
30
+ Ṅ (U+1E44) ṅ (U+1E45)
31
+ Ñ (U+00D1) ñ (U+00F1)
32
+ Ṭ (U+1E6C) ṭ (U+1E6D)
33
+ Ḍ (U+1E0C) ḍ (U+1E0D)
34
+ Ṇ (U+1E46) ṇ (U+1E47)
35
+ Ṣ (U+1E62) ṣ (U+1E63)
36
+ Ā (U+0100) ā (U+0101)
37
+ Ī (U+012A) ī (U+012B)
38
+ Ū (U+016A) ū (U+016B)
39
+ Ṛ (U+1E5A) ṛ (U+1E5B)
40
+
41
+ - The Romanization column shows only lowercase forms but, when romanizing, uppercase and lowercase
42
+ Roman letters as appropriate should be used.
43
+
44
+ - |
45
+ ं (anusvara) is rendered by
46
+ ṅ before क, ख, ग, and घ
47
+ ñ before च, छ, ज, and झ
48
+ ṇ before ट, ठ, ड, and ढ
49
+ n before त, थ, द, and ध
50
+ ṁ before य, र, ल, व, श, ष, स and ह
51
+
52
+ tests:
53
+ - source: "लेखन"
54
+ expected: "lekhn"
55
+ - source: "मुद्रा"
56
+ expected: "mudarā"
57
+ - source: "प्रशंसा"
58
+ expected: "parshṃsā" # note 5 rule checking
59
+ - source: "अंक"
60
+ expected: "aṅk" # note 5 rule checking
61
+ - source: "नेकपाले स्थगित स्थायी कमिटीको बैठक भदौ गते बोलाउने भएको"
62
+ expected: "nekpāle sathgit sathāyī kmiṭīko baiṭhk bhdau gte bolāune bheko"
63
+ - source: "न घर रह्यो, न परिवार"
64
+ expected: "n ghr rhayo, n privār"
65
+ - source: "ढोरपाटनमा भुजीखोला बाढीपहिरोले अभिभावक गुमाएका बालबालिकाको बिचल्ली"
66
+ expected: "ḍhorpāṭnmā bhujīkholā bāḍhīphirole abhibhāvk gumāekā bālbālikāko bichlalī"
67
+ - source: "सुस्मिताका काका हेमबहादुर र काकीलाई पनि पहिरोले बगायो"
68
+ expected: "susamitākā kākā hembhādur r kākīlāī pni phirole bgāyo"
69
+ - source: "संविधान जारी भएसँगै सार्वजनिक प्रशासनमा नयाँ उत्साह आउने अपेक्षा थियो"
70
+ expected: "sṃvidhān jārī bhes~gai sāravjnik parshāsnmā nyā~ utasāh āune apekṣā thiyo"
71
+ - source: "देशमा कोरोना संक्रमित र मृतकको संख्या हरेक दिन बढ्दो छ"
72
+ expected: "deshmā koronā sṅkarmit r mṛitkko sṅkhayā hrek din bḍhado chh"
73
+ - source: "गाउँपालिकाका अध्यक्ष टिका गुरुङका अनुसार विष्णुदासलाई राजुले सुत्नका लागि बेलुका साथी लगेका थिए"
74
+ expected: "gāu~pālikākā adhaykṣ ṭikā guruṅkā anusār viṣaṇudāslāī rājule sutankā lāgi belukā sāthī lgekā thie"
75
+ - source: "यो आयोजना गाउँपालिकाको केन्द्र तेल्लोकमा पर्छ"
76
+ expected: "yo āyojnā gāu~pālikāko kenadar telalokmā prachh"
77
+ - source: "सुस्मिताका काका हेमबहादुर र काकीलाई पनि पहिरोले बगायो"
78
+ expected: "susamitākā kākā hembhādur r kākīlāī pni phirole bgāyo"
79
+ - source: "चैत पहिलो साता घर आएका उनी लकडाउन भएपछि यतै रोकिए"
80
+ expected: "chait philo sātā ghr āekā unī lkḍāun bhepchhi ytai rokie"
81
+ - source: "काम गर्न जानेको हकमा रोजगारदाता कम्पनीको पत्रसँगै वडा र जिल्ला प्रशासनको सिफारिस अनिवार्य गरिएको छ"
82
+ expected: "kām gran jāneko hkmā rojgārdātā kmapnīko ptrs~gai vḍā r jilalā parshāsnko siphāris anivāray grieko chh"
83
+ - source: "दुःख"
84
+ expected: "duḥkh"
85
+ - source: "निकुञ्जको स्थानीय पोस्टका कर्मचारी पनि त्यहीँ थिए"
86
+ expected: "nikuñajko sathānīy posaṭkā kramchārī pni tayhī~ thie"
87
+ - source: "युद्धकालको मनोविज्ञान"
88
+ expected: "yudadhkālko mnovijñān"
89
+ - source: "जर्मन वायुसेवाको आक्रमणमा दुई लाख पचास हजार मानिसको ज्यान जानसक्ने र करिब ३० देखि ४० लाख मान्छे विस्थापित हुने अनुमान बेलायत सरकारको थियो"
90
+ expected: "jramn vāyusevāko ākarmṇmā duī lākh pchās hjār mānisko jayān jānskane r krib 30 dekhi 40 lākh mānachhe visathāpit hune anumān belāyt srkārko thiyo"
91
+ - source: "युद्ध"
92
+ expected: "yudadh"
93
+ - source: "कोरोनासँग जम्काभेट"
94
+ expected: "koronās~g jmakābheṭ"
95
+ - source: "संक्रमित"
96
+ expected: "sṅkarmit"
97
+ - source: "स्वयम्"
98
+ expected: "savyma"
99
+ - source: "संख्या"
100
+ expected: "sṅkhayā"
101
+ - source: "गौरीटारस्थित रंगशाला"
102
+ expected: "gaurīṭārsathit rṅgshālā"
103
+
104
+ map:
105
+
106
+ rules:
107
+ # note[5]
108
+ - pattern: \u0902(?=[कखगघ]) # ं before क, ख, ग, and घ
109
+ result: ṅ
110
+ - pattern: \u0902(?=[चछजझ]) # ं before च, छ, ज, and झ
111
+ result: ñ
112
+ - pattern: \u0902(?=[टठडढ]) # ं before ट, ठ, ड, and ढ
113
+ result: ṇ
114
+ - pattern: \u0902(?=[तथदध]) # ं before त, थ, द, and ध
115
+ result: n
116
+
117
+ characters:
118
+
119
+ # Vowels and Diphthongs
120
+
121
+ 'अ': 'a'
122
+ 'आ': 'ā'
123
+ 'इ': 'i'
124
+ 'ई': 'ī'
125
+ 'उ': 'u'
126
+ 'ऊ': 'ū'
127
+ 'ऋ': 'ṛi'
128
+ 'ॠ': 'rī'
129
+ 'ए': 'e'
130
+ 'ऐ': 'ai'
131
+ 'ओ': 'o'
132
+ 'औ': 'au'
133
+
134
+ # Medials # Needed for connecting consonants
135
+
136
+ 'ा': "ā"
137
+ 'ि': "i"
138
+ 'ी': "ī"
139
+ 'ु': "u"
140
+ 'ू': "ū"
141
+ 'ृ': "ṛi"
142
+ 'ॄ': "rī"
143
+ 'े': "e"
144
+ 'ै': "ai"
145
+ 'ो': "o"
146
+ 'ौ': "au"
147
+
148
+
149
+ # Consonants (see Note 1)
150
+
151
+ # Gutturals
152
+ 'क': 'k'
153
+ 'ख': 'kh'
154
+ 'ग': 'g'
155
+ 'घ': 'gh'
156
+ 'ङ': 'ṅ'
157
+
158
+ # Palatals
159
+ 'च': 'ch'
160
+ 'छ': 'chh'
161
+ 'ज': 'j'
162
+ 'झ': 'jh'
163
+ 'ञ': 'ñ'
164
+
165
+ # Cerebrals
166
+ 'ट': 'ṭ'
167
+ 'ठ': 'ṭh'
168
+ 'ड': 'ḍ'
169
+ 'ढ': 'ḍh'
170
+ 'ण': 'ṇ'
171
+
172
+ # Dentals
173
+ 'त': 't'
174
+ 'थ': 'th'
175
+ 'द': 'd'
176
+ 'ध': 'dh'
177
+ 'न': 'n'
178
+
179
+ # Labials
180
+ 'प': 'p'
181
+ 'फ': 'ph'
182
+ 'ब': 'b'
183
+ 'भ': 'bh'
184
+ 'म': 'm'
185
+
186
+ # Semivowels
187
+ 'य': 'y'
188
+ 'र': 'r'
189
+ 'ल': 'l'
190
+ 'व': 'v' # or w [Note#3]
191
+
192
+ # Sibilants
193
+ 'श': 'sh'
194
+ 'ष': 'ṣ'
195
+ 'स': 's'
196
+ 'क्ष': 'kṣ'
197
+ 'त्र': 'tr'
198
+ 'ज्ञ' : 'jñ'
199
+
200
+ # Aspirate
201
+ 'ह': 'h'
202
+
203
+ # Anusvāra
204
+ 'ं': 'ṃ'
205
+
206
+ # Bisarga
207
+ 'ः': 'ḥ'
208
+
209
+ # Anunāsika
210
+ 'ँ': '~'
211
+
212
+ 'ॅ': 'r'
213
+
214
+ # halanta
215
+ '्': 'a'
216
+
217
+ # Abagraha
218
+ 'ऽ': '’' # (apostrophe)
219
+
220
+ # Numerals / सङ्ख्या
221
+ '०': '0'
222
+ '१': '1'
223
+ '२': '2'
224
+ '३': '3'
225
+ '४': '4'
226
+ '५': '5'
227
+ '६': '6'
228
+ '७': '7'
229
+ '८': '8'
230
+ '९': '9'