interscript 0.1.2 → 0.1.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (261) hide show
  1. checksums.yaml +4 -4
  2. data/README.adoc +250 -17
  3. data/lib/g2pwrapper.py +34 -0
  4. data/lib/interscript.rb +142 -20
  5. data/lib/interscript/command.rb +28 -0
  6. data/lib/interscript/fs.rb +69 -0
  7. data/lib/interscript/mapping.rb +142 -0
  8. data/lib/interscript/opal.rb +57 -0
  9. data/lib/interscript/opal/entrypoint.rb +12 -0
  10. data/lib/interscript/opal/map_translate.rb +7 -0
  11. data/lib/interscript/opal/maps.js.erb +10 -0
  12. data/lib/interscript/version.rb +1 -1
  13. data/lib/model-7 +0 -0
  14. data/lib/tha-pt-b-7 +0 -0
  15. data/maps/acadsin-zho-Hani-Latn-2002.yaml +38916 -0
  16. data/maps/alalc-amh-Ethi-Latn-1997.yaml +513 -0
  17. data/maps/alalc-amh-Ethi-Latn-2011.yaml +138 -0
  18. data/maps/alalc-ara-Arab-Latn-1997.yaml +1287 -0
  19. data/maps/alalc-asm-Deva-Latn-1997.yaml +165 -0
  20. data/maps/alalc-asm-Deva-Latn-2012.yaml +40 -0
  21. data/maps/alalc-aze-Cyrl-Latn-1997.yaml +145 -0
  22. data/maps/alalc-bel-Cyrl-Latn-1997.yaml +129 -0
  23. data/maps/alalc-ben-Beng-Latn-2017.yaml +130 -0
  24. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +98 -0
  25. data/maps/alalc-ell-Grek-Latn-1997.yaml +628 -0
  26. data/maps/alalc-ell-Grek-Latn-2010.yaml +626 -0
  27. data/maps/alalc-guj-Gujr-Latn-1997.yaml +266 -0
  28. data/maps/alalc-guj-Gujr-Latn-2011.yaml +64 -0
  29. data/maps/alalc-hin-Deva-Latn-1997.yaml +211 -0
  30. data/maps/alalc-hin-Deva-Latn-2011.yaml +47 -0
  31. data/maps/alalc-kat-Geok-Latn-1997.yaml +111 -0
  32. data/maps/alalc-kat-Geor-Latn-1997.yaml +150 -0
  33. data/maps/alalc-kor-Hang-Latn-1997.yaml +98 -0
  34. data/maps/alalc-mal-Mlym-Latn-1997.yaml +303 -0
  35. data/maps/alalc-mal-Mlym-Latn-2012.yaml +73 -0
  36. data/maps/alalc-mar-Deva-Latn-1997.yaml +189 -0
  37. data/maps/alalc-mar-Deva-Latn-2011.yaml +45 -0
  38. data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +114 -0
  39. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +103 -0
  40. data/maps/alalc-mon-Cyrl-Latn-1997.yaml +220 -0
  41. data/maps/alalc-pan-Guru-Latn-1997.yaml +256 -0
  42. data/maps/alalc-pan-Guru-Latn-2011.yaml +78 -0
  43. data/maps/alalc-per-Arab-Latn-1997.yaml +375 -0
  44. data/maps/alalc-pli-Deva-Latn-2012.yaml +144 -0
  45. data/maps/alalc-pra-Deva-Latn-2012.yaml +47 -0
  46. data/maps/alalc-rus-Cyrl-Latn-1997.yaml +225 -0
  47. data/maps/alalc-rus-Cyrl-Latn-2012.yaml +162 -0
  48. data/maps/alalc-san-Deva-Latn-2012.yaml +172 -0
  49. data/maps/alalc-sin-Sinh-Latn-1997.yaml +292 -0
  50. data/maps/alalc-sin-Sinh-Latn-2011.yaml +71 -0
  51. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +118 -0
  52. data/maps/alalc-srp-Cyrl-Latn-2013.yaml +135 -0
  53. data/maps/alalc-tam-Taml-Latn-1997.yaml +62 -0
  54. data/maps/alalc-tam-Taml-Latn-2011.yaml +58 -0
  55. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +145 -0
  56. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +16 -0
  57. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +283 -0
  58. data/maps/{bas-rus-Cyrl-Latn-bss.yaml → bas-rus-Cyrl-Latn-2017-bss.yaml} +58 -33
  59. data/maps/{bas-rus-Cyrl-Latn-oss.yaml → bas-rus-Cyrl-Latn-2017-oss.yaml} +55 -35
  60. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +292 -0
  61. data/maps/bgn-kor-Hang-Latn-1943.yaml +35 -0
  62. data/maps/bgn-kor-Kore-Latn-1943.yaml +31 -0
  63. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +208 -0
  64. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +208 -0
  65. data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +532 -0
  66. data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +596 -0
  67. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +2 -3
  68. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +104 -0
  69. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +188 -0
  70. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +289 -0
  71. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +119 -0
  72. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +15 -65
  73. data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +184 -0
  74. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +705 -0
  75. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +23 -0
  76. data/maps/{bgnpcgn-per-Arab-Latn-1956.yaml → bgnpcgn-fas-Arab-Latn-1956.yaml} +5 -2
  77. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +257 -0
  78. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +131 -0
  79. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +42 -0
  80. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +253 -0
  81. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +48 -0
  82. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +48 -0
  83. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +163 -0
  84. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +190 -0
  85. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +223 -0
  86. data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +230 -0
  87. data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +336 -0
  88. data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +639 -0
  89. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +459 -0
  90. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +168 -0
  91. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +150 -65
  92. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +170 -0
  93. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +220 -0
  94. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +240 -0
  95. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +80 -4
  96. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +119 -0
  97. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +127 -0
  98. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +82 -0
  99. data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +7456 -0
  100. data/maps/bis-asm-Beng-Latn-13194-1991.yaml +159 -0
  101. data/maps/bis-ben-Beng-Latn-13194-1991.yaml +156 -0
  102. data/maps/bis-dev-Deva-Latn-13194-1991.yaml +184 -0
  103. data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +181 -0
  104. data/maps/bis-knd-Knda-Latn-13194-1991.yaml +173 -0
  105. data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +176 -0
  106. data/maps/bis-ori-Orya-Latn-13194-1991.yaml +160 -0
  107. data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +175 -0
  108. data/maps/bis-tel-Telu-Latn-13194-1991.yaml +170 -0
  109. data/maps/bis-tml-Taml-Latn-13194-1991.yaml +155 -0
  110. data/maps/by-bel-Cyrl-Latn-1998.yaml +172 -0
  111. data/maps/by-bel-Cyrl-Latn-2007.yaml +115 -0
  112. data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +899 -0
  113. data/maps/din-hin-Deva-Latn-33904-2018.yaml +100 -0
  114. data/maps/din-kat-Geor-Latn-32707-2010.yaml +145 -0
  115. data/maps/din-mar-Deva-Latn-33904-2018.yaml +84 -0
  116. data/maps/din-nep-Deva-Latn-33904-2018.yaml +119 -0
  117. data/maps/din-pli-Deva-Latn-33904-2018.yaml +75 -0
  118. data/maps/din-pra-Deva-Latn-33904-2018.yaml +63 -0
  119. data/maps/din-san-Deva-Latn-33904-2018.yaml +338 -0
  120. data/maps/din-tam-Taml-Latn-33903-2016.yaml +213 -0
  121. data/maps/dos-nep-Deva-Latn-1997.yaml +47 -0
  122. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +684 -0
  123. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +680 -0
  124. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +19 -0
  125. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +31 -0
  126. data/maps/ggg-kat-Geor-Latn-2002.yaml +92 -0
  127. data/maps/gki-bel-Cyrl-Latn-1992.yaml +33 -0
  128. data/maps/gki-bel-Cyrl-Latn-2000.yaml +201 -0
  129. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +190 -0
  130. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +157 -0
  131. data/maps/hk-yue-Hani-Latn-1888.yaml +38497 -0
  132. data/maps/icao-bel-Cyrl-Latn-9303.yaml +109 -98
  133. data/maps/icao-bul-Cyrl-Latn-9303.yaml +2 -7
  134. data/maps/{icao-per-Arab-Latn-9303.yaml → icao-fas-Arab-Latn-9303.yaml} +6 -8
  135. data/maps/icao-heb-Hebr-Latn-9303.yaml +119 -125
  136. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +2 -3
  137. data/maps/icao-rus-Cyrl-Latn-9303.yaml +2 -4
  138. data/maps/icao-srp-Cyrl-Latn-9303.yaml +2 -3
  139. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +2 -4
  140. data/maps/iso-ara-Arab-Latn-233-1984.yaml +323 -0
  141. data/maps/iso-asm-Beng-Latn-15919-2001.yaml +75 -0
  142. data/maps/iso-ben-Beng-Latn-15919-2001.yaml +175 -0
  143. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +613 -0
  144. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +44 -0
  145. data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +220 -0
  146. data/maps/iso-hin-Deva-Latn-15919-2001.yaml +87 -0
  147. data/maps/iso-inc-Deva-Latn-15919-2001.yaml +61 -0
  148. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +66 -0
  149. data/maps/iso-kan-Knda-Latn-15919-2001.yaml +220 -0
  150. data/maps/iso-kat-Geor-Latn-9984-1996.yaml +145 -0
  151. data/maps/iso-kor-Hang-Latn-1996-method1.yaml +240 -0
  152. data/maps/iso-kor-Hang-Latn-1996-method2.yaml +226 -0
  153. data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +281 -0
  154. data/maps/iso-mar-Deva-Latn-15919-2001.yaml +75 -0
  155. data/maps/iso-nep-Deva-Latn-15919-2001.yaml +87 -0
  156. data/maps/iso-ori-Orya-Latn-15919-2001.yaml +193 -0
  157. data/maps/iso-pan-Guru-Latn-15919-2001.yaml +222 -0
  158. data/maps/iso-pli-Beng-Latn-15919-2001.yaml +73 -0
  159. data/maps/iso-pli-Deva-Latn-15919-2001.yaml +74 -0
  160. data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +219 -0
  161. data/maps/iso-pli-Thai-Latn-15919-2001.yaml +55 -0
  162. data/maps/iso-pra-Deva-Latn-15919-2001.yaml +59 -0
  163. data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +366 -0
  164. data/maps/{iso-rus-Cyrl-Latn-iso9.yaml → iso-rus-Cyrl-Latn-9-1995.yaml} +4 -6
  165. data/maps/iso-san-Deva-Latn-15919-2001.yaml +220 -0
  166. data/maps/iso-tam-Taml-Latn-15919-2001.yaml +159 -0
  167. data/maps/iso-tel-Telu-Latn-15919-2001.yaml +220 -0
  168. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +109 -0
  169. data/maps/kp-kor-Hang-Latn-2002.yaml +909 -0
  170. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +44820 -0
  171. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +411 -0
  172. data/maps/mns-mon-Cyrl-Latn-5217-2012.yaml +163 -0
  173. data/maps/mns-mon-Latn-Cyrl-5217-2012.yaml +200 -0
  174. data/maps/moct-kor-Hang-Latn-2000.yaml +807 -0
  175. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +541 -0
  176. data/maps/mvd-bel-Cyrl-Latn-2008.yaml +225 -0
  177. data/maps/mvd-bel-Cyrl-Latn-2010.yaml +63 -0
  178. data/maps/mvd-rus-Cyrl-Latn-2008.yaml +109 -0
  179. data/maps/mvd-rus-Cyrl-Latn-2010.yaml +37 -0
  180. data/maps/odni-ara-Arab-Latn-2015.yaml +425 -0
  181. data/maps/odni-aze-Cyrl-Latn-2015.yaml +144 -0
  182. data/maps/odni-bel-Cyrl-Latn-2015.yaml +148 -0
  183. data/maps/odni-bul-Cyrl-Latn-2015.yaml +96 -0
  184. data/maps/odni-che-Cyrl-Latn-2015.yaml +169 -0
  185. data/maps/odni-fas-Arab-Latn-2015.yaml +406 -0
  186. data/maps/odni-hin-Deva-Latn-2015.yaml +258 -0
  187. data/maps/odni-kat-Geor-Latn-2015.yaml +87 -0
  188. data/maps/odni-kaz-Cyrl-Latn-2015.yaml +148 -0
  189. data/maps/odni-kir-Cyrl-Latn-2015.yaml +136 -0
  190. data/maps/odni-kor-Hang-Latn-2015.yaml +375 -0
  191. data/maps/odni-mkd-Cyrl-Latn-2015.yaml +122 -0
  192. data/maps/odni-per-Arab-Latn-2015.yaml +228 -0
  193. data/maps/odni-rus-Cyrl-Latn-2015.yaml +77 -0
  194. data/maps/odni-srp-Cyrl-Latn-2015.yaml +129 -0
  195. data/maps/odni-tat-Cyrl-Latn-2015.yaml +142 -0
  196. data/maps/odni-tgk-Cyrl-Latn-2015.yaml +148 -0
  197. data/maps/odni-uig-Cyrl-Latn-2015.yaml +138 -0
  198. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +157 -0
  199. data/maps/odni-urd-Arab-Latn-2015.yaml +221 -0
  200. data/maps/odni-uzb-Cyrl-Latn-2015.yaml +166 -0
  201. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +90 -0
  202. data/maps/royin-tha-Thai-Latn-1968.yaml +183 -0
  203. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +180 -0
  204. data/maps/royin-tha-Thai-Latn-1999.yaml +80 -0
  205. data/maps/{cn-chn-Hans-Latn-pinyin.yaml → sac-zho-Hans-Latn-1979.yaml} +11 -8
  206. data/maps/sasm-mon-Mong-Latn-general-1978.yaml +389 -0
  207. data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +354 -0
  208. data/maps/ses-ara-Arab-Latn-1930.yaml +283 -0
  209. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +222 -0
  210. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +197 -0
  211. data/maps/ua-ukr-Cyrl-Latn-2007.yaml +75 -0
  212. data/maps/ua-ukr-Cyrl-Latn-2010.yaml +192 -0
  213. data/maps/un-amh-Ethi-Latn-2016.yaml +602 -0
  214. data/maps/un-ara-Arab-Latn-1971.yaml +139 -0
  215. data/maps/un-ara-Arab-Latn-1972.yaml +159 -0
  216. data/maps/un-ara-Arab-Latn-2017.yaml +420 -0
  217. data/maps/un-bel-Cyrl-Latn-2007.yaml +114 -0
  218. data/maps/un-ben-Beng-Latn-2016.yaml +534 -0
  219. data/maps/un-ell-Grek-Latn-1987-phonetic.yaml +780 -0
  220. data/maps/un-ell-Grek-Latn-1987-tl.yaml +31 -0
  221. data/maps/un-ell-Grek-Latn-1987-ts.yaml +19 -0
  222. data/maps/un-hin-Deva-Latn-2016.yaml +222 -0
  223. data/maps/un-mar-Deva-Latn-2016.yaml +91 -0
  224. data/maps/un-mon-Mong-Latn-general-2013.yaml +264 -0
  225. data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +264 -0
  226. data/maps/un-nep-Deva-Latn-1972.yaml +350 -0
  227. data/maps/un-nep-Deva-Latn-2013.yaml +74 -0
  228. data/maps/un-rus-Cyrl-Latn-1987.yaml +166 -0
  229. data/maps/un-ukr-Cyrl-Latn-1998.yaml +53 -0
  230. data/maps/un-ukr-Cyrl-Latn-2012.yaml +162 -0
  231. data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +221 -0
  232. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +406 -0
  233. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +386 -0
  234. data/maps/var-kor-Hang-Hang-jamo.yaml +11193 -0
  235. data/maps/var-kor-Hang-Latn-mr-1939.yaml +1054 -0
  236. data/maps/var-kor-Kore-Hang-2013.yaml +59754 -0
  237. data/maps/var-kor-Kore-Latn-mr-1939.yaml +36 -0
  238. data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +43 -0
  239. data/maps/var-mon-Mong-Latn-1930.yaml +102 -0
  240. data/maps/var-mon-Mong-Latn-lessing.yaml +272 -0
  241. data/maps/var-mon-Mong-Latn-vpmc.yaml +274 -0
  242. data/maps/var-pra-Deva-Latn-iast-1912.yaml +30 -0
  243. data/maps/var-san-Deva-Latn-iast-1912.yaml +149 -0
  244. data/maps/var-tha-Thai-Thai-phonemic.yaml +59 -0
  245. data/maps/var-tha-Thai-Zsym-ipa.yaml +301 -0
  246. data/maps/var-zho-Hani-Latn-wd-1979.yaml +38912 -0
  247. data/spec/interscript/filenames_spec.rb +384 -0
  248. data/spec/interscript/mapping_spec.rb +42 -0
  249. data/spec/interscript_spec.rb +23 -5
  250. data/spec/spec_helper.rb +3 -1
  251. metadata +364 -34
  252. data/bin/interscript +0 -20
  253. data/bin/rspec +0 -29
  254. data/maps/bgnpcgn-chn-Hans-Latn-pinyin.yaml +0 -7503
  255. data/maps/historic-jpn-Hrkt-Latn-hepburn.yaml +0 -336
  256. data/maps/icao-gre-Grek-Latn-9303.yaml +0 -101
  257. data/maps/mext-jpn-Hrkt-Latn-hepburn.yaml +0 -330
  258. data/maps/mext-jpn-Hrkt-Latn-kunrei.yaml +0 -308
  259. data/maps/un-jpn-Hrkt-Latn-hepburn.yaml +0 -313
  260. data/maps/un-jpn-Hrkt-Latn-kunrei.yaml +0 -354
  261. data/maps/un-mon-Mong-Latn-2013.yaml +0 -80
@@ -0,0 +1,75 @@
1
+ ---
2
+ authority_id: din
3
+ id: 33904-2018
4
+ language: iso-639-2:pli
5
+ source_script: Deva
6
+ destination_script: Latn
7
+ name: "DIN 33904:2018-10 Information and documentation - Romanization Devanagari, Pali"
8
+ url: https://www.beuth.de/en/standard/din-33904/293049024
9
+ creation_date: 2018
10
+ description: |
11
+ Pali system.
12
+
13
+ This standard specifies the transliteration of Devanāgarī characters into Latin letters for all languages written in that script.
14
+ It is suitable for any application.
15
+
16
+ notes:
17
+ - |
18
+ Vowels:
19
+ The Ardhacandra ॅ is often used to denote English vowels:
20
+ EXAMPLE
21
+ बॅट bêṭa (bat)
22
+ डॉक्टर ḍôkṭara (doctor)
23
+ - |
24
+ Consonants:
25
+
26
+ Since Devanāgarī is a syllabic script, an -a is inherent in each consonant.
27
+ It is always written in transliteration, including in final position.
28
+ EXAMPLE 1
29
+ पुस्तक pustaka
30
+
31
+ A stroke under the consonant, the so-called Virāma, indicates in the Devanāgarī script that the inherent -a does not apply.
32
+ EXAMPLE 2
33
+ वाक् vāk
34
+
35
+ The anusvāra is always represented with -ṃ-.
36
+ EXAMPLE 3
37
+ संस्करण saṃskaraṇa
38
+
39
+ Before k, kh, g, gh, c, ch, j, jh, ṭ, ṭh, ḍ, ḍh, t, th, d, dh, p, ph, b, bh, the anusvāra is transformed into the corresponding class nasal.
40
+ EXAMPLE 4
41
+ कंघी kaṃghī becomes kaṅghī
42
+ पंजाबी paṃjābī becomes pañjābī
43
+ पंडित paṃḍita becomes paṇḍita
44
+ संधी saṃdhī becomes sandhī
45
+ दिसंबर disaṃbara becomes disambara
46
+
47
+ Anunāsika or Candrabindu signals the nasalization of vowels
48
+
49
+ EXAMPLE 5
50
+ माँ māṁ
51
+
52
+ tests:
53
+ - source: "तेन खो पन समयेन वेसालिया अविदूरे कलन्दगामो नाम अत्थि"
54
+ expected: "tena kho pana samayena vesāliyā avidūre kalandagāmo nāma atthi"
55
+ - source: "तत्थ सुदिन्‍नो नाम कलन्दपुत्तो सेट्ठिपुत्तो होति"
56
+ expected: "tattha sudinno nāma kalandaputto seṭṭhiputto hoti"
57
+ - source: "अथ खो सुदिन्‍नो कलन्दपुत्तो सम्बहुलेहि"
58
+ expected: "atha kho sudinno kalandaputto sambahulehi"
59
+ - source: "तथा चतुर्भिः पुरुषः परीक्ष्यते त्यागेन शीलेन गुणेन कर्मणा"
60
+ expected: "tathā caturbhiḥ puruṣaḥ parīkṣyate tyāgena śīlena guṇena karmaṇā"
61
+ - source: "अथ खो सुदिन्‍नो कलन्दपुत्तो अचिरवुट्ठिताय परिसाय येन भगवा तेनुपसङ्कमि; उपसङ्कमित्वा भगवन्तं अभिवादेत्वा एकमन्तं निसीदि"
62
+ expected: "atha kho sudinno kalandaputto aciravuṭṭhitāya parisāya yena bhagavā tenupasaṅkami; upasaṅkamitvā bhagavantaṃ abhivādetvā ekamantaṃ nisīdi"
63
+ - source: "अथ खो सुदिन्‍नस्स कलन्दपुत्तस्स मातापितरो सुदिन्‍नं कलन्दपुत्तं एतदवोचुं"
64
+ expected: "atha kho sudinnassa kalandaputtassa mātāpitaro sudinnaṃ kalandaputtaṃ etadavocuṃ"
65
+ - source: "त्वं खोसि, तात सुदिन्‍न, अम्हाकं एकपुत्तको पियो मनापो सुखेधितो सुखपरिहतो"
66
+ expected: "tvaṃ khosi, tāta sudinna, amhākaṃ ekaputtako piyo manāpo sukhedhito sukhaparihato"
67
+ - source: "न त्वं, तात सुदिन्‍न, किञ्‍चि दुक्खस्स जानासि"
68
+ expected: "na tvaṃ, tāta sudinna, kiñci dukkhassa jānāsi"
69
+ - source: "अनुञ्‍ञातोम्हि किर मातापितूहि अगारस्मा अनगारियं पब्बज्‍जाया’’ति, हट्ठो उदग्गो पाणिना गत्तानि परिपुञ्छन्तो वुट्ठासि"
70
+ expected: "anuññātomhi kira mātāpitūhi agārasmā anagāriyaṃ pabbajjāyā’’ti, haṭṭho udaggo pāṇinā gattāni paripuñchanto vuṭṭhāsi"
71
+
72
+
73
+ map:
74
+
75
+ inherit: 'din-san-Deva-Latn-33904-2018'
@@ -0,0 +1,63 @@
1
+ ---
2
+ authority_id: din
3
+ id: 33904-2018
4
+ language: iso-639-2:pra
5
+ source_script: Deva
6
+ destination_script: Latn
7
+ name: "DIN 33904:2018-10 Information and documentation - Romanization Devanagari, Prakrit"
8
+ url: https://www.beuth.de/en/standard/din-33904/293049024
9
+ creation_date: 2018
10
+ description: |
11
+ Prakrit system.
12
+
13
+ This standard specifies the transliteration of Devanāgarī characters into Latin letters for all languages written in that script.
14
+ It is suitable for any application.
15
+
16
+ notes:
17
+ - |
18
+ Vowels:
19
+ The Ardhacandra ॅ is often used to denote English vowels:
20
+ EXAMPLE
21
+ बॅट bêṭa (bat)
22
+ डॉक्टर ḍôkṭara (doctor)
23
+ - |
24
+ Consonants:
25
+
26
+ Since Devanāgarī is a syllabic script, an -a is inherent in each consonant.
27
+ It is always written in transliteration, including in final position.
28
+ EXAMPLE 1
29
+ पुस्तक pustaka
30
+
31
+ A stroke under the consonant, the so-called Virāma, indicates in the Devanāgarī script that the inherent -a does not apply.
32
+ EXAMPLE 2
33
+ वाक् vāk
34
+
35
+ The anusvāra is always represented with -ṃ-.
36
+ EXAMPLE 3
37
+ संस्करण saṃskaraṇa
38
+
39
+ Before k, kh, g, gh, c, ch, j, jh, ṭ, ṭh, ḍ, ḍh, t, th, d, dh, p, ph, b, bh, the anusvāra is transformed into the corresponding class nasal.
40
+ EXAMPLE 4
41
+ कंघी kaṃghī becomes kaṅghī
42
+ पंजाबी paṃjābī becomes pañjābī
43
+ पंडित paṃḍita becomes paṇḍita
44
+ संधी saṃdhī becomes sandhī
45
+ दिसंबर disaṃbara becomes disambara
46
+
47
+ Anunāsika or Candrabindu signals the nasalization of vowels
48
+
49
+ EXAMPLE 5
50
+ माँ māṁ
51
+
52
+ tests:
53
+ - source: "सृष्टिस्थितिविनाशानां शक्तिभूते सनातनि"
54
+ expected: "sṛṣṭisthitivināśānāṃ śaktibhūte sanātani"
55
+ - source: "गुणाश्रये गुणमये नारायणि नमोऽस्तु ते"
56
+ expected: "guṇāśraye guṇamaye nārāyaṇi namo’stu te"
57
+ - source: "तेन समयेन बुद्धो भगवा सावत्थियं विहरति जेतवने अनाथपिण्डिकस्स आरामे"
58
+ expected: "tena samayena buddho bhagavā sāvatthiyaṃ viharati jetavane anāthapiṇḍikassa ārāme"
59
+
60
+
61
+ map:
62
+
63
+ inherit: 'din-san-Deva-Latn-33904-2018'
@@ -0,0 +1,338 @@
1
+ ---
2
+ authority_id: din
3
+ id: 33904-2018
4
+ language: iso-639-2:san
5
+ source_script: Deva
6
+ destination_script: Latn
7
+ name: "DIN 33904:2018-10 Information and documentation - Romanization Devanagari, Sanskrit"
8
+ url: https://www.beuth.de/en/standard/din-33904/293049024
9
+ creation_date: 2018
10
+ description: |
11
+ Sanskrit system.
12
+
13
+ This standard specifies the transliteration of Devanāgarī characters into Latin letters for all languages written in that script.
14
+ It is suitable for any application.
15
+
16
+ notes:
17
+ - |
18
+ Vowels:
19
+ The Ardhacandra ॅ is often used to denote English vowels:
20
+ EXAMPLE
21
+ बॅट bêṭa (bat)
22
+ डॉक्टर ḍôkṭara (doctor)
23
+ - |
24
+ Consonants:
25
+
26
+ Since Devanāgarī is a syllabic script, an -a is inherent in each consonant.
27
+ It is always written in transliteration, including in final position.
28
+ EXAMPLE 1
29
+ पुस्तक pustaka
30
+
31
+ A stroke under the consonant, the so-called Virāma, indicates in the Devanāgarī script that the inherent -a does not apply.
32
+ EXAMPLE 2
33
+ वाक् vāk
34
+
35
+ The anusvāra is always represented with -ṃ-.
36
+ EXAMPLE 3
37
+ संस्करण saṃskaraṇa
38
+
39
+ Before k, kh, g, gh, c, ch, j, jh, ṭ, ṭh, ḍ, ḍh, t, th, d, dh, p, ph, b, bh, the anusvāra is transformed into the corresponding class nasal.
40
+ EXAMPLE 4
41
+ कंघी kaṃghī becomes kaṅghī
42
+ पंजाबी paṃjābī becomes pañjābī
43
+ पंडित paṃḍita becomes paṇḍita
44
+ संधी saṃdhī becomes sandhī
45
+ दिसंबर disaṃbara becomes disambara
46
+
47
+ Anunāsika or Candrabindu signals the nasalization of vowels
48
+
49
+ EXAMPLE 5
50
+ माँ māṁ
51
+
52
+ tests:
53
+ - source: "पुस्तक"
54
+ expected: "pustaka"
55
+ - source: "बॅट"
56
+ expected: "bêṭa"
57
+ - source: "वाक्"
58
+ expected: "vāk"
59
+ - source: "पंजाबी"
60
+ expected: "pañjābī"
61
+ - source: "डॉक्टर"
62
+ expected: "ḍôkṭara"
63
+ - source: "पंडित"
64
+ expected: "paṇḍita"
65
+ - source: "संधी"
66
+ expected: "sandhī"
67
+ - source: "दिसंबर"
68
+ expected: "disambara"
69
+ - source: "संसकरण"
70
+ expected: "saṃsakaraṇa"
71
+ - source: "माँ"
72
+ expected: "māṁ"
73
+ - source: "शुभाशुभपरित्यागी भक्तिमान्यः स मे प्रियः"
74
+ expected: "śubhāśubhaparityāgī bhaktimānyaḥ sa me priyaḥ"
75
+ - source: "सत्य -सत्यमेवेश्वरो लोके सत्ये धर्मः सदाश्रितः"
76
+ expected: "satya -satyameveśvaro loke satye dharmaḥ sadāśritaḥ"
77
+ - source: "सत्यमूलनि सर्वाणि सत्यान्नास्ति परं पदम्"
78
+ expected: "satyamūlani sarvāṇi satyānnāsti paraṃ padam"
79
+ - source: "पिता माताग्निरात्मा च गुरुश्च भरतर्षभ"
80
+ expected: "pitā mātāgnirātmā ca guruśca bharatarṣabha"
81
+ - source: "०१२३४५६७८९"
82
+ expected: "0123456789"
83
+
84
+ map:
85
+
86
+ rules:
87
+ - pattern: \u0902(?=[कक़खख़गग़घङ])
88
+ result: ṅ
89
+ - pattern: \u0902(?=[चछजज़झञ])
90
+ result: ñ
91
+ - pattern: \u0902(?=[टट़ठडड़ढढ़ण])
92
+ result: ṇ
93
+ - pattern: \u0902(?=[तथदधन])
94
+ result: n
95
+ - pattern: \u0902(?=[पफबभम])
96
+ result: m
97
+
98
+ - pattern: \u0902(?=[कखगघचछजझतथदधपफबभटठडढ])
99
+ result: "ñ"
100
+
101
+ - pattern: ([क]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
102
+ result: 'k'
103
+ - pattern: ([ख]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
104
+ result: 'kh'
105
+ - pattern: ([ग]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
106
+ result: 'g'
107
+ - pattern: ([घ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
108
+ result: 'gh'
109
+ - pattern: ([ङ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
110
+ result: 'ṅ'
111
+ - pattern: ([च]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
112
+ result: 'c'
113
+ - pattern: ([छ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
114
+ result: 'ch'
115
+ - pattern: ([ज]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
116
+ result: 'j'
117
+ - pattern: ([झ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
118
+ result: 'jh'
119
+ - pattern: ([ञ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
120
+ result: 'ñ'
121
+ - pattern: ([ट]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
122
+ result: 'ṭ'
123
+ - pattern: ([ठ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
124
+ result: 'ṭh'
125
+ - pattern: ([ड]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
126
+ result: 'ḍ'
127
+ - pattern: ([ढ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
128
+ result: 'ḍh'
129
+ - pattern: ([ण]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
130
+ result: 'ṇ'
131
+ - pattern: ([त]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
132
+ result: 't'
133
+ - pattern: ([थ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
134
+ result: 'th'
135
+ - pattern: ([द]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
136
+ result: 'd'
137
+ - pattern: ([ध]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
138
+ result: 'dh'
139
+ - pattern: ([न]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
140
+ result: 'n'
141
+ - pattern: ([प]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
142
+ result: 'p'
143
+ - pattern: ([फ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
144
+ result: 'ph'
145
+ - pattern: ([ब]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
146
+ result: 'b'
147
+ - pattern: ([भ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
148
+ result: 'bh'
149
+ - pattern: ([म]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
150
+ result: 'm'
151
+ - pattern: ([य]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
152
+ result: 'y'
153
+ - pattern: ([र]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
154
+ result: 'r'
155
+ - pattern: ([ल]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
156
+ result: 'l'
157
+ - pattern: ([ळ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
158
+ result: 'ḷ'
159
+ - pattern: ([व]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
160
+ result: 'v'
161
+ - pattern: ([श]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
162
+ result: 'ś'
163
+ - pattern: ([ष]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
164
+ result: 'ṣ'
165
+ - pattern: ([स]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
166
+ result: 's'
167
+ - pattern: ([ह]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
168
+ result: 'h'
169
+
170
+ characters:
171
+
172
+ # I. Vowels and Diphthongs (see Note 1)
173
+
174
+ 'अ': 'a'
175
+ 'आ': 'ā'
176
+ 'इ': 'i'
177
+ 'ई': 'ī'
178
+ 'उ': 'u'
179
+ 'ऊ': 'ū'
180
+ 'ऋ': 'ṛ'
181
+ 'ॠ': 'ṝ'
182
+ 'ऌ': 'ḷ'
183
+ 'ए': 'e'
184
+ 'ऎ': 'ĕ'
185
+ 'ऐ': 'ai'
186
+ 'ओ': 'o'
187
+ 'ऒ': 'ŏ'
188
+ 'औ': 'au'
189
+
190
+
191
+ # II. Consonants (see Note 2)
192
+ # Gutturals
193
+ 'क': 'ka'
194
+ 'ख': 'kha'
195
+ 'ग': 'ga'
196
+ 'घ': 'gha'
197
+ 'ङ': 'ṅa'
198
+
199
+ # Palatals
200
+ 'च': 'ca'
201
+ 'छ': 'cha'
202
+ 'ज': 'ja'
203
+ 'झ': 'jha'
204
+ 'ञ': 'ña'
205
+
206
+ # Cerebrals
207
+ 'ट': 'ṭa'
208
+ 'ठ': 'ṭha'
209
+ 'ड': 'ḍa'
210
+ 'ढ': 'ḍha'
211
+ 'ण': 'ṇa'
212
+
213
+ # Dentals
214
+ 'त': 'ta'
215
+ 'थ': 'tha'
216
+ 'द': 'da'
217
+ 'ध': 'dha'
218
+ 'न': 'na'
219
+
220
+ # Labials
221
+ 'प': 'pa'
222
+ 'फ': 'pha'
223
+ 'ब': 'ba'
224
+ 'भ': 'bha'
225
+ 'म': 'ma'
226
+
227
+ # Semivowels
228
+ 'य': 'ya'
229
+ 'र': 'ra'
230
+ 'ल': 'la'
231
+ 'ळ': 'ḷa'
232
+ 'व': 'va'
233
+
234
+ # Sibilants
235
+ 'श': 'śa'
236
+ 'ष': 'ṣa'
237
+ 'स': 'sa'
238
+
239
+ # Aspirate
240
+ 'ह': 'ha'
241
+
242
+ # Anusvāra
243
+ 'ं': 'ṃ'
244
+
245
+ # Bisarga
246
+ 'ः': 'ḥ'
247
+
248
+ # Anunāsika
249
+ 'ँ': 'ṁ'
250
+
251
+ # Abagraha
252
+ 'ऽ': '’' # (apostrophe)
253
+
254
+ # Medials # Needed for connecting consonants
255
+ 'ा': "ā"
256
+ 'ि': "i"
257
+ 'ी': "ī"
258
+ 'ु': "u"
259
+ 'ू': "ū"
260
+ 'ृ': "ṛ"
261
+ 'ॄ': "ṝ"
262
+ '◌': "ṝ"
263
+ 'ॢ': "ḷ"
264
+ 'ॣ': "ḹ"
265
+ 'े': "e"
266
+ 'ै': "ai"
267
+ 'ो': "o"
268
+ 'ौ': "au"
269
+ 'ॉ': "ô"
270
+ 'ॅ': "ê"
271
+ '‍': ''# Used for joining
272
+
273
+
274
+
275
+ # For consonant Virāma
276
+ # Gutturals
277
+ 'क्': 'k'
278
+ 'ख्': 'kh'
279
+ 'ग्': 'g'
280
+ 'घ्': 'gh'
281
+ 'ङ्': 'ṅ'
282
+
283
+ # Palatals
284
+ 'च्': 'c'
285
+ 'छ्': 'ch'
286
+ 'ज्': 'j'
287
+ 'झ्': 'jh'
288
+ 'ञ्': 'ñ'
289
+
290
+ # Cerebrals
291
+ 'ट्': 'ṭ'
292
+ 'ठ्': 'ṭh'
293
+ 'ड्': 'ḍ'
294
+ 'ढ्': 'ḍh'
295
+ 'ण्': 'ṇ'
296
+
297
+ # Dentals
298
+ 'त्': 't'
299
+ 'थ्': 'th'
300
+ 'द्': 'd'
301
+ 'ध्': 'dh'
302
+ 'न्': 'n'
303
+
304
+ # Labials
305
+ 'प्': 'p'
306
+ 'फ्': 'ph'
307
+ 'ब्': 'b'
308
+ 'भ्': 'bh'
309
+ 'म्': 'm'
310
+
311
+ # Semivowels
312
+ 'य्': 'y'
313
+ 'र्': 'r'
314
+ 'ल्': 'l'
315
+ 'ळ्': 'ḷ'
316
+ 'व्': 'v'
317
+
318
+ # Sibilants
319
+ 'श्': 'ś'
320
+ 'ष्': 'ṣ'
321
+ 'स्': 's'
322
+
323
+ # Aspirate
324
+ 'ह्': 'h'
325
+
326
+ # digits
327
+
328
+ '०': '0'
329
+ '१': '1'
330
+ '२': '2'
331
+ '३': '3'
332
+ '४': '4'
333
+ '५': '5'
334
+ '६': '6'
335
+ '७': '7'
336
+ '८': '8'
337
+ '९': '9'
338
+