interscript 0.1.2 → 0.1.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (261) hide show
  1. checksums.yaml +4 -4
  2. data/README.adoc +250 -17
  3. data/lib/g2pwrapper.py +34 -0
  4. data/lib/interscript.rb +142 -20
  5. data/lib/interscript/command.rb +28 -0
  6. data/lib/interscript/fs.rb +69 -0
  7. data/lib/interscript/mapping.rb +142 -0
  8. data/lib/interscript/opal.rb +57 -0
  9. data/lib/interscript/opal/entrypoint.rb +12 -0
  10. data/lib/interscript/opal/map_translate.rb +7 -0
  11. data/lib/interscript/opal/maps.js.erb +10 -0
  12. data/lib/interscript/version.rb +1 -1
  13. data/lib/model-7 +0 -0
  14. data/lib/tha-pt-b-7 +0 -0
  15. data/maps/acadsin-zho-Hani-Latn-2002.yaml +38916 -0
  16. data/maps/alalc-amh-Ethi-Latn-1997.yaml +513 -0
  17. data/maps/alalc-amh-Ethi-Latn-2011.yaml +138 -0
  18. data/maps/alalc-ara-Arab-Latn-1997.yaml +1287 -0
  19. data/maps/alalc-asm-Deva-Latn-1997.yaml +165 -0
  20. data/maps/alalc-asm-Deva-Latn-2012.yaml +40 -0
  21. data/maps/alalc-aze-Cyrl-Latn-1997.yaml +145 -0
  22. data/maps/alalc-bel-Cyrl-Latn-1997.yaml +129 -0
  23. data/maps/alalc-ben-Beng-Latn-2017.yaml +130 -0
  24. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +98 -0
  25. data/maps/alalc-ell-Grek-Latn-1997.yaml +628 -0
  26. data/maps/alalc-ell-Grek-Latn-2010.yaml +626 -0
  27. data/maps/alalc-guj-Gujr-Latn-1997.yaml +266 -0
  28. data/maps/alalc-guj-Gujr-Latn-2011.yaml +64 -0
  29. data/maps/alalc-hin-Deva-Latn-1997.yaml +211 -0
  30. data/maps/alalc-hin-Deva-Latn-2011.yaml +47 -0
  31. data/maps/alalc-kat-Geok-Latn-1997.yaml +111 -0
  32. data/maps/alalc-kat-Geor-Latn-1997.yaml +150 -0
  33. data/maps/alalc-kor-Hang-Latn-1997.yaml +98 -0
  34. data/maps/alalc-mal-Mlym-Latn-1997.yaml +303 -0
  35. data/maps/alalc-mal-Mlym-Latn-2012.yaml +73 -0
  36. data/maps/alalc-mar-Deva-Latn-1997.yaml +189 -0
  37. data/maps/alalc-mar-Deva-Latn-2011.yaml +45 -0
  38. data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +114 -0
  39. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +103 -0
  40. data/maps/alalc-mon-Cyrl-Latn-1997.yaml +220 -0
  41. data/maps/alalc-pan-Guru-Latn-1997.yaml +256 -0
  42. data/maps/alalc-pan-Guru-Latn-2011.yaml +78 -0
  43. data/maps/alalc-per-Arab-Latn-1997.yaml +375 -0
  44. data/maps/alalc-pli-Deva-Latn-2012.yaml +144 -0
  45. data/maps/alalc-pra-Deva-Latn-2012.yaml +47 -0
  46. data/maps/alalc-rus-Cyrl-Latn-1997.yaml +225 -0
  47. data/maps/alalc-rus-Cyrl-Latn-2012.yaml +162 -0
  48. data/maps/alalc-san-Deva-Latn-2012.yaml +172 -0
  49. data/maps/alalc-sin-Sinh-Latn-1997.yaml +292 -0
  50. data/maps/alalc-sin-Sinh-Latn-2011.yaml +71 -0
  51. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +118 -0
  52. data/maps/alalc-srp-Cyrl-Latn-2013.yaml +135 -0
  53. data/maps/alalc-tam-Taml-Latn-1997.yaml +62 -0
  54. data/maps/alalc-tam-Taml-Latn-2011.yaml +58 -0
  55. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +145 -0
  56. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +16 -0
  57. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +283 -0
  58. data/maps/{bas-rus-Cyrl-Latn-bss.yaml → bas-rus-Cyrl-Latn-2017-bss.yaml} +58 -33
  59. data/maps/{bas-rus-Cyrl-Latn-oss.yaml → bas-rus-Cyrl-Latn-2017-oss.yaml} +55 -35
  60. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +292 -0
  61. data/maps/bgn-kor-Hang-Latn-1943.yaml +35 -0
  62. data/maps/bgn-kor-Kore-Latn-1943.yaml +31 -0
  63. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +208 -0
  64. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +208 -0
  65. data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +532 -0
  66. data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +596 -0
  67. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +2 -3
  68. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +104 -0
  69. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +188 -0
  70. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +289 -0
  71. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +119 -0
  72. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +15 -65
  73. data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +184 -0
  74. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +705 -0
  75. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +23 -0
  76. data/maps/{bgnpcgn-per-Arab-Latn-1956.yaml → bgnpcgn-fas-Arab-Latn-1956.yaml} +5 -2
  77. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +257 -0
  78. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +131 -0
  79. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +42 -0
  80. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +253 -0
  81. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +48 -0
  82. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +48 -0
  83. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +163 -0
  84. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +190 -0
  85. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +223 -0
  86. data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +230 -0
  87. data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +336 -0
  88. data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +639 -0
  89. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +459 -0
  90. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +168 -0
  91. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +150 -65
  92. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +170 -0
  93. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +220 -0
  94. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +240 -0
  95. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +80 -4
  96. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +119 -0
  97. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +127 -0
  98. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +82 -0
  99. data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +7456 -0
  100. data/maps/bis-asm-Beng-Latn-13194-1991.yaml +159 -0
  101. data/maps/bis-ben-Beng-Latn-13194-1991.yaml +156 -0
  102. data/maps/bis-dev-Deva-Latn-13194-1991.yaml +184 -0
  103. data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +181 -0
  104. data/maps/bis-knd-Knda-Latn-13194-1991.yaml +173 -0
  105. data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +176 -0
  106. data/maps/bis-ori-Orya-Latn-13194-1991.yaml +160 -0
  107. data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +175 -0
  108. data/maps/bis-tel-Telu-Latn-13194-1991.yaml +170 -0
  109. data/maps/bis-tml-Taml-Latn-13194-1991.yaml +155 -0
  110. data/maps/by-bel-Cyrl-Latn-1998.yaml +172 -0
  111. data/maps/by-bel-Cyrl-Latn-2007.yaml +115 -0
  112. data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +899 -0
  113. data/maps/din-hin-Deva-Latn-33904-2018.yaml +100 -0
  114. data/maps/din-kat-Geor-Latn-32707-2010.yaml +145 -0
  115. data/maps/din-mar-Deva-Latn-33904-2018.yaml +84 -0
  116. data/maps/din-nep-Deva-Latn-33904-2018.yaml +119 -0
  117. data/maps/din-pli-Deva-Latn-33904-2018.yaml +75 -0
  118. data/maps/din-pra-Deva-Latn-33904-2018.yaml +63 -0
  119. data/maps/din-san-Deva-Latn-33904-2018.yaml +338 -0
  120. data/maps/din-tam-Taml-Latn-33903-2016.yaml +213 -0
  121. data/maps/dos-nep-Deva-Latn-1997.yaml +47 -0
  122. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +684 -0
  123. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +680 -0
  124. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +19 -0
  125. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +31 -0
  126. data/maps/ggg-kat-Geor-Latn-2002.yaml +92 -0
  127. data/maps/gki-bel-Cyrl-Latn-1992.yaml +33 -0
  128. data/maps/gki-bel-Cyrl-Latn-2000.yaml +201 -0
  129. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +190 -0
  130. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +157 -0
  131. data/maps/hk-yue-Hani-Latn-1888.yaml +38497 -0
  132. data/maps/icao-bel-Cyrl-Latn-9303.yaml +109 -98
  133. data/maps/icao-bul-Cyrl-Latn-9303.yaml +2 -7
  134. data/maps/{icao-per-Arab-Latn-9303.yaml → icao-fas-Arab-Latn-9303.yaml} +6 -8
  135. data/maps/icao-heb-Hebr-Latn-9303.yaml +119 -125
  136. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +2 -3
  137. data/maps/icao-rus-Cyrl-Latn-9303.yaml +2 -4
  138. data/maps/icao-srp-Cyrl-Latn-9303.yaml +2 -3
  139. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +2 -4
  140. data/maps/iso-ara-Arab-Latn-233-1984.yaml +323 -0
  141. data/maps/iso-asm-Beng-Latn-15919-2001.yaml +75 -0
  142. data/maps/iso-ben-Beng-Latn-15919-2001.yaml +175 -0
  143. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +613 -0
  144. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +44 -0
  145. data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +220 -0
  146. data/maps/iso-hin-Deva-Latn-15919-2001.yaml +87 -0
  147. data/maps/iso-inc-Deva-Latn-15919-2001.yaml +61 -0
  148. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +66 -0
  149. data/maps/iso-kan-Knda-Latn-15919-2001.yaml +220 -0
  150. data/maps/iso-kat-Geor-Latn-9984-1996.yaml +145 -0
  151. data/maps/iso-kor-Hang-Latn-1996-method1.yaml +240 -0
  152. data/maps/iso-kor-Hang-Latn-1996-method2.yaml +226 -0
  153. data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +281 -0
  154. data/maps/iso-mar-Deva-Latn-15919-2001.yaml +75 -0
  155. data/maps/iso-nep-Deva-Latn-15919-2001.yaml +87 -0
  156. data/maps/iso-ori-Orya-Latn-15919-2001.yaml +193 -0
  157. data/maps/iso-pan-Guru-Latn-15919-2001.yaml +222 -0
  158. data/maps/iso-pli-Beng-Latn-15919-2001.yaml +73 -0
  159. data/maps/iso-pli-Deva-Latn-15919-2001.yaml +74 -0
  160. data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +219 -0
  161. data/maps/iso-pli-Thai-Latn-15919-2001.yaml +55 -0
  162. data/maps/iso-pra-Deva-Latn-15919-2001.yaml +59 -0
  163. data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +366 -0
  164. data/maps/{iso-rus-Cyrl-Latn-iso9.yaml → iso-rus-Cyrl-Latn-9-1995.yaml} +4 -6
  165. data/maps/iso-san-Deva-Latn-15919-2001.yaml +220 -0
  166. data/maps/iso-tam-Taml-Latn-15919-2001.yaml +159 -0
  167. data/maps/iso-tel-Telu-Latn-15919-2001.yaml +220 -0
  168. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +109 -0
  169. data/maps/kp-kor-Hang-Latn-2002.yaml +909 -0
  170. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +44820 -0
  171. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +411 -0
  172. data/maps/mns-mon-Cyrl-Latn-5217-2012.yaml +163 -0
  173. data/maps/mns-mon-Latn-Cyrl-5217-2012.yaml +200 -0
  174. data/maps/moct-kor-Hang-Latn-2000.yaml +807 -0
  175. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +541 -0
  176. data/maps/mvd-bel-Cyrl-Latn-2008.yaml +225 -0
  177. data/maps/mvd-bel-Cyrl-Latn-2010.yaml +63 -0
  178. data/maps/mvd-rus-Cyrl-Latn-2008.yaml +109 -0
  179. data/maps/mvd-rus-Cyrl-Latn-2010.yaml +37 -0
  180. data/maps/odni-ara-Arab-Latn-2015.yaml +425 -0
  181. data/maps/odni-aze-Cyrl-Latn-2015.yaml +144 -0
  182. data/maps/odni-bel-Cyrl-Latn-2015.yaml +148 -0
  183. data/maps/odni-bul-Cyrl-Latn-2015.yaml +96 -0
  184. data/maps/odni-che-Cyrl-Latn-2015.yaml +169 -0
  185. data/maps/odni-fas-Arab-Latn-2015.yaml +406 -0
  186. data/maps/odni-hin-Deva-Latn-2015.yaml +258 -0
  187. data/maps/odni-kat-Geor-Latn-2015.yaml +87 -0
  188. data/maps/odni-kaz-Cyrl-Latn-2015.yaml +148 -0
  189. data/maps/odni-kir-Cyrl-Latn-2015.yaml +136 -0
  190. data/maps/odni-kor-Hang-Latn-2015.yaml +375 -0
  191. data/maps/odni-mkd-Cyrl-Latn-2015.yaml +122 -0
  192. data/maps/odni-per-Arab-Latn-2015.yaml +228 -0
  193. data/maps/odni-rus-Cyrl-Latn-2015.yaml +77 -0
  194. data/maps/odni-srp-Cyrl-Latn-2015.yaml +129 -0
  195. data/maps/odni-tat-Cyrl-Latn-2015.yaml +142 -0
  196. data/maps/odni-tgk-Cyrl-Latn-2015.yaml +148 -0
  197. data/maps/odni-uig-Cyrl-Latn-2015.yaml +138 -0
  198. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +157 -0
  199. data/maps/odni-urd-Arab-Latn-2015.yaml +221 -0
  200. data/maps/odni-uzb-Cyrl-Latn-2015.yaml +166 -0
  201. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +90 -0
  202. data/maps/royin-tha-Thai-Latn-1968.yaml +183 -0
  203. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +180 -0
  204. data/maps/royin-tha-Thai-Latn-1999.yaml +80 -0
  205. data/maps/{cn-chn-Hans-Latn-pinyin.yaml → sac-zho-Hans-Latn-1979.yaml} +11 -8
  206. data/maps/sasm-mon-Mong-Latn-general-1978.yaml +389 -0
  207. data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +354 -0
  208. data/maps/ses-ara-Arab-Latn-1930.yaml +283 -0
  209. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +222 -0
  210. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +197 -0
  211. data/maps/ua-ukr-Cyrl-Latn-2007.yaml +75 -0
  212. data/maps/ua-ukr-Cyrl-Latn-2010.yaml +192 -0
  213. data/maps/un-amh-Ethi-Latn-2016.yaml +602 -0
  214. data/maps/un-ara-Arab-Latn-1971.yaml +139 -0
  215. data/maps/un-ara-Arab-Latn-1972.yaml +159 -0
  216. data/maps/un-ara-Arab-Latn-2017.yaml +420 -0
  217. data/maps/un-bel-Cyrl-Latn-2007.yaml +114 -0
  218. data/maps/un-ben-Beng-Latn-2016.yaml +534 -0
  219. data/maps/un-ell-Grek-Latn-1987-phonetic.yaml +780 -0
  220. data/maps/un-ell-Grek-Latn-1987-tl.yaml +31 -0
  221. data/maps/un-ell-Grek-Latn-1987-ts.yaml +19 -0
  222. data/maps/un-hin-Deva-Latn-2016.yaml +222 -0
  223. data/maps/un-mar-Deva-Latn-2016.yaml +91 -0
  224. data/maps/un-mon-Mong-Latn-general-2013.yaml +264 -0
  225. data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +264 -0
  226. data/maps/un-nep-Deva-Latn-1972.yaml +350 -0
  227. data/maps/un-nep-Deva-Latn-2013.yaml +74 -0
  228. data/maps/un-rus-Cyrl-Latn-1987.yaml +166 -0
  229. data/maps/un-ukr-Cyrl-Latn-1998.yaml +53 -0
  230. data/maps/un-ukr-Cyrl-Latn-2012.yaml +162 -0
  231. data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +221 -0
  232. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +406 -0
  233. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +386 -0
  234. data/maps/var-kor-Hang-Hang-jamo.yaml +11193 -0
  235. data/maps/var-kor-Hang-Latn-mr-1939.yaml +1054 -0
  236. data/maps/var-kor-Kore-Hang-2013.yaml +59754 -0
  237. data/maps/var-kor-Kore-Latn-mr-1939.yaml +36 -0
  238. data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +43 -0
  239. data/maps/var-mon-Mong-Latn-1930.yaml +102 -0
  240. data/maps/var-mon-Mong-Latn-lessing.yaml +272 -0
  241. data/maps/var-mon-Mong-Latn-vpmc.yaml +274 -0
  242. data/maps/var-pra-Deva-Latn-iast-1912.yaml +30 -0
  243. data/maps/var-san-Deva-Latn-iast-1912.yaml +149 -0
  244. data/maps/var-tha-Thai-Thai-phonemic.yaml +59 -0
  245. data/maps/var-tha-Thai-Zsym-ipa.yaml +301 -0
  246. data/maps/var-zho-Hani-Latn-wd-1979.yaml +38912 -0
  247. data/spec/interscript/filenames_spec.rb +384 -0
  248. data/spec/interscript/mapping_spec.rb +42 -0
  249. data/spec/interscript_spec.rb +23 -5
  250. data/spec/spec_helper.rb +3 -1
  251. metadata +364 -34
  252. data/bin/interscript +0 -20
  253. data/bin/rspec +0 -29
  254. data/maps/bgnpcgn-chn-Hans-Latn-pinyin.yaml +0 -7503
  255. data/maps/historic-jpn-Hrkt-Latn-hepburn.yaml +0 -336
  256. data/maps/icao-gre-Grek-Latn-9303.yaml +0 -101
  257. data/maps/mext-jpn-Hrkt-Latn-hepburn.yaml +0 -330
  258. data/maps/mext-jpn-Hrkt-Latn-kunrei.yaml +0 -308
  259. data/maps/un-jpn-Hrkt-Latn-hepburn.yaml +0 -313
  260. data/maps/un-jpn-Hrkt-Latn-kunrei.yaml +0 -354
  261. data/maps/un-mon-Mong-Latn-2013.yaml +0 -80
@@ -0,0 +1,100 @@
1
+ ---
2
+ authority_id: din
3
+ id: 33904-2018
4
+ language: iso-639-2:hin
5
+ source_script: Deva
6
+ destination_script: Latn
7
+ name: "DIN 33904:2018-10 Information and documentation - Romanization Devanagari, Hindi"
8
+ url: https://www.beuth.de/en/standard/din-33904/293049024
9
+ creation_date: 2018
10
+ description: |
11
+ Hindi system.
12
+
13
+ This standard specifies a fixed transliteration of the Devanāgarī characters into Latin letters for all languages written in that script.
14
+ It is suitable for any application.
15
+
16
+ notes:
17
+ - |
18
+ Vowels:
19
+ The Ardhacandra ॅ is often used to denote English vowels:
20
+ EXAMPLE
21
+ बॅट bêṭa (bat)
22
+ डॉक्टर ḍôkṭara (doctor)
23
+ - |
24
+ Consonants:
25
+
26
+ Since the Devanāgarī script is a syllabic script, an -a is inherent in each consonant.
27
+ It is always written in transliteration, including in the final position.
28
+ EXAMPLE 1
29
+ पुस्तक pustaka
30
+
31
+ A line under the consonant, the so-called Virāma, means in the Devanāgarī script that the inherent -a does not apply.
32
+ EXAMPLE 2
33
+ वाक् vāk
34
+
35
+ The anusvāra is always represented with -ṃ-.
36
+ EXAMPLE 3
37
+ संस्करण saṃskaraṇa
38
+
39
+ Before k, kh, g, gh, c, ch, j, jh, ṭ, ṭh, ḍ, ḍh, t, th, d, dh, p, ph, b, bh, the anusvāra is transformed into the corresponding class nasal.
40
+ EXAMPLE 4
41
+ कंघी kaṃghī becomes kaṅghī
42
+ पंजाबी paṃjābī becomes pañjābī
43
+ पंडित paṃḍita becomes paṇḍita
44
+ संधी saṃdhī becomes sandhī
45
+ दिसंबर disaṃbara becomes disambara
46
+
47
+ Anunāsika or Candrabindu signals the nasalization of vowels
48
+
49
+ EXAMPLE 5
50
+ माँ māṁ
51
+
52
+ tests:
53
+ - source: "गंभीर मरीजों के मामले में भारत दूसरे नंबर पर"
54
+ expected: "gambhīra marījoṃ ke māmale meṃ bhārata dūsare nambara para"
55
+ - source: "कोरोना अपडेट्स"
56
+ expected: "koronā apaḍeṭsa"
57
+ - source: "सीडीसी चीफ का बयान अहम"
58
+ expected: "sīḍīsī cīpha kā bayāna ahama"
59
+ - source: "गूगल प्ले स्टोर पर पेटीएम की वापसी"
60
+ expected: "gūgala ple sṭora para peṭīema kī vāpasī"
61
+ - source: "भारत में गैंबलिंग की इजाजत नहीं"
62
+ expected: "bhārata meṃ gaimbaliṅga kī ijājata nahīṃ"
63
+ - source: "कोरोना वैक्सीन मुद्दे पर घिरे राष्ट्रपति; जो बाइडेन बोले- मुझे और देश को वैज्ञानिकों पर भरोसा है, डोनाल्ड ट्रम्प पर नहीं"
64
+ expected: "koronā vaiksīna mudde para ghire rāṣṭrapati; jo bāiḍena bole- mujhe aura deśa ko vaijñānikoṃ para bharosā hai, ḍonālḍa ṭrampa para nahīṃ"
65
+ - source: "गूगल की कार्रवाई पर पेटीएम ने कहा था कि ऐप को अस्थायी तौर पर प्ले-स्टोर से हटाया गया है, आपके पैसे सुरक्षित हैं"
66
+ expected: "gūgala kī kārravāī para peṭīema ne kahā thā ki aipa ko asthāyī taura para ple-sṭora se haṭāyā gayā hai, āpake paise surakṣita haiṃ"
67
+ - source: "०१९८"
68
+ expected: "0198"
69
+
70
+
71
+ map:
72
+
73
+ inherit: din-san-Deva-Latn-33904-2018
74
+
75
+ characters:
76
+
77
+ 'ॲ': 'ê'
78
+ 'ऑ': 'ô'
79
+
80
+ # Dotted variants
81
+ 'क़': 'ḵa'
82
+ 'ख़': 'ḵha'
83
+ 'ग़': 'g̲a' # \u0067 + \u0332
84
+ 'ज़': 'j̲a' # \u006a + \u0332
85
+ 'ड़': 'ṙa'
86
+ 'ढ़': 'ṙha'
87
+ 'फ़': 'p̲ha' # \u0070 + \u0332
88
+ 'स़': 's̲a' # \u0073 + \u0332
89
+ 'ह़': 'h̲a' # \u0068 + \u0332
90
+
91
+ # Dotted variants Virāma
92
+ 'क़्': 'ḵ'
93
+ 'ख़्': 'ḵh'
94
+ 'ग़्': 'g̲' # \u0067 + \u0332
95
+ 'ज़्': 'j̲' # \u006a + \u0332
96
+ 'ड़्': 'ṙ'
97
+ 'ढ़्': 'ṙh'
98
+ 'फ़्': 'p̲h' # \u0070 + \u0332
99
+ 'स़्': 's̲' # \u0073 + \u0332
100
+ 'ह़्': 'h̲' # \u0068 + \u0332
@@ -0,0 +1,145 @@
1
+ ---
2
+ authority_id: din
3
+ id: 32707-2010
4
+ language: iso-639-2:kat
5
+ source_script: Geor
6
+ destination_script: Latn
7
+ name: "DIN 32707:2010-01 Information und Dokumentation - Umschrift des georgischen Alphabets"
8
+ url: https://www.beuth.de/de/norm/din-32707/122821999
9
+ creation_date: 2010
10
+ confirmation_date: 2010
11
+ description: |
12
+ Information and documentation - Romanization of the Georgian alphabet.
13
+
14
+ notes:
15
+
16
+ tests:
17
+
18
+ - source: ხაოფსე
19
+ expected: xaop̕se
20
+
21
+ - source: ჭლოუ
22
+ expected: člou
23
+
24
+ - source: ჩოხულდი
25
+ expected: č̕oxuldi
26
+
27
+ - source: ქვემო ლინდა
28
+ expected: k̕vemo linda
29
+
30
+ - source: ტამკვაჩ იგვავერა
31
+ expected: tamkvač̕ igvavera
32
+
33
+ - source: სვანეთი
34
+ expected: svanet̕i
35
+
36
+ - source: საცხვარისი
37
+ expected: sac̕xvarisi
38
+
39
+ - source: მუხრან-თელეთი
40
+ expected: muxran-t̕elet̕i
41
+
42
+ - source: მუცდი
43
+ expected: muc̕di
44
+
45
+ - source: ლეჩხუმი
46
+ expected: leč̕xumi
47
+
48
+ - source: ვერხნაია მწარა
49
+ expected: verxnaia mcara
50
+
51
+ - source: ეგრისის ქედი
52
+ expected: egrisis k̕edi
53
+
54
+ - source: დოჩარიფშა
55
+ expected: doč̕arip̕ša
56
+
57
+ - source: ბოლოკო
58
+ expected: boloko
59
+
60
+ - source: აჭანდარა
61
+ expected: ačandara
62
+
63
+ - source: აუალიცა
64
+ expected: aualic̕a
65
+
66
+ - source: აკალამრა
67
+ expected: akalamra
68
+
69
+ - source: ლასილი
70
+ expected: lasili
71
+
72
+ - source: გუბაზეული
73
+ expected: gubazeuli
74
+
75
+ - source: ბაყაყი
76
+ expected: baqaqi
77
+
78
+ - source: ძროხა
79
+ expected: jroxa
80
+
81
+ - source: ჰაერი
82
+ expected: haeri
83
+
84
+ - source: ჟოლო
85
+ expected: žolo
86
+
87
+ - source: ჯართი
88
+ expected: ǰart̕i
89
+
90
+ - source: ღრმაღელე
91
+ expected: ġrmaġele
92
+
93
+ map:
94
+ characters:
95
+ '\u10d0' : 'a' # ა
96
+ '\u10d1' : 'b' # ბ
97
+ '\u10d2' : 'g' # გ
98
+ '\u10d3' : 'd' # დ
99
+ '\u10d4' : 'e' # ე
100
+ '\u10d5' : 'v' # ვ
101
+ '\u10d6' : 'z' # ზ
102
+
103
+ '\u10f1' : 'ê' # ჱ
104
+
105
+ '\u10d7' : 't̕' # თ
106
+ '\u10d8' : 'i' # ი
107
+ '\u10d9' : 'k' # კ
108
+ '\u10da' : 'l' # ლ
109
+ '\u10db' : 'm' # მ
110
+ '\u10dc' : 'n' # ნ
111
+
112
+ '\u10f2' : 'y' # ჲ
113
+
114
+ '\u10dd' : 'o' # ო
115
+ '\u10de' : 'p' # პ
116
+ '\u10df' : 'ž' # ჟ
117
+ '\u10e0' : 'r' # რ
118
+ '\u10e1' : 's' # ს
119
+ '\u10e2' : 't' # ტ
120
+
121
+ '\u10f3' : 'w' # ჳ
122
+
123
+ '\u10e3' : 'u' # უ
124
+ '\u10e4' : 'p̕' # ფ
125
+ '\u10e5' : 'k̕' # ქ
126
+ '\u10e6' : 'ġ' # ღ
127
+ '\u10e7' : 'q' # ყ
128
+ '\u10e8' : 'š' # შ
129
+ '\u10e9' : 'č̕' # ჩ
130
+ '\u10ea' : 'c̕' # ც
131
+ '\u10eb' : 'j' # ძ
132
+ '\u10ec' : 'c' # წ
133
+ '\u10ed' : 'č' # ჭ
134
+ '\u10ee' : 'x' # ხ
135
+
136
+ '\u10f4' : 'q̕' # ჴ
137
+
138
+ '\u10ef' : 'ǰ' # ჯ
139
+ '\u10f0' : 'h' # ჰ
140
+
141
+ '\u10f5' : 'ô' # ჵ
142
+
143
+ '\u10f6' : 'f' # ჶ
144
+ '\u10f7' : 'ẹ' # ჷ
145
+ '\u10f8' : 'ʼ' # ჸ
@@ -0,0 +1,84 @@
1
+ ---
2
+ authority_id: din
3
+ id: 33904-2018
4
+ language: iso-639-2:mar
5
+ source_script: Deva
6
+ destination_script: Latn
7
+ name: "DIN 33904:2018-10 Information and documentation - Romanization Devanagari, Marathi"
8
+ url: https://www.beuth.de/en/standard/din-33904/293049024
9
+ creation_date: 2018
10
+ description: |
11
+ Marathi system.
12
+
13
+ Information und Dokumentation - Transliteration Devanagari
14
+
15
+ This standard specifies a fixed transliteration of the Devanāgarī characters into Latin letters for all languages written in that script.
16
+ It is suitable for any application.
17
+
18
+ notes:
19
+ - |
20
+ Vowels:
21
+ The Ardhacandra ॅ is often used to denote English vowels:
22
+ EXAMPLE
23
+ बॅट bêṭa (bat)
24
+ डॉक्टर ḍôkṭara (doctor)
25
+ - |
26
+ Consonants:
27
+
28
+ Since the Devanāgarī script is a syllabic script, an -a is inherent in each consonant.
29
+ It is always written in transliteration, including in the final position.
30
+ EXAMPLE 1
31
+ पुस्तक pustaka
32
+
33
+ A line under the consonant, the so-called Virāma, means in the Devanāgarī script that the inherent -a does not apply.
34
+ EXAMPLE 2
35
+ वाक् vāk
36
+
37
+ The anusvāra is always represented with -ṃ-.
38
+ EXAMPLE 3
39
+ संस्करण saṃskaraṇa
40
+
41
+ Before k, kh, g, gh, c, ch, j, jh, ṭ, ṭh, ḍ, ḍh, t, th, d, dh, p, ph, b, bh, the anusvāra is transformed into the corresponding class nasal.
42
+ EXAMPLE 4
43
+ कंघी kaṃghī becomes kaṅghī
44
+ पंजाबी paṃjābī becomes pañjābī
45
+ पंडित paṃḍita becomes paṇḍita
46
+ संधी saṃdhī becomes sandhī
47
+ दिसंबर disaṃbara becomes disambara
48
+
49
+ Anunāsika or Candrabindu signals the nasalization of vowels
50
+
51
+ EXAMPLE 5
52
+ माँ māṁ
53
+
54
+ tests:
55
+ - source: "ठाणे - जिल्ह्यात बुधवारी एक हजार रुग्णांची वाढ, तर जणांच्या मृत्यूची नोंद"
56
+ expected: "ṭhāṇe - jilhyāta budhavārī eka hajāra rugṇāñcī vāḍha, tara jaṇāñcyā mṛtyūcī nonda"
57
+ - source: "एकता कपूर पुन्हा अडकली वादात, वेबसीरिजमधल्या 'त्या' सीनमुळे जमावाची घरावर दगडफेक"
58
+ expected: "ekatā kapūra punhā aḍakalī vādāta, vebasīrijamadhalyā 'tyā' sīnamuḷe jamāvācī gharāvara dagaḍapheka"
59
+ - source: "जाणून घ्या, बीएमसीच्या अधिकाऱ्यांनी कंगना राणौतच्या ऑफिसमधले नक्की काय- काय तोडलं"
60
+ expected: "jāṇūna ghyā, bīemasīcyā adhikāऱ्yānnī kaṅganā rāṇautacyā ôphisamadhale nakkī kāya- kāya toḍalaṃ"
61
+ - source: "कंगना मुंबईत दाखल होण्यापूर्वी 'मातोश्री'वरून फर्मान सुटले; प्रवक्त्यांना सक्त आदेश"
62
+ expected: "kaṅganā mumbaīta dākhala hoṇyāpūrvī 'mātośrī'varūna pharmāna suṭale; pravaktyānnā sakta ādeśa"
63
+ - source: "मराठा आरक्षणास तात्पुरती स्थगिती; सर्वोच्च न्यायालयाचा निर्णय"
64
+ expected: "marāṭhā ārakṣaṇāsa tātpuratī sthagitī; sarvocca nyāyālayācā nirṇaya"
65
+ - source: "भारताच्या तिन्ही लशींचा पहिला टप्पा यशस्वी, वाचा कधी येणार बाजारात"
66
+ expected: "bhāratācyā tinhī laśīñcā pahilā ṭappā yaśasvī, vācā kadhī yeṇāra bājārāta"
67
+ - source: "रुग्णवाढीमुळे खाटांची चणचण"
68
+ expected: "rugṇavāḍhīmuḷe khāṭāñcī caṇacaṇa"
69
+ - source: "पीएम स्वनिधी कर्ज योजनेला मुंबईतून अल्प प्रतिसाद"
70
+ expected: "pīema svanidhī karja yojanelā mumbaītūna alpa pratisāda"
71
+ - source: "सांताक्रूझ-चेंबूर लिंक रोडवरील उन्नत मार्गाला स्थगिती"
72
+ expected: "sāntākrūjha-cembūra liṅka roḍavarīla unnata mārgālā sthagitī"
73
+ - source: "संपादक अर्णब गोस्वामी यांच्याविरूद्ध खडक पोलिस ठाण्यात तक्रार"
74
+ expected: "sampādaka arṇaba gosvāmī yāñcyāvirūddha khaḍaka polisa ṭhāṇyāta takrāra"
75
+
76
+
77
+ map:
78
+
79
+ inherit: 'din-san-Deva-Latn-33904-2018'
80
+
81
+ characters:
82
+
83
+ 'ॲ': 'ê'
84
+ 'ऑ': 'ô'
@@ -0,0 +1,119 @@
1
+ ---
2
+ authority_id: din
3
+ id: 33904-2018
4
+ language: iso-639-2:nep
5
+ source_script: Deva
6
+ destination_script: Latn
7
+ name: "DIN 33904:2018-10 Information and documentation - Romanization Devanagari, Nepali"
8
+ url: https://www.beuth.de/en/standard/din-33904/293049024
9
+ creation_date: 2018
10
+ description: |
11
+ Nepali system.
12
+
13
+ This standard specifies a fixed transliteration of the Devanāgarī characters into Latin letters for all languages written in that script.
14
+ It is suitable for any application.
15
+
16
+ notes:
17
+ - |
18
+ Vowels:
19
+ The Ardhacandra ॅ is often used to denote English vowels:
20
+ EXAMPLE
21
+ बॅट bêṭa (bat)
22
+ डॉक्टर ḍôkṭara (doctor)
23
+ - |
24
+ Consonants:
25
+
26
+ Since the Devanāgarī script is a syllabic script, an -a is inherent in each consonant.
27
+ It is always written in transliteration, including in the final position.
28
+ EXAMPLE 1
29
+ पुस्तक pustaka
30
+
31
+ A line under the consonant, the so-called Virāma, means in the Devanāgarī script that the inherent -a does not apply.
32
+ EXAMPLE 2
33
+ वाक् vāk
34
+
35
+ The anusvāra is always represented with -ṃ-.
36
+ EXAMPLE 3
37
+ संस्करण saṃskaraṇa
38
+
39
+ Before k, kh, g, gh, c, ch, j, jh, ṭ, ṭh, ḍ, ḍh, t, th, d, dh, p, ph, b, bh, the anusvāra is transformed into the corresponding class nasal.
40
+ EXAMPLE 4
41
+ कंघी kaṃghī becomes kaṅghī
42
+ पंजाबी paṃjābī becomes pañjābī
43
+ पंडित paṃḍita becomes paṇḍita
44
+ संधी saṃdhī becomes sandhī
45
+ दिसंबर disaṃbara becomes disambara
46
+
47
+ Anunāsika or Candrabindu signals the nasalization of vowels
48
+
49
+ EXAMPLE 5
50
+ माँ māṁ
51
+
52
+ tests:
53
+ - source: "लेखन"
54
+ expected: "lekhana"
55
+ - source: "मुद्रा"
56
+ expected: "mudrā"
57
+ - source: "प्रशंसा"
58
+ expected: "praśaṃsā"
59
+ - source: "अंक"
60
+ expected: "aṅka"
61
+ - source: "नेकपाले स्थगित स्थायी कमिटीको बैठक भदौ गते बोलाउने भएको"
62
+ expected: "nekapāle sthagita sthāyī kamiṭīko baiṭhaka bhadau gate bolāune bhaeko"
63
+ - source: "न घर रह्यो, न परिवार"
64
+ expected: "na ghara rahyo, na parivāra"
65
+ - source: "ढोरपाटनमा भुजीखोला बाढीपहिरोले अभिभावक गुमाएका बालबालिकाको बिचल्ली"
66
+ expected: "ḍhorapāṭanamā bhujīkholā bāḍhīpahirole abhibhāvaka gumāekā bālabālikāko bicallī"
67
+ - source: "सुस्मिताका काका हेमबहादुर र काकीलाई पनि पहिरोले बगायो"
68
+ expected: "susmitākā kākā hemabahādura ra kākīlāī pani pahirole bagāyo"
69
+ - source: "संविधान जारी भएसँगै सार्वजनिक प्रशासनमा नयाँ उत्साह आउने अपेक्षा थियो"
70
+ expected: "saṃvidhāna jārī bhaesaṁgai sārvajanika praśāsanamā nayāṁ utsāha āune apekṣā thiyo"
71
+ - source: "देशमा कोरोना संक्रमित र मृतकको संख्या हरेक दिन बढ्दो छ"
72
+ expected: "deśamā koronā saṅkramita ra mṛtakako saṅkhyā hareka dina baḍhdo cha"
73
+ - source: "गाउँपालिकाका अध्यक्ष टिका गुरुङका अनुसार विष्णुदासलाई राजुले सुत्नका लागि बेलुका साथी लगेका थिए"
74
+ expected: "gāuṁpālikākā adhyakṣa ṭikā guruṅakā anusāra viṣṇudāsalāī rājule sutnakā lāgi belukā sāthī lagekā thie"
75
+ - source: "यो आयोजना गाउँपालिकाको केन्द्र तेल्लोकमा पर्छ"
76
+ expected: "yo āyojanā gāuṁpālikāko kendra tellokamā parcha"
77
+ - source: "सुस्मिताका काका हेमबहादुर र काकीलाई पनि पहिरोले बगायो"
78
+ expected: "susmitākā kākā hemabahādura ra kākīlāī pani pahirole bagāyo"
79
+ - source: "चैत पहिलो साता घर आएका उनी लकडाउन भएपछि यतै रोकिए"
80
+ expected: "caita pahilo sātā ghara āekā unī lakaḍāuna bhaepachi yatai rokie"
81
+ - source: "काम गर्न जानेको हकमा रोजगारदाता कम्पनीको पत्रसँगै वडा र जिल्ला प्रशासनको सिफारिस अनिवार्य गरिएको छ"
82
+ expected: "kāma garna jāneko hakamā rojagāradātā kampanīko patrasaṁgai vaḍā ra jillā praśāsanako siphārisa anivārya garieko cha"
83
+ - source: "दुःख"
84
+ expected: "duḥkha"
85
+
86
+
87
+ map:
88
+
89
+ inherit: 'din-san-Deva-Latn-33904-2018'
90
+
91
+ characters:
92
+
93
+ 'ॲ': 'ê'
94
+ 'ऑ': 'ô'
95
+
96
+ # Dotted variants
97
+ 'क़': 'ḵa'
98
+ 'ख़': 'ḵha'
99
+ 'ग़': 'g̲a' # \u0067 + \u0332
100
+ 'ज़': 'j̲a' # \u006a + \u0332
101
+ 'ड़': 'ṙa'
102
+ 'ढ़': 'ṙha'
103
+ 'फ़': 'p̲ha' # \u0070 + \u0332
104
+ 'स़': 's̲a' # \u0073 + \u0332
105
+ 'ह़': 'h̲a' # \u0068 + \u0332
106
+ 'व़': 'v̲a' # \u0076 + \u0332
107
+
108
+ # Dotted variants Virāma
109
+ 'क़्': 'ḵ'
110
+ 'ख़्': 'ḵh'
111
+ 'ग़्': 'g̲' # \u0067 + \u0332
112
+ 'ज़्': 'j̲' # \u006a + \u0332
113
+ 'ड़्': 'ṙ'
114
+ 'ढ़्': 'ṙh'
115
+ 'फ़्': 'p̲h' # \u0070 + \u0332
116
+ 'स़्': 's̲' # \u0073 + \u0332
117
+ 'ह़्': 'h̲' # \u0068 + \u0332
118
+
119
+