interscript 0.1.6 → 0.1.7

Sign up to get free protection for your applications and to get access to all the features.
Files changed (251) hide show
  1. checksums.yaml +4 -4
  2. data/lib/interscript.rb +10 -6
  3. data/lib/interscript/fs.rb +0 -2
  4. data/lib/interscript/mapping.rb +1 -1
  5. data/lib/interscript/opal.rb +38 -8
  6. data/lib/interscript/opal/entrypoint.rb +12 -0
  7. data/lib/interscript/opal/map_translate.rb +7 -0
  8. data/lib/interscript/version.rb +1 -1
  9. data/maps/acadsin-zho-Hani-Latn-2002.yaml +5 -1
  10. data/maps/alalc-amh-Ethi-Latn-1997.yaml +5 -1
  11. data/maps/alalc-amh-Ethi-Latn-2011.yaml +1 -1
  12. data/maps/alalc-ara-Arab-Latn-1997.yaml +5 -1
  13. data/maps/alalc-asm-Deva-Latn-1997.yaml +9 -3
  14. data/maps/alalc-asm-Deva-Latn-2012.yaml +40 -0
  15. data/maps/alalc-aze-Cyrl-Latn-1997.yaml +5 -1
  16. data/maps/alalc-bel-Cyrl-Latn-1997.yaml +5 -1
  17. data/maps/alalc-ben-Beng-Latn-2017.yaml +1 -1
  18. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +5 -1
  19. data/maps/alalc-ell-Grek-Latn-1997.yaml +5 -1
  20. data/maps/alalc-ell-Grek-Latn-2010.yaml +1 -2
  21. data/maps/alalc-guj-Gujr-Latn-1997.yaml +266 -0
  22. data/maps/alalc-guj-Gujr-Latn-2011.yaml +64 -0
  23. data/maps/alalc-hin-Deva-Latn-1997.yaml +211 -0
  24. data/maps/alalc-hin-Deva-Latn-2011.yaml +47 -0
  25. data/maps/alalc-kat-Geok-Latn-1997.yaml +1 -1
  26. data/maps/alalc-kat-Geor-Latn-1997.yaml +5 -1
  27. data/maps/alalc-kor-Hang-Latn-1997.yaml +5 -1
  28. data/maps/alalc-mal-Mlym-Latn-1997.yaml +303 -0
  29. data/maps/alalc-mal-Mlym-Latn-2012.yaml +73 -0
  30. data/maps/alalc-mar-Deva-Latn-1997.yaml +21 -2
  31. data/maps/alalc-mar-Deva-Latn-2011.yaml +45 -0
  32. data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +1 -1
  33. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +1 -1
  34. data/maps/alalc-mon-Cyrl-Latn-1997.yaml +220 -0
  35. data/maps/{alalc-pan-Deva-Latn-1997.yaml → alalc-pan-Guru-Latn-1997.yaml} +23 -4
  36. data/maps/alalc-pan-Guru-Latn-2011.yaml +78 -0
  37. data/maps/alalc-per-Arab-Latn-1997.yaml +375 -0
  38. data/maps/alalc-pli-Deva-Latn-2012.yaml +144 -0
  39. data/maps/alalc-pra-Deva-Latn-2012.yaml +47 -0
  40. data/maps/alalc-rus-Cyrl-Latn-1997.yaml +5 -1
  41. data/maps/alalc-rus-Cyrl-Latn-2012.yaml +1 -1
  42. data/maps/alalc-san-Deva-Latn-2012.yaml +172 -0
  43. data/maps/alalc-sin-Sinh-Latn-1997.yaml +292 -0
  44. data/maps/alalc-sin-Sinh-Latn-2011.yaml +71 -0
  45. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +5 -1
  46. data/maps/alalc-srp-Cyrl-Latn-2013.yaml +1 -1
  47. data/maps/alalc-tam-Taml-Latn-1997.yaml +62 -0
  48. data/maps/alalc-tam-Taml-Latn-2011.yaml +58 -0
  49. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +5 -1
  50. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +1 -1
  51. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +1 -1
  52. data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +1 -1
  53. data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +1 -1
  54. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +1 -1
  55. data/maps/bgn-kor-Hang-Latn-1943.yaml +7 -3
  56. data/maps/bgn-kor-Kore-Latn-1943.yaml +3 -3
  57. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +1 -1
  58. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +1 -1
  59. data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +5 -1
  60. data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +5 -1
  61. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +1 -1
  62. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +2 -2
  63. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +6 -2
  64. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +5 -1
  65. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +5 -1
  66. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +5 -1
  67. data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +184 -0
  68. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +5 -1
  69. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +5 -1
  70. data/maps/{bgnpcgn-per-Arab-Latn-1956.yaml → bgnpcgn-fas-Arab-Latn-1956.yaml} +5 -1
  71. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +1 -1
  72. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +5 -1
  73. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +1 -1
  74. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +1 -1
  75. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +1 -1
  76. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +1 -1
  77. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +5 -1
  78. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +1 -1
  79. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +223 -0
  80. data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +31 -1
  81. data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +336 -0
  82. data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +639 -0
  83. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +459 -0
  84. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +168 -0
  85. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +5 -1
  86. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +5 -1
  87. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +220 -0
  88. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +240 -0
  89. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +5 -1
  90. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +3 -92
  91. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +127 -0
  92. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +82 -0
  93. data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +1 -1
  94. data/maps/bis-asm-Beng-Latn-13194-1991.yaml +1 -1
  95. data/maps/bis-ben-Beng-Latn-13194-1991.yaml +1 -1
  96. data/maps/bis-dev-Deva-Latn-13194-1991.yaml +1 -1
  97. data/maps/{bis-gjr-Gujr-Latn-13194-1991.yaml → bis-guj-Gujr-Latn-13194-1991.yaml} +17 -2
  98. data/maps/bis-knd-Knda-Latn-13194-1991.yaml +1 -1
  99. data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +1 -1
  100. data/maps/bis-ori-Orya-Latn-13194-1991.yaml +1 -1
  101. data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +1 -1
  102. data/maps/bis-tel-Telu-Latn-13194-1991.yaml +1 -1
  103. data/maps/bis-tml-Taml-Latn-13194-1991.yaml +1 -1
  104. data/maps/by-bel-Cyrl-Latn-1998.yaml +5 -1
  105. data/maps/by-bel-Cyrl-Latn-2007.yaml +1 -1
  106. data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +899 -0
  107. data/maps/din-hin-Deva-Latn-33904-2018.yaml +100 -0
  108. data/maps/din-kat-Geor-Latn-32707-2010.yaml +145 -0
  109. data/maps/din-mar-Deva-Latn-33904-2018.yaml +84 -0
  110. data/maps/din-nep-Deva-Latn-33904-2018.yaml +119 -0
  111. data/maps/din-pli-Deva-Latn-33904-2018.yaml +75 -0
  112. data/maps/din-pra-Deva-Latn-33904-2018.yaml +63 -0
  113. data/maps/din-san-Deva-Latn-33904-2018.yaml +338 -0
  114. data/maps/din-tam-Taml-Latn-33903-2016.yaml +213 -0
  115. data/maps/dos-nep-Deva-Latn-1997.yaml +15 -1
  116. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +3 -3
  117. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +2 -2
  118. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +2 -2
  119. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +2 -2
  120. data/maps/ggg-kat-Geor-Latn-2002.yaml +5 -1
  121. data/maps/gki-bel-Cyrl-Latn-1992.yaml +1 -1
  122. data/maps/gki-bel-Cyrl-Latn-2000.yaml +1 -1
  123. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +7 -3
  124. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +157 -0
  125. data/maps/hk-yue-Hani-Latn-1888.yaml +1 -1
  126. data/maps/icao-bel-Cyrl-Latn-9303.yaml +1 -1
  127. data/maps/icao-bul-Cyrl-Latn-9303.yaml +1 -1
  128. data/maps/{icao-per-Arab-Latn-9303.yaml → icao-fas-Arab-Latn-9303.yaml} +1 -1
  129. data/maps/icao-heb-Hebr-Latn-9303.yaml +1 -1
  130. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +1 -1
  131. data/maps/icao-rus-Cyrl-Latn-9303.yaml +1 -1
  132. data/maps/icao-srp-Cyrl-Latn-9303.yaml +1 -1
  133. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +1 -1
  134. data/maps/iso-ara-Arab-Latn-233-1984.yaml +1 -1
  135. data/maps/iso-asm-Beng-Latn-15919-2001.yaml +75 -0
  136. data/maps/iso-ben-Beng-Latn-15919-2001.yaml +175 -0
  137. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +8 -4
  138. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +8 -4
  139. data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +220 -0
  140. data/maps/iso-hin-Deva-Latn-15919-2001.yaml +87 -0
  141. data/maps/iso-inc-Deva-Latn-15919-2001.yaml +61 -0
  142. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +10 -6
  143. data/maps/iso-kan-Knda-Latn-15919-2001.yaml +220 -0
  144. data/maps/iso-kat-Geor-Latn-9984-1996.yaml +145 -0
  145. data/maps/iso-kor-Hang-Latn-1996-method1.yaml +240 -0
  146. data/maps/iso-kor-Hang-Latn-1996-method2.yaml +226 -0
  147. data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +281 -0
  148. data/maps/iso-mar-Deva-Latn-15919-2001.yaml +75 -0
  149. data/maps/iso-nep-Deva-Latn-15919-2001.yaml +87 -0
  150. data/maps/iso-ori-Orya-Latn-15919-2001.yaml +193 -0
  151. data/maps/iso-pan-Guru-Latn-15919-2001.yaml +222 -0
  152. data/maps/iso-pli-Beng-Latn-15919-2001.yaml +73 -0
  153. data/maps/iso-pli-Deva-Latn-15919-2001.yaml +74 -0
  154. data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +219 -0
  155. data/maps/iso-pli-Thai-Latn-15919-2001.yaml +55 -0
  156. data/maps/iso-pra-Deva-Latn-15919-2001.yaml +59 -0
  157. data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +366 -0
  158. data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +3 -3
  159. data/maps/iso-san-Deva-Latn-15919-2001.yaml +220 -0
  160. data/maps/iso-tam-Taml-Latn-15919-2001.yaml +159 -0
  161. data/maps/iso-tel-Telu-Latn-15919-2001.yaml +220 -0
  162. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +1 -1
  163. data/maps/kp-kor-Hang-Latn-2002.yaml +25 -17
  164. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +1 -1
  165. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +1 -1
  166. data/maps/mns-mon-Cyrl-Latn-5217-2012.yaml +163 -0
  167. data/maps/mns-mon-Latn-Cyrl-5217-2012.yaml +200 -0
  168. data/maps/moct-kor-Hang-Latn-2000.yaml +6 -2
  169. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +1 -1
  170. data/maps/mvd-bel-Cyrl-Latn-2008.yaml +2 -2
  171. data/maps/mvd-bel-Cyrl-Latn-2010.yaml +3 -3
  172. data/maps/mvd-rus-Cyrl-Latn-2008.yaml +2 -2
  173. data/maps/mvd-rus-Cyrl-Latn-2010.yaml +2 -2
  174. data/maps/odni-ara-Arab-Latn-2015.yaml +425 -0
  175. data/maps/odni-aze-Cyrl-Latn-2015.yaml +1 -1
  176. data/maps/odni-bel-Cyrl-Latn-2015.yaml +1 -1
  177. data/maps/odni-bul-Cyrl-Latn-2015.yaml +2 -2
  178. data/maps/odni-che-Cyrl-Latn-2015.yaml +169 -0
  179. data/maps/odni-fas-Arab-Latn-2015.yaml +406 -0
  180. data/maps/odni-hin-Deva-Latn-2015.yaml +1 -1
  181. data/maps/odni-kat-Geor-Latn-2015.yaml +1 -1
  182. data/maps/odni-kaz-Cyrl-Latn-2015.yaml +1 -1
  183. data/maps/odni-kir-Cyrl-Latn-2015.yaml +1 -1
  184. data/maps/odni-kor-Hang-Latn-2015.yaml +375 -0
  185. data/maps/odni-mkd-Cyrl-Latn-2015.yaml +1 -1
  186. data/maps/odni-per-Arab-Latn-2015.yaml +228 -0
  187. data/maps/odni-rus-Cyrl-Latn-2015.yaml +1 -1
  188. data/maps/odni-srp-Cyrl-Latn-2015.yaml +1 -1
  189. data/maps/odni-tat-Cyrl-Latn-2015.yaml +1 -1
  190. data/maps/odni-tgk-Cyrl-Latn-2015.yaml +1 -1
  191. data/maps/odni-uig-Cyrl-Latn-2015.yaml +1 -1
  192. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +1 -1
  193. data/maps/odni-urd-Arab-Latn-2015.yaml +1 -1
  194. data/maps/odni-uzb-Cyrl-Latn-2015.yaml +1 -1
  195. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +1 -1
  196. data/maps/royin-tha-Thai-Latn-1968.yaml +5 -1
  197. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +1 -1
  198. data/maps/royin-tha-Thai-Latn-1999.yaml +5 -1
  199. data/maps/sac-zho-Hans-Latn-1979.yaml +5 -1
  200. data/maps/sasm-mon-Mong-Latn-general-1978.yaml +389 -0
  201. data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +354 -0
  202. data/maps/ses-ara-Arab-Latn-1930.yaml +5 -1
  203. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +1 -1
  204. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +6 -2
  205. data/maps/ua-ukr-Cyrl-Latn-2007.yaml +75 -0
  206. data/maps/ua-ukr-Cyrl-Latn-2010.yaml +192 -0
  207. data/maps/{ungegn-amh-Ethi-Latn-2016.yaml → un-amh-Ethi-Latn-2016.yaml} +51 -24
  208. data/maps/un-ara-Arab-Latn-1971.yaml +1 -1
  209. data/maps/un-ara-Arab-Latn-1972.yaml +1 -1
  210. data/maps/un-ara-Arab-Latn-2017.yaml +1 -1
  211. data/maps/un-bel-Cyrl-Latn-2007.yaml +1 -1
  212. data/maps/un-ben-Beng-Latn-2016.yaml +1 -1
  213. data/maps/{un-ell-Grek-Latn-phonetic-1987.yaml → un-ell-Grek-Latn-1987-phonetic.yaml} +2 -2
  214. data/maps/un-ell-Grek-Latn-1987-tl.yaml +2 -2
  215. data/maps/un-ell-Grek-Latn-1987-ts.yaml +3 -3
  216. data/maps/un-hin-Deva-Latn-2016.yaml +222 -0
  217. data/maps/un-mar-Deva-Latn-2016.yaml +91 -0
  218. data/maps/un-mon-Mong-Latn-general-2013.yaml +264 -0
  219. data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +264 -0
  220. data/maps/un-nep-Deva-Latn-1972.yaml +204 -17
  221. data/maps/un-nep-Deva-Latn-2013.yaml +74 -0
  222. data/maps/un-rus-Cyrl-Latn-1987.yaml +1 -1
  223. data/maps/un-ukr-Cyrl-Latn-1998.yaml +35 -12
  224. data/maps/un-ukr-Cyrl-Latn-2012.yaml +162 -0
  225. data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +221 -0
  226. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +1 -1
  227. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +1 -1
  228. data/maps/{nil-kor-Hang-Hang-jamo.yaml → var-kor-Hang-Hang-jamo.yaml} +1 -1
  229. data/maps/var-kor-Hang-Latn-mr-1939.yaml +2 -2
  230. data/maps/var-kor-Kore-Hang-2013.yaml +1 -1
  231. data/maps/var-kor-Kore-Latn-mr-1939.yaml +1 -1
  232. data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +43 -0
  233. data/maps/var-mon-Mong-Latn-1930.yaml +102 -0
  234. data/maps/var-mon-Mong-Latn-lessing.yaml +272 -0
  235. data/maps/var-mon-Mong-Latn-vpmc.yaml +274 -0
  236. data/maps/var-pra-Deva-Latn-iast-1912.yaml +30 -0
  237. data/maps/var-san-Deva-Latn-iast-1912.yaml +149 -0
  238. data/maps/var-tha-Thai-Thai-phonemic.yaml +1 -1
  239. data/maps/var-tha-Thai-Zsym-ipa.yaml +1 -1
  240. data/maps/{var-zho-Hani-Latn-1979.yaml → var-zho-Hani-Latn-wd-1979.yaml} +6 -2
  241. data/spec/interscript/filenames_spec.rb +384 -0
  242. data/spec/interscript_spec.rb +7 -4
  243. metadata +105 -26
  244. data/bin/interscript +0 -41
  245. data/bin/rspec +0 -29
  246. data/bin/setup +0 -8
  247. data/lib/__pycache__/g2pwrapper.cpython-38.pyc +0 -0
  248. data/lib/interscript-opal.rb +0 -2
  249. data/lib/interscript/opal_map_translate.rb +0 -12
  250. data/maps/alalc-hin-Deva-Latn-2020.yaml +0 -159
  251. data/maps/un-mon-Mong-Latn-2013.yaml +0 -99
@@ -0,0 +1,100 @@
1
+ ---
2
+ authority_id: din
3
+ id: 33904-2018
4
+ language: iso-639-2:hin
5
+ source_script: Deva
6
+ destination_script: Latn
7
+ name: "DIN 33904:2018-10 Information and documentation - Romanization Devanagari, Hindi"
8
+ url: https://www.beuth.de/en/standard/din-33904/293049024
9
+ creation_date: 2018
10
+ description: |
11
+ Hindi system.
12
+
13
+ This standard specifies a fixed transliteration of Devanāgarī characters into Latin letters for all languages written in that script.
14
+ It is suitable for any application.
15
+
16
+ notes:
17
+ - |
18
+ Vowels:
19
+ The Ardhacandra ॅ is often used to denote English vowels:
20
+ EXAMPLE
21
+ बॅट bêṭa (bat)
22
+ डॉक्टर ḍôkṭara (doctor)
23
+ - |
24
+ Consonants:
25
+
26
+ Since Devanāgarī is a syllabic script, the vowel -a is inherent in every consonant.
27
+ It is always written in transliteration, including in word-final position.
28
+ EXAMPLE 1
29
+ पुस्तक pustaka
30
+
31
+ A stroke under the consonant, the so-called Virāma, indicates in the Devanāgarī script that the inherent -a does not apply.
32
+ EXAMPLE 2
33
+ वाक् vāk
34
+
35
+ The anusvāra is always represented with -ṃ-.
36
+ EXAMPLE 3
37
+ संस्करण saṃskaraṇa
38
+
39
+ Before k, kh, g, gh, c, ch, j, jh, ṭ, ṭh, ḍ, ḍh, t, th, d, dh, p, ph, b, bh, the anusvāra is transformed into the corresponding class nasal.
40
+ EXAMPLE 4
41
+ कंघी kaṃghī becomes kaṅghī
42
+ पंजाबी paṃjābī becomes pañjābī
43
+ पंडित paṃḍita becomes paṇḍita
44
+ संधी saṃdhī becomes sandhī
45
+ दिसंबर disaṃbara becomes disambara
46
+
47
+ Anunāsika or Candrabindu signals the nasalization of vowels
48
+
49
+ EXAMPLE 5
50
+ माँ māṁ
51
+
52
+ tests:
53
+ - source: "गंभीर मरीजों के मामले में भारत दूसरे नंबर पर"
54
+ expected: "gambhīra marījoṃ ke māmale meṃ bhārata dūsare nambara para"
55
+ - source: "कोरोना अपडेट्स"
56
+ expected: "koronā apaḍeṭsa"
57
+ - source: "सीडीसी चीफ का बयान अहम"
58
+ expected: "sīḍīsī cīpha kā bayāna ahama"
59
+ - source: "गूगल प्ले स्टोर पर पेटीएम की वापसी"
60
+ expected: "gūgala ple sṭora para peṭīema kī vāpasī"
61
+ - source: "भारत में गैंबलिंग की इजाजत नहीं"
62
+ expected: "bhārata meṃ gaimbaliṅga kī ijājata nahīṃ"
63
+ - source: "कोरोना वैक्सीन मुद्दे पर घिरे राष्ट्रपति; जो बाइडेन बोले- मुझे और देश को वैज्ञानिकों पर भरोसा है, डोनाल्ड ट्रम्प पर नहीं"
64
+ expected: "koronā vaiksīna mudde para ghire rāṣṭrapati; jo bāiḍena bole- mujhe aura deśa ko vaijñānikoṃ para bharosā hai, ḍonālḍa ṭrampa para nahīṃ"
65
+ - source: "गूगल की कार्रवाई पर पेटीएम ने कहा था कि ऐप को अस्थायी तौर पर प्ले-स्टोर से हटाया गया है, आपके पैसे सुरक्षित हैं"
66
+ expected: "gūgala kī kārravāī para peṭīema ne kahā thā ki aipa ko asthāyī taura para ple-sṭora se haṭāyā gayā hai, āpake paise surakṣita haiṃ"
67
+ - source: "०१९८"
68
+ expected: "0198"
69
+
70
+
71
+ map:
72
+
73
+ inherit: din-san-Deva-Latn-33904-2018
74
+
75
+ characters:
76
+
77
+ 'ॲ': 'ê'
78
+ 'ऑ': 'ô'
79
+
80
+ # Dotted variants
81
+ 'क़': 'ḵa'
82
+ 'ख़': 'ḵha'
83
+ 'ग़': 'g̲a' # \u0067 + \u0332
84
+ 'ज़': 'j̲a' # \u006a + \u0332
85
+ 'ड़': 'ṙa'
86
+ 'ढ़': 'ṙha'
87
+ 'फ़': 'p̲ha' # \u0070 + \u0332
88
+ 'स़': 's̲a' # \u0073 + \u0332
89
+ 'ह़': 'h̲a' # \u0068 + \u0332
90
+
91
+ # Dotted variants Virāma
92
+ 'क़्': 'ḵ'
93
+ 'ख़्': 'ḵh'
94
+ 'ग़्': 'g̲' # \u0067 + \u0332
95
+ 'ज़्': 'j̲' # \u006a + \u0332
96
+ 'ड़्': 'ṙ'
97
+ 'ढ़्': 'ṙh'
98
+ 'फ़्': 'p̲h' # \u0070 + \u0332
99
+ 'स़्': 's̲' # \u0073 + \u0332
100
+ 'ह़्': 'h̲' # \u0068 + \u0332
@@ -0,0 +1,145 @@
1
+ ---
2
+ authority_id: din
3
+ id: 32707-2010
4
+ language: iso-639-2:kat
5
+ source_script: Geor
6
+ destination_script: Latn
7
+ name: "DIN 32707:2010-01 Information und Dokumentation - Umschrift des georgischen Alphabets"
8
+ url: https://www.beuth.de/de/norm/din-32707/122821999
9
+ creation_date: 2010
10
+ confirmation_date: 2010
11
+ description: |
12
+ Information and documentation - Romanization of the Georgian alphabet.
13
+
14
+ notes:
15
+
16
+ tests:
17
+
18
+ - source: ხაოფსე
19
+ expected: xaop̕se
20
+
21
+ - source: ჭლოუ
22
+ expected: člou
23
+
24
+ - source: ჩოხულდი
25
+ expected: č̕oxuldi
26
+
27
+ - source: ქვემო ლინდა
28
+ expected: k̕vemo linda
29
+
30
+ - source: ტამკვაჩ იგვავერა
31
+ expected: tamkvač̕ igvavera
32
+
33
+ - source: სვანეთი
34
+ expected: svanet̕i
35
+
36
+ - source: საცხვარისი
37
+ expected: sac̕xvarisi
38
+
39
+ - source: მუხრან-თელეთი
40
+ expected: muxran-t̕elet̕i
41
+
42
+ - source: მუცდი
43
+ expected: muc̕di
44
+
45
+ - source: ლეჩხუმი
46
+ expected: leč̕xumi
47
+
48
+ - source: ვერხნაია მწარა
49
+ expected: verxnaia mcara
50
+
51
+ - source: ეგრისის ქედი
52
+ expected: egrisis k̕edi
53
+
54
+ - source: დოჩარიფშა
55
+ expected: doč̕arip̕ša
56
+
57
+ - source: ბოლოკო
58
+ expected: boloko
59
+
60
+ - source: აჭანდარა
61
+ expected: ačandara
62
+
63
+ - source: აუალიცა
64
+ expected: aualic̕a
65
+
66
+ - source: აკალამრა
67
+ expected: akalamra
68
+
69
+ - source: ლასილი
70
+ expected: lasili
71
+
72
+ - source: გუბაზეული
73
+ expected: gubazeuli
74
+
75
+ - source: ბაყაყი
76
+ expected: baqaqi
77
+
78
+ - source: ძროხა
79
+ expected: jroxa
80
+
81
+ - source: ჰაერი
82
+ expected: haeri
83
+
84
+ - source: ჟოლო
85
+ expected: žolo
86
+
87
+ - source: ჯართი
88
+ expected: ǰart̕i
89
+
90
+ - source: ღრმაღელე
91
+ expected: ġrmaġele
92
+
93
+ map:
94
+ characters:
95
+ '\u10d0' : 'a' # ა
96
+ '\u10d1' : 'b' # ბ
97
+ '\u10d2' : 'g' # გ
98
+ '\u10d3' : 'd' # დ
99
+ '\u10d4' : 'e' # ე
100
+ '\u10d5' : 'v' # ვ
101
+ '\u10d6' : 'z' # ზ
102
+
103
+ '\u10f1' : 'ê' # ჱ
104
+
105
+ '\u10d7' : 't̕' # თ
106
+ '\u10d8' : 'i' # ი
107
+ '\u10d9' : 'k' # კ
108
+ '\u10da' : 'l' # ლ
109
+ '\u10db' : 'm' # მ
110
+ '\u10dc' : 'n' # ნ
111
+
112
+ '\u10f2' : 'y' # ჲ
113
+
114
+ '\u10dd' : 'o' # ო
115
+ '\u10de' : 'p' # პ
116
+ '\u10df' : 'ž' # ჟ
117
+ '\u10e0' : 'r' # რ
118
+ '\u10e1' : 's' # ს
119
+ '\u10e2' : 't' # ტ
120
+
121
+ '\u10f3' : 'w' # ჳ
122
+
123
+ '\u10e3' : 'u' # უ
124
+ '\u10e4' : 'p̕' # ფ
125
+ '\u10e5' : 'k̕' # ქ
126
+ '\u10e6' : 'ġ' # ღ
127
+ '\u10e7' : 'q' # ყ
128
+ '\u10e8' : 'š' # შ
129
+ '\u10e9' : 'č̕' # ჩ
130
+ '\u10ea' : 'c̕' # ც
131
+ '\u10eb' : 'j' # ძ
132
+ '\u10ec' : 'c' # წ
133
+ '\u10ed' : 'č' # ჭ
134
+ '\u10ee' : 'x' # ხ
135
+
136
+ '\u10f4' : 'q̕' # ჴ
137
+
138
+ '\u10ef' : 'ǰ' # ჯ
139
+ '\u10f0' : 'h' # ჰ
140
+
141
+ '\u10f5' : 'ô' # ჵ
142
+
143
+ '\u10f6' : 'f' # ჶ
144
+ '\u10f7' : 'ẹ' # ჷ
145
+ '\u10f8' : 'ʼ' # ჸ
@@ -0,0 +1,84 @@
1
+ ---
2
+ authority_id: din
3
+ id: 33904-2018
4
+ language: iso-639-2:mar
5
+ source_script: Deva
6
+ destination_script: Latn
7
+ name: "DIN 33904:2018-10 Information and documentation - Romanization Devanagari, Marathi"
8
+ url: https://www.beuth.de/en/standard/din-33904/293049024
9
+ creation_date: 2018
10
+ description: |
11
+ Marathi system.
12
+
13
+ Information und Dokumentation - Transliteration Devanagari
14
+
15
+ This standard specifies a fixed transliteration of Devanāgarī characters into Latin letters for all languages written in that script.
16
+ It is suitable for any application.
17
+
18
+ notes:
19
+ - |
20
+ Vowels:
21
+ The Ardhacandra ॅ is often used to denote English vowels:
22
+ EXAMPLE
23
+ बॅट bêṭa (bat)
24
+ डॉक्टर ḍôkṭara (doctor)
25
+ - |
26
+ Consonants:
27
+
28
+ Since Devanāgarī is a syllabic script, the vowel -a is inherent in every consonant.
29
+ It is always written in transliteration, including in word-final position.
30
+ EXAMPLE 1
31
+ पुस्तक pustaka
32
+
33
+ A stroke under the consonant, the so-called Virāma, indicates in the Devanāgarī script that the inherent -a does not apply.
34
+ EXAMPLE 2
35
+ वाक् vāk
36
+
37
+ The anusvāra is always represented with -ṃ-.
38
+ EXAMPLE 3
39
+ संस्करण saṃskaraṇa
40
+
41
+ Before k, kh, g, gh, c, ch, j, jh, ṭ, ṭh, ḍ, ḍh, t, th, d, dh, p, ph, b, bh, the anusvāra is transformed into the corresponding class nasal.
42
+ EXAMPLE 4
43
+ कंघी kaṃghī becomes kaṅghī
44
+ पंजाबी paṃjābī becomes pañjābī
45
+ पंडित paṃḍita becomes paṇḍita
46
+ संधी saṃdhī becomes sandhī
47
+ दिसंबर disaṃbara becomes disambara
48
+
49
+ Anunāsika or Candrabindu signals the nasalization of vowels
50
+
51
+ EXAMPLE 5
52
+ माँ māṁ
53
+
54
+ tests:
55
+ - source: "ठाणे - जिल्ह्यात बुधवारी एक हजार रुग्णांची वाढ, तर जणांच्या मृत्यूची नोंद"
56
+ expected: "ṭhāṇe - jilhyāta budhavārī eka hajāra rugṇāñcī vāḍha, tara jaṇāñcyā mṛtyūcī nonda"
57
+ - source: "एकता कपूर पुन्हा अडकली वादात, वेबसीरिजमधल्या 'त्या' सीनमुळे जमावाची घरावर दगडफेक"
58
+ expected: "ekatā kapūra punhā aḍakalī vādāta, vebasīrijamadhalyā 'tyā' sīnamuḷe jamāvācī gharāvara dagaḍapheka"
59
+ - source: "जाणून घ्या, बीएमसीच्या अधिकाऱ्यांनी कंगना राणौतच्या ऑफिसमधले नक्की काय- काय तोडलं"
60
+ expected: "jāṇūna ghyā, bīemasīcyā adhikāऱ्yānnī kaṅganā rāṇautacyā ôphisamadhale nakkī kāya- kāya toḍalaṃ"
61
+ - source: "कंगना मुंबईत दाखल होण्यापूर्वी 'मातोश्री'वरून फर्मान सुटले; प्रवक्त्यांना सक्त आदेश"
62
+ expected: "kaṅganā mumbaīta dākhala hoṇyāpūrvī 'mātośrī'varūna pharmāna suṭale; pravaktyānnā sakta ādeśa"
63
+ - source: "मराठा आरक्षणास तात्पुरती स्थगिती; सर्वोच्च न्यायालयाचा निर्णय"
64
+ expected: "marāṭhā ārakṣaṇāsa tātpuratī sthagitī; sarvocca nyāyālayācā nirṇaya"
65
+ - source: "भारताच्या तिन्ही लशींचा पहिला टप्पा यशस्वी, वाचा कधी येणार बाजारात"
66
+ expected: "bhāratācyā tinhī laśīñcā pahilā ṭappā yaśasvī, vācā kadhī yeṇāra bājārāta"
67
+ - source: "रुग्णवाढीमुळे खाटांची चणचण"
68
+ expected: "rugṇavāḍhīmuḷe khāṭāñcī caṇacaṇa"
69
+ - source: "पीएम स्वनिधी कर्ज योजनेला मुंबईतून अल्प प्रतिसाद"
70
+ expected: "pīema svanidhī karja yojanelā mumbaītūna alpa pratisāda"
71
+ - source: "सांताक्रूझ-चेंबूर लिंक रोडवरील उन्नत मार्गाला स्थगिती"
72
+ expected: "sāntākrūjha-cembūra liṅka roḍavarīla unnata mārgālā sthagitī"
73
+ - source: "संपादक अर्णब गोस्वामी यांच्याविरूद्ध खडक पोलिस ठाण्यात तक्रार"
74
+ expected: "sampādaka arṇaba gosvāmī yāñcyāvirūddha khaḍaka polisa ṭhāṇyāta takrāra"
75
+
76
+
77
+ map:
78
+
79
+ inherit: 'din-san-Deva-Latn-33904-2018'
80
+
81
+ characters:
82
+
83
+ 'ॲ': 'ê'
84
+ 'ऑ': 'ô'
@@ -0,0 +1,119 @@
1
+ ---
2
+ authority_id: din
3
+ id: 33904-2018
4
+ language: iso-639-2:nep
5
+ source_script: Deva
6
+ destination_script: Latn
7
+ name: "DIN 33904:2018-10 Information and documentation - Romanization Devanagari, Nepali"
8
+ url: https://www.beuth.de/en/standard/din-33904/293049024
9
+ creation_date: 2018
10
+ description: |
11
+ Nepali system.
12
+
13
+ This standard specifies a fixed transliteration of Devanāgarī characters into Latin letters for all languages written in that script.
14
+ It is suitable for any application.
15
+
16
+ notes:
17
+ - |
18
+ Vowels:
19
+ The Ardhacandra ॅ is often used to denote English vowels:
20
+ EXAMPLE
21
+ बॅट bêṭa (bat)
22
+ डॉक्टर ḍôkṭara (doctor)
23
+ - |
24
+ Consonants:
25
+
26
+ Since Devanāgarī is a syllabic script, the vowel -a is inherent in every consonant.
27
+ It is always written in transliteration, including in word-final position.
28
+ EXAMPLE 1
29
+ पुस्तक pustaka
30
+
31
+ A stroke under the consonant, the so-called Virāma, indicates in the Devanāgarī script that the inherent -a does not apply.
32
+ EXAMPLE 2
33
+ वाक् vāk
34
+
35
+ The anusvāra is always represented with -ṃ-.
36
+ EXAMPLE 3
37
+ संस्करण saṃskaraṇa
38
+
39
+ Before k, kh, g, gh, c, ch, j, jh, ṭ, ṭh, ḍ, ḍh, t, th, d, dh, p, ph, b, bh, the anusvāra is transformed into the corresponding class nasal.
40
+ EXAMPLE 4
41
+ कंघी kaṃghī becomes kaṅghī
42
+ पंजाबी paṃjābī becomes pañjābī
43
+ पंडित paṃḍita becomes paṇḍita
44
+ संधी saṃdhī becomes sandhī
45
+ दिसंबर disaṃbara becomes disambara
46
+
47
+ Anunāsika or Candrabindu signals the nasalization of vowels
48
+
49
+ EXAMPLE 5
50
+ माँ māṁ
51
+
52
+ tests:
53
+ - source: "लेखन"
54
+ expected: "lekhana"
55
+ - source: "मुद्रा"
56
+ expected: "mudrā"
57
+ - source: "प्रशंसा"
58
+ expected: "praśaṃsā"
59
+ - source: "अंक"
60
+ expected: "aṅka"
61
+ - source: "नेकपाले स्थगित स्थायी कमिटीको बैठक भदौ गते बोलाउने भएको"
62
+ expected: "nekapāle sthagita sthāyī kamiṭīko baiṭhaka bhadau gate bolāune bhaeko"
63
+ - source: "न घर रह्यो, न परिवार"
64
+ expected: "na ghara rahyo, na parivāra"
65
+ - source: "ढोरपाटनमा भुजीखोला बाढीपहिरोले अभिभावक गुमाएका बालबालिकाको बिचल्ली"
66
+ expected: "ḍhorapāṭanamā bhujīkholā bāḍhīpahirole abhibhāvaka gumāekā bālabālikāko bicallī"
67
+ - source: "सुस्मिताका काका हेमबहादुर र काकीलाई पनि पहिरोले बगायो"
68
+ expected: "susmitākā kākā hemabahādura ra kākīlāī pani pahirole bagāyo"
69
+ - source: "संविधान जारी भएसँगै सार्वजनिक प्रशासनमा नयाँ उत्साह आउने अपेक्षा थियो"
70
+ expected: "saṃvidhāna jārī bhaesaṁgai sārvajanika praśāsanamā nayāṁ utsāha āune apekṣā thiyo"
71
+ - source: "देशमा कोरोना संक्रमित र मृतकको संख्या हरेक दिन बढ्दो छ"
72
+ expected: "deśamā koronā saṅkramita ra mṛtakako saṅkhyā hareka dina baḍhdo cha"
73
+ - source: "गाउँपालिकाका अध्यक्ष टिका गुरुङका अनुसार विष्णुदासलाई राजुले सुत्नका लागि बेलुका साथी लगेका थिए"
74
+ expected: "gāuṁpālikākā adhyakṣa ṭikā guruṅakā anusāra viṣṇudāsalāī rājule sutnakā lāgi belukā sāthī lagekā thie"
75
+ - source: "यो आयोजना गाउँपालिकाको केन्द्र तेल्लोकमा पर्छ"
76
+ expected: "yo āyojanā gāuṁpālikāko kendra tellokamā parcha"
77
+ - source: "सुस्मिताका काका हेमबहादुर र काकीलाई पनि पहिरोले बगायो"
78
+ expected: "susmitākā kākā hemabahādura ra kākīlāī pani pahirole bagāyo"
79
+ - source: "चैत पहिलो साता घर आएका उनी लकडाउन भएपछि यतै रोकिए"
80
+ expected: "caita pahilo sātā ghara āekā unī lakaḍāuna bhaepachi yatai rokie"
81
+ - source: "काम गर्न जानेको हकमा रोजगारदाता कम्पनीको पत्रसँगै वडा र जिल्ला प्रशासनको सिफारिस अनिवार्य गरिएको छ"
82
+ expected: "kāma garna jāneko hakamā rojagāradātā kampanīko patrasaṁgai vaḍā ra jillā praśāsanako siphārisa anivārya garieko cha"
83
+ - source: "दुःख"
84
+ expected: "duḥkha"
85
+
86
+
87
+ map:
88
+
89
+ inherit: 'din-san-Deva-Latn-33904-2018'
90
+
91
+ characters:
92
+
93
+ 'ॲ': 'ê'
94
+ 'ऑ': 'ô'
95
+
96
+ # Dotted variants
97
+ 'क़': 'ḵa'
98
+ 'ख़': 'ḵha'
99
+ 'ग़': 'g̲a' # \u0067 + \u0332
100
+ 'ज़': 'j̲a' # \u006a + \u0332
101
+ 'ड़': 'ṙa'
102
+ 'ढ़': 'ṙha'
103
+ 'फ़': 'p̲ha' # \u0070 + \u0332
104
+ 'स़': 's̲a' # \u0073 + \u0332
105
+ 'ह़': 'h̲a' # \u0068 + \u0332
106
+ 'व़': 'v̲a' # \u0076 + \u0332
107
+
108
+ # Dotted variants Virāma
109
+ 'क़्': 'ḵ'
110
+ 'ख़्': 'ḵh'
111
+ 'ग़्': 'g̲' # \u0067 + \u0332
112
+ 'ज़्': 'j̲' # \u006a + \u0332
113
+ 'ड़्': 'ṙ'
114
+ 'ढ़्': 'ṙh'
115
+ 'फ़्': 'p̲h' # \u0070 + \u0332
116
+ 'स़्': 's̲' # \u0073 + \u0332
117
+ 'ह़्': 'h̲' # \u0068 + \u0332
118
+
119
+