interscript 0.1.6 → 0.1.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (251) hide show
  1. checksums.yaml +4 -4
  2. data/lib/interscript.rb +10 -6
  3. data/lib/interscript/fs.rb +0 -2
  4. data/lib/interscript/mapping.rb +1 -1
  5. data/lib/interscript/opal.rb +38 -8
  6. data/lib/interscript/opal/entrypoint.rb +12 -0
  7. data/lib/interscript/opal/map_translate.rb +7 -0
  8. data/lib/interscript/version.rb +1 -1
  9. data/maps/acadsin-zho-Hani-Latn-2002.yaml +5 -1
  10. data/maps/alalc-amh-Ethi-Latn-1997.yaml +5 -1
  11. data/maps/alalc-amh-Ethi-Latn-2011.yaml +1 -1
  12. data/maps/alalc-ara-Arab-Latn-1997.yaml +5 -1
  13. data/maps/alalc-asm-Deva-Latn-1997.yaml +9 -3
  14. data/maps/alalc-asm-Deva-Latn-2012.yaml +40 -0
  15. data/maps/alalc-aze-Cyrl-Latn-1997.yaml +5 -1
  16. data/maps/alalc-bel-Cyrl-Latn-1997.yaml +5 -1
  17. data/maps/alalc-ben-Beng-Latn-2017.yaml +1 -1
  18. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +5 -1
  19. data/maps/alalc-ell-Grek-Latn-1997.yaml +5 -1
  20. data/maps/alalc-ell-Grek-Latn-2010.yaml +1 -2
  21. data/maps/alalc-guj-Gujr-Latn-1997.yaml +266 -0
  22. data/maps/alalc-guj-Gujr-Latn-2011.yaml +64 -0
  23. data/maps/alalc-hin-Deva-Latn-1997.yaml +211 -0
  24. data/maps/alalc-hin-Deva-Latn-2011.yaml +47 -0
  25. data/maps/alalc-kat-Geok-Latn-1997.yaml +1 -1
  26. data/maps/alalc-kat-Geor-Latn-1997.yaml +5 -1
  27. data/maps/alalc-kor-Hang-Latn-1997.yaml +5 -1
  28. data/maps/alalc-mal-Mlym-Latn-1997.yaml +303 -0
  29. data/maps/alalc-mal-Mlym-Latn-2012.yaml +73 -0
  30. data/maps/alalc-mar-Deva-Latn-1997.yaml +21 -2
  31. data/maps/alalc-mar-Deva-Latn-2011.yaml +45 -0
  32. data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +1 -1
  33. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +1 -1
  34. data/maps/alalc-mon-Cyrl-Latn-1997.yaml +220 -0
  35. data/maps/{alalc-pan-Deva-Latn-1997.yaml → alalc-pan-Guru-Latn-1997.yaml} +23 -4
  36. data/maps/alalc-pan-Guru-Latn-2011.yaml +78 -0
  37. data/maps/alalc-per-Arab-Latn-1997.yaml +375 -0
  38. data/maps/alalc-pli-Deva-Latn-2012.yaml +144 -0
  39. data/maps/alalc-pra-Deva-Latn-2012.yaml +47 -0
  40. data/maps/alalc-rus-Cyrl-Latn-1997.yaml +5 -1
  41. data/maps/alalc-rus-Cyrl-Latn-2012.yaml +1 -1
  42. data/maps/alalc-san-Deva-Latn-2012.yaml +172 -0
  43. data/maps/alalc-sin-Sinh-Latn-1997.yaml +292 -0
  44. data/maps/alalc-sin-Sinh-Latn-2011.yaml +71 -0
  45. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +5 -1
  46. data/maps/alalc-srp-Cyrl-Latn-2013.yaml +1 -1
  47. data/maps/alalc-tam-Taml-Latn-1997.yaml +62 -0
  48. data/maps/alalc-tam-Taml-Latn-2011.yaml +58 -0
  49. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +5 -1
  50. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +1 -1
  51. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +1 -1
  52. data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +1 -1
  53. data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +1 -1
  54. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +1 -1
  55. data/maps/bgn-kor-Hang-Latn-1943.yaml +7 -3
  56. data/maps/bgn-kor-Kore-Latn-1943.yaml +3 -3
  57. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +1 -1
  58. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +1 -1
  59. data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +5 -1
  60. data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +5 -1
  61. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +1 -1
  62. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +2 -2
  63. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +6 -2
  64. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +5 -1
  65. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +5 -1
  66. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +5 -1
  67. data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +184 -0
  68. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +5 -1
  69. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +5 -1
  70. data/maps/{bgnpcgn-per-Arab-Latn-1956.yaml → bgnpcgn-fas-Arab-Latn-1956.yaml} +5 -1
  71. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +1 -1
  72. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +5 -1
  73. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +1 -1
  74. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +1 -1
  75. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +1 -1
  76. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +1 -1
  77. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +5 -1
  78. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +1 -1
  79. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +223 -0
  80. data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +31 -1
  81. data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +336 -0
  82. data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +639 -0
  83. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +459 -0
  84. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +168 -0
  85. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +5 -1
  86. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +5 -1
  87. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +220 -0
  88. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +240 -0
  89. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +5 -1
  90. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +3 -92
  91. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +127 -0
  92. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +82 -0
  93. data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +1 -1
  94. data/maps/bis-asm-Beng-Latn-13194-1991.yaml +1 -1
  95. data/maps/bis-ben-Beng-Latn-13194-1991.yaml +1 -1
  96. data/maps/bis-dev-Deva-Latn-13194-1991.yaml +1 -1
  97. data/maps/{bis-gjr-Gujr-Latn-13194-1991.yaml → bis-guj-Gujr-Latn-13194-1991.yaml} +17 -2
  98. data/maps/bis-knd-Knda-Latn-13194-1991.yaml +1 -1
  99. data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +1 -1
  100. data/maps/bis-ori-Orya-Latn-13194-1991.yaml +1 -1
  101. data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +1 -1
  102. data/maps/bis-tel-Telu-Latn-13194-1991.yaml +1 -1
  103. data/maps/bis-tml-Taml-Latn-13194-1991.yaml +1 -1
  104. data/maps/by-bel-Cyrl-Latn-1998.yaml +5 -1
  105. data/maps/by-bel-Cyrl-Latn-2007.yaml +1 -1
  106. data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +899 -0
  107. data/maps/din-hin-Deva-Latn-33904-2018.yaml +100 -0
  108. data/maps/din-kat-Geor-Latn-32707-2010.yaml +145 -0
  109. data/maps/din-mar-Deva-Latn-33904-2018.yaml +84 -0
  110. data/maps/din-nep-Deva-Latn-33904-2018.yaml +119 -0
  111. data/maps/din-pli-Deva-Latn-33904-2018.yaml +75 -0
  112. data/maps/din-pra-Deva-Latn-33904-2018.yaml +63 -0
  113. data/maps/din-san-Deva-Latn-33904-2018.yaml +338 -0
  114. data/maps/din-tam-Taml-Latn-33903-2016.yaml +213 -0
  115. data/maps/dos-nep-Deva-Latn-1997.yaml +15 -1
  116. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +3 -3
  117. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +2 -2
  118. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +2 -2
  119. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +2 -2
  120. data/maps/ggg-kat-Geor-Latn-2002.yaml +5 -1
  121. data/maps/gki-bel-Cyrl-Latn-1992.yaml +1 -1
  122. data/maps/gki-bel-Cyrl-Latn-2000.yaml +1 -1
  123. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +7 -3
  124. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +157 -0
  125. data/maps/hk-yue-Hani-Latn-1888.yaml +1 -1
  126. data/maps/icao-bel-Cyrl-Latn-9303.yaml +1 -1
  127. data/maps/icao-bul-Cyrl-Latn-9303.yaml +1 -1
  128. data/maps/{icao-per-Arab-Latn-9303.yaml → icao-fas-Arab-Latn-9303.yaml} +1 -1
  129. data/maps/icao-heb-Hebr-Latn-9303.yaml +1 -1
  130. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +1 -1
  131. data/maps/icao-rus-Cyrl-Latn-9303.yaml +1 -1
  132. data/maps/icao-srp-Cyrl-Latn-9303.yaml +1 -1
  133. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +1 -1
  134. data/maps/iso-ara-Arab-Latn-233-1984.yaml +1 -1
  135. data/maps/iso-asm-Beng-Latn-15919-2001.yaml +75 -0
  136. data/maps/iso-ben-Beng-Latn-15919-2001.yaml +175 -0
  137. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +8 -4
  138. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +8 -4
  139. data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +220 -0
  140. data/maps/iso-hin-Deva-Latn-15919-2001.yaml +87 -0
  141. data/maps/iso-inc-Deva-Latn-15919-2001.yaml +61 -0
  142. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +10 -6
  143. data/maps/iso-kan-Knda-Latn-15919-2001.yaml +220 -0
  144. data/maps/iso-kat-Geor-Latn-9984-1996.yaml +145 -0
  145. data/maps/iso-kor-Hang-Latn-1996-method1.yaml +240 -0
  146. data/maps/iso-kor-Hang-Latn-1996-method2.yaml +226 -0
  147. data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +281 -0
  148. data/maps/iso-mar-Deva-Latn-15919-2001.yaml +75 -0
  149. data/maps/iso-nep-Deva-Latn-15919-2001.yaml +87 -0
  150. data/maps/iso-ori-Orya-Latn-15919-2001.yaml +193 -0
  151. data/maps/iso-pan-Guru-Latn-15919-2001.yaml +222 -0
  152. data/maps/iso-pli-Beng-Latn-15919-2001.yaml +73 -0
  153. data/maps/iso-pli-Deva-Latn-15919-2001.yaml +74 -0
  154. data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +219 -0
  155. data/maps/iso-pli-Thai-Latn-15919-2001.yaml +55 -0
  156. data/maps/iso-pra-Deva-Latn-15919-2001.yaml +59 -0
  157. data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +366 -0
  158. data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +3 -3
  159. data/maps/iso-san-Deva-Latn-15919-2001.yaml +220 -0
  160. data/maps/iso-tam-Taml-Latn-15919-2001.yaml +159 -0
  161. data/maps/iso-tel-Telu-Latn-15919-2001.yaml +220 -0
  162. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +1 -1
  163. data/maps/kp-kor-Hang-Latn-2002.yaml +25 -17
  164. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +1 -1
  165. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +1 -1
  166. data/maps/mns-mon-Cyrl-Latn-5217-2012.yaml +163 -0
  167. data/maps/mns-mon-Latn-Cyrl-5217-2012.yaml +200 -0
  168. data/maps/moct-kor-Hang-Latn-2000.yaml +6 -2
  169. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +1 -1
  170. data/maps/mvd-bel-Cyrl-Latn-2008.yaml +2 -2
  171. data/maps/mvd-bel-Cyrl-Latn-2010.yaml +3 -3
  172. data/maps/mvd-rus-Cyrl-Latn-2008.yaml +2 -2
  173. data/maps/mvd-rus-Cyrl-Latn-2010.yaml +2 -2
  174. data/maps/odni-ara-Arab-Latn-2015.yaml +425 -0
  175. data/maps/odni-aze-Cyrl-Latn-2015.yaml +1 -1
  176. data/maps/odni-bel-Cyrl-Latn-2015.yaml +1 -1
  177. data/maps/odni-bul-Cyrl-Latn-2015.yaml +2 -2
  178. data/maps/odni-che-Cyrl-Latn-2015.yaml +169 -0
  179. data/maps/odni-fas-Arab-Latn-2015.yaml +406 -0
  180. data/maps/odni-hin-Deva-Latn-2015.yaml +1 -1
  181. data/maps/odni-kat-Geor-Latn-2015.yaml +1 -1
  182. data/maps/odni-kaz-Cyrl-Latn-2015.yaml +1 -1
  183. data/maps/odni-kir-Cyrl-Latn-2015.yaml +1 -1
  184. data/maps/odni-kor-Hang-Latn-2015.yaml +375 -0
  185. data/maps/odni-mkd-Cyrl-Latn-2015.yaml +1 -1
  186. data/maps/odni-per-Arab-Latn-2015.yaml +228 -0
  187. data/maps/odni-rus-Cyrl-Latn-2015.yaml +1 -1
  188. data/maps/odni-srp-Cyrl-Latn-2015.yaml +1 -1
  189. data/maps/odni-tat-Cyrl-Latn-2015.yaml +1 -1
  190. data/maps/odni-tgk-Cyrl-Latn-2015.yaml +1 -1
  191. data/maps/odni-uig-Cyrl-Latn-2015.yaml +1 -1
  192. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +1 -1
  193. data/maps/odni-urd-Arab-Latn-2015.yaml +1 -1
  194. data/maps/odni-uzb-Cyrl-Latn-2015.yaml +1 -1
  195. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +1 -1
  196. data/maps/royin-tha-Thai-Latn-1968.yaml +5 -1
  197. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +1 -1
  198. data/maps/royin-tha-Thai-Latn-1999.yaml +5 -1
  199. data/maps/sac-zho-Hans-Latn-1979.yaml +5 -1
  200. data/maps/sasm-mon-Mong-Latn-general-1978.yaml +389 -0
  201. data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +354 -0
  202. data/maps/ses-ara-Arab-Latn-1930.yaml +5 -1
  203. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +1 -1
  204. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +6 -2
  205. data/maps/ua-ukr-Cyrl-Latn-2007.yaml +75 -0
  206. data/maps/ua-ukr-Cyrl-Latn-2010.yaml +192 -0
  207. data/maps/{ungegn-amh-Ethi-Latn-2016.yaml → un-amh-Ethi-Latn-2016.yaml} +51 -24
  208. data/maps/un-ara-Arab-Latn-1971.yaml +1 -1
  209. data/maps/un-ara-Arab-Latn-1972.yaml +1 -1
  210. data/maps/un-ara-Arab-Latn-2017.yaml +1 -1
  211. data/maps/un-bel-Cyrl-Latn-2007.yaml +1 -1
  212. data/maps/un-ben-Beng-Latn-2016.yaml +1 -1
  213. data/maps/{un-ell-Grek-Latn-phonetic-1987.yaml → un-ell-Grek-Latn-1987-phonetic.yaml} +2 -2
  214. data/maps/un-ell-Grek-Latn-1987-tl.yaml +2 -2
  215. data/maps/un-ell-Grek-Latn-1987-ts.yaml +3 -3
  216. data/maps/un-hin-Deva-Latn-2016.yaml +222 -0
  217. data/maps/un-mar-Deva-Latn-2016.yaml +91 -0
  218. data/maps/un-mon-Mong-Latn-general-2013.yaml +264 -0
  219. data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +264 -0
  220. data/maps/un-nep-Deva-Latn-1972.yaml +204 -17
  221. data/maps/un-nep-Deva-Latn-2013.yaml +74 -0
  222. data/maps/un-rus-Cyrl-Latn-1987.yaml +1 -1
  223. data/maps/un-ukr-Cyrl-Latn-1998.yaml +35 -12
  224. data/maps/un-ukr-Cyrl-Latn-2012.yaml +162 -0
  225. data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +221 -0
  226. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +1 -1
  227. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +1 -1
  228. data/maps/{nil-kor-Hang-Hang-jamo.yaml → var-kor-Hang-Hang-jamo.yaml} +1 -1
  229. data/maps/var-kor-Hang-Latn-mr-1939.yaml +2 -2
  230. data/maps/var-kor-Kore-Hang-2013.yaml +1 -1
  231. data/maps/var-kor-Kore-Latn-mr-1939.yaml +1 -1
  232. data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +43 -0
  233. data/maps/var-mon-Mong-Latn-1930.yaml +102 -0
  234. data/maps/var-mon-Mong-Latn-lessing.yaml +272 -0
  235. data/maps/var-mon-Mong-Latn-vpmc.yaml +274 -0
  236. data/maps/var-pra-Deva-Latn-iast-1912.yaml +30 -0
  237. data/maps/var-san-Deva-Latn-iast-1912.yaml +149 -0
  238. data/maps/var-tha-Thai-Thai-phonemic.yaml +1 -1
  239. data/maps/var-tha-Thai-Zsym-ipa.yaml +1 -1
  240. data/maps/{var-zho-Hani-Latn-1979.yaml → var-zho-Hani-Latn-wd-1979.yaml} +6 -2
  241. data/spec/interscript/filenames_spec.rb +384 -0
  242. data/spec/interscript_spec.rb +7 -4
  243. metadata +105 -26
  244. data/bin/interscript +0 -41
  245. data/bin/rspec +0 -29
  246. data/bin/setup +0 -8
  247. data/lib/__pycache__/g2pwrapper.cpython-38.pyc +0 -0
  248. data/lib/interscript-opal.rb +0 -2
  249. data/lib/interscript/opal_map_translate.rb +0 -12
  250. data/maps/alalc-hin-Deva-Latn-2020.yaml +0 -159
  251. data/maps/un-mon-Mong-Latn-2013.yaml +0 -99
@@ -0,0 +1,213 @@
1
+ ---
2
+ authority_id: din
3
+ id: 33903-2016
4
+ language: iso-639-2:tam
5
+ source_script: Taml
6
+ destination_script: Latn
7
+ name: "DIN 33903:2016-02: Information und Dokumentation - Umschrift Tamil"
8
+ url: https://www.beuth.de/de/norm/din-33903/247150527
9
+ creation_date: 2018
10
+ description: |
11
+ This standard specifies the transcription of the letters of the
12
+ Tamil alphabet in Latin letters. It is based on international
13
+ standards as well as on the preprint of the alphabetical tables,
14
+ which were published in 1976 with the introduction of the rules for
15
+ alphabetical cataloging. It can be used in all areas, but in
16
+ particular the aim is to standardize the library and publication
17
+ area.
18
+
19
+ notes:
20
+ - |
21
+ Since the Tamil script is a syllabic script, the vowel -a inherent in each consonant is always written in the transliteration, even in final position.
22
+
23
+ - |
24
+ A point above the consonant, the so-called "pulli", means in Tamil that the inherent -a is omitted:
25
+ கார்த்திகேயன் kārttikēyaṉ
26
+ - |
27
+ Tamil has no anusvara; in contrast to other South Asian scripts, the class nasal is always written.
28
+ - |
29
+ Tamil also has no ligatures.
30
+
31
+ tests:
32
+ - source: "கார்த்திகேயன்"
33
+ expected: "kārttikēyaṉ"
34
+ - source: "௲"
35
+ expected: "1000"
36
+ - source: "இளைஞர்களின் உறுதியான மனநிலையை பிரதிபலிக்கிறது: நீட் தேர்வில் ௮௫-௯௦ சதவீத மாணவர்கள் பங்கேற்பு - ரமேஷ் பொக்ரியால்"
37
+ expected: "iḷaiñarkaḷiṉ uṟutiyāṉa maṉanilaiyai piratipalikkiṟatu: nīṭ tērvil 85-90 catavīta māṇavarkaḷ paṅkēṟpu - ramēṣ pokriyāl"
38
+ - source: "நாடாளுமன்றத்தில் 4 மசோதாக்களை எதிர்க்க காங்கிரஸ் முடிவு - ஜெயராம் ரமேஷ்"
39
+ expected: "nāṭāḷumaṉṟattil 4 macōtākkaḷai etirkka kāṅkiras muṭivu - jeyarām ramēṣ"
40
+ - source: "கர்நாடகாவில் மேலும் 9,894 பேருக்கு கொரோனா தொற்று உறுதி"
41
+ expected: "karnāṭakāvil mēlum 9,894 pērukku korōṉā toṟṟu uṟuti"
42
+ - source: "ஐதராபாத்துக்கு கைகொடுக்குமா அதிரடி?"
43
+ expected: "aitarāpāttukku kaikoṭukkumā atiraṭi?"
44
+ - source: "அமெரிக்க ஓபன் டென்னிஸ்: இறுதிப்போட்டியில் டொமினிக்-ஸ்வெரேவ்"
45
+ expected: "amerikka ōpaṉ ṭeṉṉis: iṟutippōṭṭiyil ṭomiṉik-sverēv"
46
+ - source: "ஐ.பி.எல். கிரிக்கெட்டில் களம் இறங்கும் அமெரிக்க வீரர்"
47
+ expected: "ai.pi.el. kirikkeṭṭil kaḷam iṟaṅkum amerikka vīrar"
48
+ - source: "அமெரிக்க ஓபன் டென்னிஸ்; நவோமி ஒசாகா சாம்பியன் பட்டம் வென்றார்"
49
+ expected: "amerikka ōpaṉ ṭeṉṉis; navōmi ocākā cāmpiyaṉ paṭṭam veṉṟār"
50
+ - source: "புதிய கல்விக்கொள்கைக்கு எதிர்ப்பு: முன்னாள் துணைவேந்தர்கள் 20 பேர் பிரதமருக்கு கடிதம்"
51
+ expected: "putiya kalvikkoḷkaikku etirppu: muṉṉāḷ tuṇaivēntarkaḷ 20 pēr piratamarukku kaṭitam"
52
+ - source: "இந்த ஆண்டு ஐ.பி.எல். கோப்பையை எந்த அணி வெல்லும்? - கெவின் பீட்டர்சன் கணிப்பு"
53
+ expected: "inta āṇṭu ai.pi.el. kōppaiyai enta aṇi vellum? - keviṉ pīṭṭarcaṉ kaṇippu"
54
+ - source: "இந்திய எண்ணெய் கப்பலில் தீ: விபத்து குறித்த எச்சரிக்கையை கப்பல் அதிகாரிகள் புறக்கணித்தனர் - இலங்கை கோர்ட்டு தகவல்"
55
+ expected: "intiya eṇṇey kappalil tī: vipattu kuṟitta eccarikkaiyai kappal atikārikaḷ puṟakkaṇittaṉar - ilaṅkai kōrṭṭu takaval"
56
+
57
+ map:
58
+
59
+ rules:
60
+ - pattern: ([க]=?)(?=[\u0BBE\u0BBF\u0BC0\u0BC1\u0BC2\u0BC6\u0BC7\u0BC8\u0BCA\u0BCB\u0BCC\u094B\u094C])
61
+ result: 'k'
62
+ - pattern: ([ங]=?)(?=[\u0BBE\u0BBF\u0BC0\u0BC1\u0BC2\u0BC6\u0BC7\u0BC8\u0BCA\u0BCB\u0BCC\u094B\u094C])
63
+ result: 'ṅ'
64
+ - pattern: ([ச]=?)(?=[\u0BBE\u0BBF\u0BC0\u0BC1\u0BC2\u0BC6\u0BC7\u0BC8\u0BCA\u0BCB\u0BCC\u094B\u094C])
65
+ result: 'c'
66
+ - pattern: ([ஞ]=?)(?=[\u0BBE\u0BBF\u0BC0\u0BC1\u0BC2\u0BC6\u0BC7\u0BC8\u0BCA\u0BCB\u0BCC\u094B\u094C])
67
+ result: 'ñ'
68
+ - pattern: ([ட]=?)(?=[\u0BBE\u0BBF\u0BC0\u0BC1\u0BC2\u0BC6\u0BC7\u0BC8\u0BCA\u0BCB\u0BCC\u094B\u094C])
69
+ result: 'ṭ'
70
+ - pattern: ([ண]=?)(?=[\u0BBE\u0BBF\u0BC0\u0BC1\u0BC2\u0BC6\u0BC7\u0BC8\u0BCA\u0BCB\u0BCC\u094B\u094C])
71
+ result: 'ṇ'
72
+ - pattern: ([த]=?)(?=[\u0BBE\u0BBF\u0BC0\u0BC1\u0BC2\u0BC6\u0BC7\u0BC8\u0BCA\u0BCB\u0BCC\u094B\u094C])
73
+ result: 't'
74
+ - pattern: ([ந]=?)(?=[\u0BBE\u0BBF\u0BC0\u0BC1\u0BC2\u0BC6\u0BC7\u0BC8\u0BCA\u0BCB\u0BCC\u094B\u094C])
75
+ result: 'n'
76
+ - pattern: ([ப]=?)(?=[\u0BBE\u0BBF\u0BC0\u0BC1\u0BC2\u0BC6\u0BC7\u0BC8\u0BCA\u0BCB\u0BCC\u094B\u094C])
77
+ result: 'p'
78
+ - pattern: ([ம]=?)(?=[\u0BBE\u0BBF\u0BC0\u0BC1\u0BC2\u0BC6\u0BC7\u0BC8\u0BCA\u0BCB\u0BCC\u094B\u094C])
79
+ result: 'm'
80
+ - pattern: ([ய]=?)(?=[\u0BBE\u0BBF\u0BC0\u0BC1\u0BC2\u0BC6\u0BC7\u0BC8\u0BCA\u0BCB\u0BCC\u094B\u094C])
81
+ result: 'y'
82
+ - pattern: ([ர]=?)(?=[\u0BBE\u0BBF\u0BC0\u0BC1\u0BC2\u0BC6\u0BC7\u0BC8\u0BCA\u0BCB\u0BCC\u094B\u094C])
83
+ result: 'r'
84
+ - pattern: ([ல]=?)(?=[\u0BBE\u0BBF\u0BC0\u0BC1\u0BC2\u0BC6\u0BC7\u0BC8\u0BCA\u0BCB\u0BCC\u094B\u094C])
85
+ result: 'l'
86
+ - pattern: ([ள]=?)(?=[\u0BBE\u0BBF\u0BC0\u0BC1\u0BC2\u0BC6\u0BC7\u0BC8\u0BCA\u0BCB\u0BCC\u094B\u094C])
87
+ result: 'ḷ'
88
+ - pattern: ([ழ]=?)(?=[\u0BBE\u0BBF\u0BC0\u0BC1\u0BC2\u0BC6\u0BC7\u0BC8\u0BCA\u0BCB\u0BCC\u094B\u094C])
89
+ result: 'ḻ'
90
+ - pattern: ([வ]=?)(?=[\u0BBE\u0BBF\u0BC0\u0BC1\u0BC2\u0BC6\u0BC7\u0BC8\u0BCA\u0BCB\u0BCC\u094B\u094C])
91
+ result: 'v'
92
+ - pattern: ([ற]=?)(?=[\u0BBE\u0BBF\u0BC0\u0BC1\u0BC2\u0BC6\u0BC7\u0BC8\u0BCA\u0BCB\u0BCC\u094B\u094C])
93
+ result: 'ṟ'
94
+ - pattern: ([ன]=?)(?=[\u0BBE\u0BBF\u0BC0\u0BC1\u0BC2\u0BC6\u0BC7\u0BC8\u0BCA\u0BCB\u0BCC\u094B\u094C])
95
+ result: 'ṉ'
96
+ - pattern: ([ஜ]=?)(?=[\u0BBE\u0BBF\u0BC0\u0BC1\u0BC2\u0BC6\u0BC7\u0BC8\u0BCA\u0BCB\u0BCC\u094B\u094C])
97
+ result: 'j'
98
+ - pattern: ([ஶ]=?)(?=[\u0BBE\u0BBF\u0BC0\u0BC1\u0BC2\u0BC6\u0BC7\u0BC8\u0BCA\u0BCB\u0BCC\u094B\u094C])
99
+ result: 'ś'
100
+ - pattern: ([ஷ]=?)(?=[\u0BBE\u0BBF\u0BC0\u0BC1\u0BC2\u0BC6\u0BC7\u0BC8\u0BCA\u0BCB\u0BCC\u094B\u094C])
101
+ result: 'ṣ'
102
+ - pattern: ([ஸ]=?)(?=[\u0BBE\u0BBF\u0BC0\u0BC1\u0BC2\u0BC6\u0BC7\u0BC8\u0BCA\u0BCB\u0BCC\u094B\u094C])
103
+ result: 's'
104
+ - pattern: ([ஹ]=?)(?=[\u0BBE\u0BBF\u0BC0\u0BC1\u0BC2\u0BC6\u0BC7\u0BC8\u0BCA\u0BCB\u0BCC\u094B\u094C])
105
+ result: 'h'
106
+
107
+ characters:
108
+ 'அ': 'a'
109
+ 'ஆ': 'ā'
110
+ 'ா': 'ā'
111
+
112
+ 'இ': 'i'
113
+ 'ி': 'i'
114
+
115
+ 'ஈ': 'ī'
116
+ 'ீ': 'ī'
117
+
118
+ 'உ': 'u'
119
+ 'ு': 'u'
120
+
121
+ 'ஊ': 'ū'
122
+ 'ூ': 'ū'
123
+
124
+ 'ெ': "e"
125
+ 'எ': 'e'
126
+
127
+ 'ே': "ē"
128
+ 'ஏ': 'ē'
129
+
130
+ 'ஐ': 'ai'
131
+ 'ை': "ai"
132
+
133
+ 'ஒ': 'o'
134
+ 'ொ': 'o'
135
+
136
+ 'ோ': 'ō'
137
+ 'ஓ': 'ō'
138
+
139
+ 'ஔ': 'au'
140
+ 'ௌ': 'au'
141
+
142
+ 'க்': 'k'
143
+ 'ங்': 'ṅ'
144
+ 'ச்': 'c'
145
+ 'ஞ்': 'ñ'
146
+ 'ட்': 'ṭ'
147
+ 'ண்': 'ṇ'
148
+ 'த்': 't'
149
+ 'ந்': 'n'
150
+ 'ப்': 'p'
151
+ 'ம்': 'm'
152
+ 'ய்': 'y'
153
+ 'ர்': 'r'
154
+ 'ல்': 'l'
155
+ 'ள்': 'ḷ'
156
+ 'ழ்': 'ḻ'
157
+ 'வ்': 'v'
158
+ 'ற்': 'ṟ'
159
+ 'ன்': 'ṉ'
160
+ 'ஜ்': 'j'
161
+
162
+ 'ஶ்': 'ś'
163
+ 'ஷ்': 'ṣ'
164
+ 'ஸ்': 's'
165
+ 'ஹ்': 'h'
166
+
167
+
168
+ 'க': 'ka'
169
+ 'ங': 'ṅa'
170
+ 'ஃ': 'ḵ'
171
+ 'ச': 'ca'
172
+ 'ஞ': 'ña'
173
+ 'ட': 'ṭa'
174
+ 'ண': 'ṇa'
175
+ 'த': 'ta'
176
+ 'ந': 'na'
177
+ 'ப': 'pa'
178
+ 'ம': 'ma'
179
+ 'ய': 'ya'
180
+ 'ர': 'ra'
181
+ 'ல': 'la'
182
+ 'ள': 'ḷa'
183
+ 'ழ': 'ḻa'
184
+ 'வ': 'va'
185
+ 'ற': 'ṟa'
186
+ 'ன': 'ṉa'
187
+ 'ஜ': 'ja'
188
+ 'ஶ': 'śa'
189
+ 'ஷ': 'ṣa'
190
+ 'ஸ': 'sa'
191
+ 'ஹ': 'ha'
192
+
193
+ # Digits
194
+ '௧': '1'
195
+ '௨': '2'
196
+ '௩': '3'
197
+ '௪': '4'
198
+ '௫': '5'
199
+ '௬': '6'
200
+ '௭': '7'
201
+ '௮': '8'
202
+ '௯': '9'
203
+ '௦': '0'
204
+ '௰': '10'
205
+ '௱': '100'
206
+ '௲': '1000'
207
+
208
+
209
+
210
+
211
+ "‍": '' # no need for zero width joiner
212
+ "‌": '' # no need for zero width non-joiner
213
+
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  authority_id: bgnpcgn
3
3
  id: 1997
4
- language: nep
4
+ language: iso-639-2:nep
5
5
  source_script: Deva
6
6
  destination_script: Latn
7
7
  name: Nepali Romanization, 1997
@@ -22,6 +22,20 @@ notes:
22
22
  tests:
23
23
  - source: "दुःख"
24
24
  expected: "duhkh"
25
+ - source: "पूरा भइसकेका विषयलाई माग बनाएर दबाब नदिनुस्"
26
+ expected: "pūrā bhiskekā viṣylāī māg bnāer dbāb ndinusa"
27
+ - source: "जाँदै छ कता नेपाली संगीत"
28
+ expected: "jā~dai chh ktā nepālī sṅgīt"
29
+ - source: "३५ मिनेटको यो डकुमेन्ट्री फिल्मले प्रथम पुरस्कारस्वरूप ग्रान्ड पिक्स अवार्ड पाएको हो"
30
+ expected: "35 mineṭko yo ḍkumenaṭarī philamle parthm pursakārsavrūp garānaḍ pikas avāraḍ pāeko ho"
31
+ - source: "विक्षनरी"
32
+ expected: "vikṣnrī"
33
+ - source: "रुसमा उत्कृष्ट"
34
+ expected: "rusmā utakṛiṣaṭ"
35
+ - source: "वाणिज्य"
36
+ expected: "vāṇijay"
37
+ - source: "अंक विद्या"
38
+ expected: "aṅk vidayā"
25
39
 
26
40
  map:
27
41
 
@@ -1,7 +1,7 @@
1
1
  ---
2
- authority_id: un
3
- id: 1982
4
- language: ell
2
+ authority_id: elot
3
+ id: 1982-tl
4
+ language: iso-639-2:ell
5
5
  source_script: Grek
6
6
  destination_script: Latn
7
7
  name: ELOT 743:1982 (transliteration)
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  authority_id: elot
3
- id: 1982
4
- language: ell
3
+ id: 1982-ts
4
+ language: iso-639-2:ell
5
5
  source_script: Grek
6
6
  destination_script: Latn
7
7
  name: ELOT 743:1982
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  authority_id: elot
3
- id: 2001
4
- language: ell
3
+ id: 2001-tl
4
+ language: iso-639-2:ell
5
5
  source_script: Grek
6
6
  destination_script: Latn
7
7
  name: ELOT 743:2001
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  authority_id: elot
3
- id: 2001
4
- language: ell
3
+ id: 2001-ts
4
+ language: iso-639-2:ell
5
5
  source_script: Grek
6
6
  destination_script: Latn
7
7
  name: ELOT 743:2001
@@ -1,10 +1,14 @@
1
1
  ---
2
2
  authority_id: ggg
3
3
  id: 2002
4
- language: kat
4
+ language: iso-639-2:kat
5
5
  source_script: Geor
6
6
  destination_script: Latn
7
7
  name: Georgian State Department of Geodesy and Cartography 2002 System
8
+ alias:
9
+ ogc11122:
10
+ code: kat_Geor2Latn_GGG_2002
11
+ description: Georgian State Department of Geodesy and Cartography 2002 System
8
12
  url: https://transliteration.eki.ee/pdf/Georgian.pdf
9
13
  creation_date: 1998
10
14
  confirmation_date: 2002
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  authority_id: gki
3
3
  id: 1992
4
- language: bel
4
+ language: iso-639-2:bel
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
7
  name: Byelorussian National Cartographic Authority 1992-3 System (based on GOST 1983)
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  authority_id: gki
3
3
  id: 2000
4
- language: bel
4
+ language: iso-639-2:bel
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
7
  name: On approval of the Instructions for the transliteration of geographical names of the Republic of Belarus with letters of the Latin alphabet
@@ -1,10 +1,14 @@
1
1
  ---
2
2
  authority_id: gost
3
3
  id: 1983
4
- language: rus
4
+ language: iso-639-2:rus
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
7
  name: LETTERS TRANSLATION RULES OF KIRILLOVSKY ALPHABET WITH LETTERS OF LATIN ALPHABET GOST 16876-71
8
+ alias:
9
+ ogc11122:
10
+ code: rus_Cyrl2Latn_GOST_1983
11
+ description: Russian GOST 1983 System, Main Administration of Geodesy and Cartography of the Former Soviet Union
8
12
  url: https://unstats.un.org/unsd/geoinfo/UNGEGN/docs/7th-uncsgn-docs/econf/7th_UNCSGN_econf.91_3_Add1.pdf
9
13
  creation_date: 1978
10
14
  confirmation_date: 1982-04-16
@@ -147,7 +151,7 @@ map:
147
151
  '\u042a' : '"' # Ъ
148
152
  '\u042B' : 'Y' # Ы
149
153
  '\u042C' : "\u00B4" # Ь => ’
150
- '\u042D' : "E\u0300" # È
154
+ '\u042D' : "E\u0300" # Э => È
151
155
  '\u042E' : 'Ju' # Ю
152
156
  '\u042F' : 'Ja' # Я
153
157
 
@@ -181,6 +185,6 @@ map:
181
185
  '\u044A' : '"' # ъ
182
186
  '\u044B' : 'y' # ы
183
187
  '\u044C' : "\u00B4" # ь => ’
184
- '\u044D' : "e\u0300" # è
188
+ '\u044D' : "e\u0300" # э => è
185
189
  '\u044E' : 'ju' # ю
186
190
  '\u044F' : 'ja' # я
@@ -0,0 +1,157 @@
1
+ ---
2
+ authority_id: gost
3
+ id: 2002
4
+ language: iso-639-2:rus
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: GOST 7.79-2000 System of standards for information, librarianship and publishing. Rules for transliteration of Cyrillic letters in the Latin alphabet
8
+ url: https://gostexpert.ru/gost/gost-7.79-2000
9
+ creation_date: 2002
10
+ confirmation_date: 2002-02-12
11
+ adoption_date: 2002-02-12
12
+ description: |
13
+ This standard applies to the rules of transliteration by means of the Latin alphabet of individual letters,
14
+ words, expressions, as well as related texts in languages whose writing is based on the Cyrillic alphabet.
15
+ The rules in accordance with this standard are applied wherever it is required to provide an unambiguous
16
+ representation of the Cyrillic text in Latin letters and the possibility of algorithmic recovery of the text
17
+ in the original Cyrillic notation, in particular when transferring documents over computer networks.
18
+ This standard does not apply to the rules for the transmission of the sound appearance of words written in
19
+ Cyrillic in Latin letters.
20
+
21
+ tests:
22
+ - source: адрес
23
+ expected: adres
24
+ - source: баба
25
+ expected: baba
26
+ - source: вы
27
+ expected: vy
28
+ - source: голова
29
+ expected: golova
30
+ - source: да
31
+ expected: da
32
+ - source: еда
33
+ expected: eda
34
+ - source: ёлка
35
+ expected: ëlka
36
+ - source: журнал
37
+ expected: žurnal
38
+ - source: звезда
39
+ expected: zvezda
40
+ - source: книга
41
+ expected: kniga
42
+ - source: первый
43
+ expected: pervyj
44
+ - source: как
45
+ expected: kak
46
+ - source: липа
47
+ expected: lipa
48
+ - source: муж
49
+ expected: muž
50
+ - source: нижний
51
+ expected: nižnij
52
+ - source: общество
53
+ expected: obŝestvo
54
+ - source: пара
55
+ expected: para
56
+ - source: рыба
57
+ expected: ryba
58
+ - source: сестра
59
+ expected: sestra
60
+ - source: товарищ
61
+ expected: tovariŝ
62
+ - source: утро
63
+ expected: utro
64
+ - source: физика
65
+ expected: fizika
66
+ - source: химический
67
+ expected: himičeskij
68
+ - source: центр
69
+ expected: centr
70
+ - source: часы
71
+ expected: časy
72
+ - source: школа
73
+ expected: škola
74
+ - source: щит
75
+ expected: ŝit
76
+ - source: съезд
77
+ expected: s"ezd
78
+ - source: был
79
+ expected: byl
80
+ - source: альбом
81
+ expected: al´bom
82
+ - source: это
83
+ expected: èto
84
+ - source: южный
85
+ expected: ûžnyj
86
+ - source: яма
87
+ expected: âma
88
+
89
+ map:
90
+ characters:
91
+ '\u0410' : 'A' # А
92
+ '\u0411' : 'B' # Б
93
+ '\u0412' : 'V' # В
94
+ '\u0413' : 'G' # Г
95
+ '\u0414' : 'D' # Д
96
+ '\u0415' : 'E' # Е
97
+ '\u0401' : "\u00CB" # Ё
98
+ '\u0416' : 'Ž' # Ж
99
+ '\u0417' : 'Z' # З
100
+ '\u0418' : "I" # И
101
+ '\u0419' : 'J' # Й
102
+ '\u041A' : 'K' # К
103
+ '\u041B' : 'L' # Л
104
+ '\u041C' : 'M' # М
105
+ '\u041D' : 'N' # Н
106
+ '\u041E' : 'O' # О
107
+ '\u041F' : 'P' # П
108
+ '\u0420' : 'R' # Р
109
+ '\u0421' : 'S' # С
110
+ '\u0422' : 'T' # Т
111
+ '\u0423' : 'U' # У
112
+ '\u0424' : 'F' # Ф
113
+ '\u0425' : 'H' # Х
114
+ '\u0426' : 'C' # Ц
115
+ '\u0427' : 'Č' # Ч
116
+ '\u0428' : 'Š' # Ш
117
+ '\u0429' : 'Ŝ' # Щ
118
+ '\u042a' : '"' # Ъ
119
+ '\u042B' : 'Y' # Ы
120
+ '\u042C' : "\u00B4" # Ь => ´
121
+ '\u042D' : "E\u0300" # Э => È
122
+ '\u042E' : 'Û' # Ю
123
+ '\u042F' : 'Â' # Я
124
+
125
+ '\u0430' : 'a' # а
126
+ '\u0431' : 'b' # б
127
+ '\u0432' : 'v' # в
128
+ '\u0433' : 'g' # г
129
+ '\u0434' : 'd' # д
130
+ '\u0435' : 'e' # е
131
+ '\u0451' : "\u00EB" # ё
132
+ '\u0436' : 'ž' # ж
133
+ '\u0437' : 'z' # з
134
+ '\u0438' : 'i' # и
135
+ '\u0439' : 'j' # й
136
+ '\u043A' : 'k' # к
137
+ '\u043B' : 'l' # л
138
+ '\u043C' : 'm' # м
139
+ '\u043D' : 'n' # н
140
+ '\u043E' : 'o' # о
141
+ '\u043F' : 'p' # п
142
+ '\u0440' : 'r' # р
143
+ '\u0441' : 's' # с
144
+ '\u0442' : 't' # т
145
+ '\u0443' : 'u' # у
146
+ '\u0444' : 'f' # ф
147
+ '\u0445' : 'h' # х
148
+ '\u0446' : 'c' # ц
149
+ '\u0447' : 'č' # ч
150
+ '\u0448' : 'š' # ш
151
+ '\u0449' : 'ŝ' # щ
152
+ '\u044A' : '"' # ъ
153
+ '\u044B' : 'y' # ы
154
+ '\u044C' : "\u00B4" # ь => ´
155
+ '\u044D' : "e\u0300" # э => è
156
+ '\u044E' : 'û' # ю
157
+ '\u044F' : 'â' # я