interscript 0.1.2 → 0.1.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (261) hide show
  1. checksums.yaml +4 -4
  2. data/README.adoc +250 -17
  3. data/lib/g2pwrapper.py +34 -0
  4. data/lib/interscript.rb +142 -20
  5. data/lib/interscript/command.rb +28 -0
  6. data/lib/interscript/fs.rb +69 -0
  7. data/lib/interscript/mapping.rb +142 -0
  8. data/lib/interscript/opal.rb +57 -0
  9. data/lib/interscript/opal/entrypoint.rb +12 -0
  10. data/lib/interscript/opal/map_translate.rb +7 -0
  11. data/lib/interscript/opal/maps.js.erb +10 -0
  12. data/lib/interscript/version.rb +1 -1
  13. data/lib/model-7 +0 -0
  14. data/lib/tha-pt-b-7 +0 -0
  15. data/maps/acadsin-zho-Hani-Latn-2002.yaml +38916 -0
  16. data/maps/alalc-amh-Ethi-Latn-1997.yaml +513 -0
  17. data/maps/alalc-amh-Ethi-Latn-2011.yaml +138 -0
  18. data/maps/alalc-ara-Arab-Latn-1997.yaml +1287 -0
  19. data/maps/alalc-asm-Deva-Latn-1997.yaml +165 -0
  20. data/maps/alalc-asm-Deva-Latn-2012.yaml +40 -0
  21. data/maps/alalc-aze-Cyrl-Latn-1997.yaml +145 -0
  22. data/maps/alalc-bel-Cyrl-Latn-1997.yaml +129 -0
  23. data/maps/alalc-ben-Beng-Latn-2017.yaml +130 -0
  24. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +98 -0
  25. data/maps/alalc-ell-Grek-Latn-1997.yaml +628 -0
  26. data/maps/alalc-ell-Grek-Latn-2010.yaml +626 -0
  27. data/maps/alalc-guj-Gujr-Latn-1997.yaml +266 -0
  28. data/maps/alalc-guj-Gujr-Latn-2011.yaml +64 -0
  29. data/maps/alalc-hin-Deva-Latn-1997.yaml +211 -0
  30. data/maps/alalc-hin-Deva-Latn-2011.yaml +47 -0
  31. data/maps/alalc-kat-Geok-Latn-1997.yaml +111 -0
  32. data/maps/alalc-kat-Geor-Latn-1997.yaml +150 -0
  33. data/maps/alalc-kor-Hang-Latn-1997.yaml +98 -0
  34. data/maps/alalc-mal-Mlym-Latn-1997.yaml +303 -0
  35. data/maps/alalc-mal-Mlym-Latn-2012.yaml +73 -0
  36. data/maps/alalc-mar-Deva-Latn-1997.yaml +189 -0
  37. data/maps/alalc-mar-Deva-Latn-2011.yaml +45 -0
  38. data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +114 -0
  39. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +103 -0
  40. data/maps/alalc-mon-Cyrl-Latn-1997.yaml +220 -0
  41. data/maps/alalc-pan-Guru-Latn-1997.yaml +256 -0
  42. data/maps/alalc-pan-Guru-Latn-2011.yaml +78 -0
  43. data/maps/alalc-per-Arab-Latn-1997.yaml +375 -0
  44. data/maps/alalc-pli-Deva-Latn-2012.yaml +144 -0
  45. data/maps/alalc-pra-Deva-Latn-2012.yaml +47 -0
  46. data/maps/alalc-rus-Cyrl-Latn-1997.yaml +225 -0
  47. data/maps/alalc-rus-Cyrl-Latn-2012.yaml +162 -0
  48. data/maps/alalc-san-Deva-Latn-2012.yaml +172 -0
  49. data/maps/alalc-sin-Sinh-Latn-1997.yaml +292 -0
  50. data/maps/alalc-sin-Sinh-Latn-2011.yaml +71 -0
  51. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +118 -0
  52. data/maps/alalc-srp-Cyrl-Latn-2013.yaml +135 -0
  53. data/maps/alalc-tam-Taml-Latn-1997.yaml +62 -0
  54. data/maps/alalc-tam-Taml-Latn-2011.yaml +58 -0
  55. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +145 -0
  56. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +16 -0
  57. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +283 -0
  58. data/maps/{bas-rus-Cyrl-Latn-bss.yaml → bas-rus-Cyrl-Latn-2017-bss.yaml} +58 -33
  59. data/maps/{bas-rus-Cyrl-Latn-oss.yaml → bas-rus-Cyrl-Latn-2017-oss.yaml} +55 -35
  60. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +292 -0
  61. data/maps/bgn-kor-Hang-Latn-1943.yaml +35 -0
  62. data/maps/bgn-kor-Kore-Latn-1943.yaml +31 -0
  63. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +208 -0
  64. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +208 -0
  65. data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +532 -0
  66. data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +596 -0
  67. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +2 -3
  68. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +104 -0
  69. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +188 -0
  70. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +289 -0
  71. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +119 -0
  72. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +15 -65
  73. data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +184 -0
  74. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +705 -0
  75. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +23 -0
  76. data/maps/{bgnpcgn-per-Arab-Latn-1956.yaml → bgnpcgn-fas-Arab-Latn-1956.yaml} +5 -2
  77. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +257 -0
  78. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +131 -0
  79. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +42 -0
  80. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +253 -0
  81. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +48 -0
  82. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +48 -0
  83. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +163 -0
  84. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +190 -0
  85. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +223 -0
  86. data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +230 -0
  87. data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +336 -0
  88. data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +639 -0
  89. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +459 -0
  90. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +168 -0
  91. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +150 -65
  92. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +170 -0
  93. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +220 -0
  94. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +240 -0
  95. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +80 -4
  96. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +119 -0
  97. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +127 -0
  98. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +82 -0
  99. data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +7456 -0
  100. data/maps/bis-asm-Beng-Latn-13194-1991.yaml +159 -0
  101. data/maps/bis-ben-Beng-Latn-13194-1991.yaml +156 -0
  102. data/maps/bis-dev-Deva-Latn-13194-1991.yaml +184 -0
  103. data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +181 -0
  104. data/maps/bis-knd-Knda-Latn-13194-1991.yaml +173 -0
  105. data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +176 -0
  106. data/maps/bis-ori-Orya-Latn-13194-1991.yaml +160 -0
  107. data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +175 -0
  108. data/maps/bis-tel-Telu-Latn-13194-1991.yaml +170 -0
  109. data/maps/bis-tml-Taml-Latn-13194-1991.yaml +155 -0
  110. data/maps/by-bel-Cyrl-Latn-1998.yaml +172 -0
  111. data/maps/by-bel-Cyrl-Latn-2007.yaml +115 -0
  112. data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +899 -0
  113. data/maps/din-hin-Deva-Latn-33904-2018.yaml +100 -0
  114. data/maps/din-kat-Geor-Latn-32707-2010.yaml +145 -0
  115. data/maps/din-mar-Deva-Latn-33904-2018.yaml +84 -0
  116. data/maps/din-nep-Deva-Latn-33904-2018.yaml +119 -0
  117. data/maps/din-pli-Deva-Latn-33904-2018.yaml +75 -0
  118. data/maps/din-pra-Deva-Latn-33904-2018.yaml +63 -0
  119. data/maps/din-san-Deva-Latn-33904-2018.yaml +338 -0
  120. data/maps/din-tam-Taml-Latn-33903-2016.yaml +213 -0
  121. data/maps/dos-nep-Deva-Latn-1997.yaml +47 -0
  122. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +684 -0
  123. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +680 -0
  124. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +19 -0
  125. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +31 -0
  126. data/maps/ggg-kat-Geor-Latn-2002.yaml +92 -0
  127. data/maps/gki-bel-Cyrl-Latn-1992.yaml +33 -0
  128. data/maps/gki-bel-Cyrl-Latn-2000.yaml +201 -0
  129. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +190 -0
  130. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +157 -0
  131. data/maps/hk-yue-Hani-Latn-1888.yaml +38497 -0
  132. data/maps/icao-bel-Cyrl-Latn-9303.yaml +109 -98
  133. data/maps/icao-bul-Cyrl-Latn-9303.yaml +2 -7
  134. data/maps/{icao-per-Arab-Latn-9303.yaml → icao-fas-Arab-Latn-9303.yaml} +6 -8
  135. data/maps/icao-heb-Hebr-Latn-9303.yaml +119 -125
  136. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +2 -3
  137. data/maps/icao-rus-Cyrl-Latn-9303.yaml +2 -4
  138. data/maps/icao-srp-Cyrl-Latn-9303.yaml +2 -3
  139. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +2 -4
  140. data/maps/iso-ara-Arab-Latn-233-1984.yaml +323 -0
  141. data/maps/iso-asm-Beng-Latn-15919-2001.yaml +75 -0
  142. data/maps/iso-ben-Beng-Latn-15919-2001.yaml +175 -0
  143. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +613 -0
  144. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +44 -0
  145. data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +220 -0
  146. data/maps/iso-hin-Deva-Latn-15919-2001.yaml +87 -0
  147. data/maps/iso-inc-Deva-Latn-15919-2001.yaml +61 -0
  148. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +66 -0
  149. data/maps/iso-kan-Knda-Latn-15919-2001.yaml +220 -0
  150. data/maps/iso-kat-Geor-Latn-9984-1996.yaml +145 -0
  151. data/maps/iso-kor-Hang-Latn-1996-method1.yaml +240 -0
  152. data/maps/iso-kor-Hang-Latn-1996-method2.yaml +226 -0
  153. data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +281 -0
  154. data/maps/iso-mar-Deva-Latn-15919-2001.yaml +75 -0
  155. data/maps/iso-nep-Deva-Latn-15919-2001.yaml +87 -0
  156. data/maps/iso-ori-Orya-Latn-15919-2001.yaml +193 -0
  157. data/maps/iso-pan-Guru-Latn-15919-2001.yaml +222 -0
  158. data/maps/iso-pli-Beng-Latn-15919-2001.yaml +73 -0
  159. data/maps/iso-pli-Deva-Latn-15919-2001.yaml +74 -0
  160. data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +219 -0
  161. data/maps/iso-pli-Thai-Latn-15919-2001.yaml +55 -0
  162. data/maps/iso-pra-Deva-Latn-15919-2001.yaml +59 -0
  163. data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +366 -0
  164. data/maps/{iso-rus-Cyrl-Latn-iso9.yaml → iso-rus-Cyrl-Latn-9-1995.yaml} +4 -6
  165. data/maps/iso-san-Deva-Latn-15919-2001.yaml +220 -0
  166. data/maps/iso-tam-Taml-Latn-15919-2001.yaml +159 -0
  167. data/maps/iso-tel-Telu-Latn-15919-2001.yaml +220 -0
  168. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +109 -0
  169. data/maps/kp-kor-Hang-Latn-2002.yaml +909 -0
  170. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +44820 -0
  171. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +411 -0
  172. data/maps/mns-mon-Cyrl-Latn-5217-2012.yaml +163 -0
  173. data/maps/mns-mon-Latn-Cyrl-5217-2012.yaml +200 -0
  174. data/maps/moct-kor-Hang-Latn-2000.yaml +807 -0
  175. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +541 -0
  176. data/maps/mvd-bel-Cyrl-Latn-2008.yaml +225 -0
  177. data/maps/mvd-bel-Cyrl-Latn-2010.yaml +63 -0
  178. data/maps/mvd-rus-Cyrl-Latn-2008.yaml +109 -0
  179. data/maps/mvd-rus-Cyrl-Latn-2010.yaml +37 -0
  180. data/maps/odni-ara-Arab-Latn-2015.yaml +425 -0
  181. data/maps/odni-aze-Cyrl-Latn-2015.yaml +144 -0
  182. data/maps/odni-bel-Cyrl-Latn-2015.yaml +148 -0
  183. data/maps/odni-bul-Cyrl-Latn-2015.yaml +96 -0
  184. data/maps/odni-che-Cyrl-Latn-2015.yaml +169 -0
  185. data/maps/odni-fas-Arab-Latn-2015.yaml +406 -0
  186. data/maps/odni-hin-Deva-Latn-2015.yaml +258 -0
  187. data/maps/odni-kat-Geor-Latn-2015.yaml +87 -0
  188. data/maps/odni-kaz-Cyrl-Latn-2015.yaml +148 -0
  189. data/maps/odni-kir-Cyrl-Latn-2015.yaml +136 -0
  190. data/maps/odni-kor-Hang-Latn-2015.yaml +375 -0
  191. data/maps/odni-mkd-Cyrl-Latn-2015.yaml +122 -0
  192. data/maps/odni-per-Arab-Latn-2015.yaml +228 -0
  193. data/maps/odni-rus-Cyrl-Latn-2015.yaml +77 -0
  194. data/maps/odni-srp-Cyrl-Latn-2015.yaml +129 -0
  195. data/maps/odni-tat-Cyrl-Latn-2015.yaml +142 -0
  196. data/maps/odni-tgk-Cyrl-Latn-2015.yaml +148 -0
  197. data/maps/odni-uig-Cyrl-Latn-2015.yaml +138 -0
  198. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +157 -0
  199. data/maps/odni-urd-Arab-Latn-2015.yaml +221 -0
  200. data/maps/odni-uzb-Cyrl-Latn-2015.yaml +166 -0
  201. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +90 -0
  202. data/maps/royin-tha-Thai-Latn-1968.yaml +183 -0
  203. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +180 -0
  204. data/maps/royin-tha-Thai-Latn-1999.yaml +80 -0
  205. data/maps/{cn-chn-Hans-Latn-pinyin.yaml → sac-zho-Hans-Latn-1979.yaml} +11 -8
  206. data/maps/sasm-mon-Mong-Latn-general-1978.yaml +389 -0
  207. data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +354 -0
  208. data/maps/ses-ara-Arab-Latn-1930.yaml +283 -0
  209. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +222 -0
  210. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +197 -0
  211. data/maps/ua-ukr-Cyrl-Latn-2007.yaml +75 -0
  212. data/maps/ua-ukr-Cyrl-Latn-2010.yaml +192 -0
  213. data/maps/un-amh-Ethi-Latn-2016.yaml +602 -0
  214. data/maps/un-ara-Arab-Latn-1971.yaml +139 -0
  215. data/maps/un-ara-Arab-Latn-1972.yaml +159 -0
  216. data/maps/un-ara-Arab-Latn-2017.yaml +420 -0
  217. data/maps/un-bel-Cyrl-Latn-2007.yaml +114 -0
  218. data/maps/un-ben-Beng-Latn-2016.yaml +534 -0
  219. data/maps/un-ell-Grek-Latn-1987-phonetic.yaml +780 -0
  220. data/maps/un-ell-Grek-Latn-1987-tl.yaml +31 -0
  221. data/maps/un-ell-Grek-Latn-1987-ts.yaml +19 -0
  222. data/maps/un-hin-Deva-Latn-2016.yaml +222 -0
  223. data/maps/un-mar-Deva-Latn-2016.yaml +91 -0
  224. data/maps/un-mon-Mong-Latn-general-2013.yaml +264 -0
  225. data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +264 -0
  226. data/maps/un-nep-Deva-Latn-1972.yaml +350 -0
  227. data/maps/un-nep-Deva-Latn-2013.yaml +74 -0
  228. data/maps/un-rus-Cyrl-Latn-1987.yaml +166 -0
  229. data/maps/un-ukr-Cyrl-Latn-1998.yaml +53 -0
  230. data/maps/un-ukr-Cyrl-Latn-2012.yaml +162 -0
  231. data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +221 -0
  232. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +406 -0
  233. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +386 -0
  234. data/maps/var-kor-Hang-Hang-jamo.yaml +11193 -0
  235. data/maps/var-kor-Hang-Latn-mr-1939.yaml +1054 -0
  236. data/maps/var-kor-Kore-Hang-2013.yaml +59754 -0
  237. data/maps/var-kor-Kore-Latn-mr-1939.yaml +36 -0
  238. data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +43 -0
  239. data/maps/var-mon-Mong-Latn-1930.yaml +102 -0
  240. data/maps/var-mon-Mong-Latn-lessing.yaml +272 -0
  241. data/maps/var-mon-Mong-Latn-vpmc.yaml +274 -0
  242. data/maps/var-pra-Deva-Latn-iast-1912.yaml +30 -0
  243. data/maps/var-san-Deva-Latn-iast-1912.yaml +149 -0
  244. data/maps/var-tha-Thai-Thai-phonemic.yaml +59 -0
  245. data/maps/var-tha-Thai-Zsym-ipa.yaml +301 -0
  246. data/maps/var-zho-Hani-Latn-wd-1979.yaml +38912 -0
  247. data/spec/interscript/filenames_spec.rb +384 -0
  248. data/spec/interscript/mapping_spec.rb +42 -0
  249. data/spec/interscript_spec.rb +23 -5
  250. data/spec/spec_helper.rb +3 -1
  251. metadata +364 -34
  252. data/bin/interscript +0 -20
  253. data/bin/rspec +0 -29
  254. data/maps/bgnpcgn-chn-Hans-Latn-pinyin.yaml +0 -7503
  255. data/maps/historic-jpn-Hrkt-Latn-hepburn.yaml +0 -336
  256. data/maps/icao-gre-Grek-Latn-9303.yaml +0 -101
  257. data/maps/mext-jpn-Hrkt-Latn-hepburn.yaml +0 -330
  258. data/maps/mext-jpn-Hrkt-Latn-kunrei.yaml +0 -308
  259. data/maps/un-jpn-Hrkt-Latn-hepburn.yaml +0 -313
  260. data/maps/un-jpn-Hrkt-Latn-kunrei.yaml +0 -354
  261. data/maps/un-mon-Mong-Latn-2013.yaml +0 -80
@@ -0,0 +1,144 @@
1
+ ---
2
+ authority_id: alalc
3
+ id: 2012
4
+ language: iso-639-2:pli
5
+ source_script: Deva
6
+ destination_script: Latn
7
+ name: Pali Romanization, 2012
8
+ url: https://www.loc.gov/catdir/cpso/romanization/pali.pdf
9
+ creation_date: 2012
10
+ description: |
11
+ ALA-LC Romanization table for Pali
12
+
13
+ notes:
14
+
15
+ - Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
16
+ vowels following a consonant can be found in grammars; no distinction between the two is
17
+ made in transliteration.
18
+
19
+ - |
20
+ The vowel a is implicit after all consonants and consonant clusters and is supplied in
21
+ transliteration, with the following exceptions:
22
+
23
+ a) when another vowel is indicated by its appropriate sign; and
24
+ b) when the absence of any vowel is indicated by the subscript sign ( ् ) called halanta or
25
+ virāma.
26
+
27
+ - |
28
+ Exception: Niggahīta combinations representing nasals are romanized by ṅ
29
+ before gutturals, ñ before palatals, ṇ before cerebrals, n before dentals, and m before
30
+ labials.
31
+
32
+ tests:
33
+ - source: "तेन खो पन समयेन वेसालिया अविदूरे कलन्दगामो नाम अत्थि"
34
+ expected: "taena khao pana samayaena vaesaālaiyaā avaidaūrae kalanadagaāmao naāma atathai"
35
+ - source: "तत्थ सुदिन्‍नो नाम कलन्दपुत्तो सेट्ठिपुत्तो होति"
36
+ expected: "tatatha saudainanao naāma kalanadapautatao saeṭaṭhaipautatao haotai"
37
+ - source: "अथ खो सुदिन्‍नो कलन्दपुत्तो सम्बहुलेहि"
38
+ expected: "atha khao saudainanao kalanadapautatao samabahaulaehai"
39
+ - source: "तथा चतुर्भिः पुरुषः परीक्ष्यते त्यागेन शीलेन गुणेन कर्मणा"
40
+ expected: "tathaā cataurabhaiḥ paurauṣaḥ paraīkaṣayatae tayaāgaena śaīlaena gauṇaena karamaṇaā"
41
+ - source: "अथ खो सुदिन्‍नो कलन्दपुत्तो अचिरवुट्ठिताय परिसाय येन भगवा तेनुपसङ्कमि; उपसङ्कमित्वा भगवन्तं अभिवादेत्वा एकमन्तं निसीदि"
42
+ expected: "atha khao saudainanao kalanadapautatao acairavauṭaṭhaitaāya paraisaāya yaena bhagavaā taenaupasaṅakamai; upasaṅakamaitavaā bhagavanataṃ abhaivaādaetavaā ekamanataṃ naisaīdai"
43
+ - source: "अथ खो सुदिन्‍नस्स कलन्दपुत्तस्स मातापितरो सुदिन्‍नं कलन्दपुत्तं एतदवोचुं"
44
+ expected: "atha khao saudainanasasa kalanadapautatasasa maātaāpaitarao saudainanaṃ kalanadapautataṃ etadavaocauṃ"
45
+ - source: "त्वं खोसि, तात सुदिन्‍न, अम्हाकं एकपुत्तको पियो मनापो सुखेधितो सुखपरिहतो"
46
+ expected: "tavaṃ khaosai, taāta saudainana, amahaākaṃ ekapautatakao paiyao manaāpao saukhaedhaitao saukhaparaihatao"
47
+ - source: "न त्वं, तात सुदिन्‍न, किञ्‍चि दुक्खस्स जानासि"
48
+ expected: "na tavaṃ, taāta saudainana, kaiñacai daukakhasasa jaānaāsai"
49
+ - source: "अनुञ्‍ञातोम्हि किर मातापितूहि अगारस्मा अनगारियं पब्बज्‍जाया’’ति, हट्ठो उदग्गो पाणिना गत्तानि परिपुञ्छन्तो वुट्ठासि"
50
+ expected: "anauñañaātaomahai kaira maātaāpaitaūhai agaārasamaā anagaāraiyaṃ pababajajaāyaā’’tai, haṭaṭhao udagagao paāṇainaā gatataānai paraipauñachanatao vauṭaṭhaāsai"
51
+
52
+ map:
53
+
54
+ rules:
55
+ # note[3]
56
+ - pattern: \u0902(?=[कखगघङ])
57
+ result: ṅ
58
+ - pattern: \u0902(?=[चछजझञ])
59
+ result: ñ
60
+ - pattern: \u0902(?=[टठडढण])
61
+ result: ṇ
62
+ - pattern: \u0902(?=[तथदधन])
63
+ result: n
64
+
65
+ characters:
66
+
67
+ # I. Vowels and Diphthongs (see Note 1)
68
+
69
+ 'अ': 'a'
70
+ 'आ': 'ā'
71
+ 'इ': 'i'
72
+ 'ई': 'ī'
73
+ 'उ': 'u'
74
+ 'ऊ': 'ū'
75
+ 'ए': 'e'
76
+ 'ओ': 'o'
77
+
78
+ # II. Consonants (see Note 2)
79
+ # Gutturals
80
+ 'क': 'ka'
81
+ 'ख': 'kha'
82
+ 'ग': 'ga'
83
+ 'घ': 'gha'
84
+ 'ङ': 'ṅa'
85
+
86
+ # Palatals
87
+ 'च': 'ca'
88
+ 'छ': 'cha'
89
+ 'ज': 'ja'
90
+ 'झ': 'jha'
91
+ 'ञ': 'ña'
92
+
93
+ # Cerebrals
94
+ 'ट': 'ṭa'
95
+ 'ठ': 'ṭha'
96
+ 'ड': 'ḍa'
97
+ 'ढ': 'ḍha'
98
+ 'ण': 'ṇa'
99
+
100
+ # Dentals
101
+ 'त': 'ta'
102
+ 'थ': 'tha'
103
+ 'द': 'da'
104
+ 'ध': 'dha'
105
+ 'न': 'na'
106
+
107
+ # Labials
108
+ 'प': 'pa'
109
+ 'फ': 'pha'
110
+ 'ब': 'ba'
111
+ 'भ': 'bha'
112
+ 'म': 'ma'
113
+
114
+ # Semivowels
115
+ 'य': 'ya'
116
+ 'र': 'ra'
117
+ 'ल': 'la'
118
+ 'ळ': 'ḻa'
119
+ 'व': 'va'
120
+
121
+ # Sibilants
122
+ 'श': 'śa'
123
+ 'ष': 'ṣa'
124
+ 'स': 'sa'
125
+
126
+ # Aspirate
127
+ 'ह': 'ha'
128
+
129
+ # Visagga
130
+ 'ः': 'ḥ'
131
+
132
+ # Niggahīta/Anusvāra
133
+ 'ं': 'ṃ'
134
+
135
+ # Medials # Needed for connecting consonants
136
+ 'ा': "ā"
137
+ 'ि': "i"
138
+ 'ी': "ī"
139
+ 'ु': "u"
140
+ 'ू': "ū"
141
+ 'े': "e"
142
+ 'ो': "o"
143
+ '्': ""
144
+ '‍': ''# Used for joining
@@ -0,0 +1,47 @@
1
+ ---
2
+ authority_id: alalc
3
+ id: 2012
4
+ language: iso-639-2:pra
5
+ source_script: Deva
6
+ destination_script: Latn
7
+ name: Prakrit Romanization, 2012
8
+ url: https://www.loc.gov/catdir/cpso/romanization/sanskrit.pdf
9
+ creation_date: 2012
10
+ description: |
11
+ ALA-LC Romanization table for Prakrit
12
+
13
+ notes:
14
+
15
+ - Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
16
+ vowels following a consonant can be found in grammars; no distinction between the two is
17
+ made in transliteration.
18
+
19
+ - |
20
+ The vowel a is implicit after all consonants and consonant clusters and is supplied in
21
+ transliteration, with the following exceptions:
22
+
23
+ a) when another vowel is indicated by its appropriate sign; and
24
+ b) when the absence of any vowel is indicated by the subscript sign ( ् ) called halanta or
25
+ virāma.
26
+
27
+ - |
28
+ Exception: Anusvāra is transliterated by:
29
+
30
+ a) ṅ before gutturals,
31
+ b) ñ before palatals,
32
+ c) ṇ before cerebrals,
33
+ d) n before dentals, and
34
+ e) m before labials.
35
+ In other circumstances it is transliterated by a tilde (~) over the vowel.
36
+
37
+ - When doubled, avagraha is transliterated by two apostrophes ( ’’ ).
38
+
39
+ tests:
40
+ - source: "सृष्टिस्थितिविनाशानां शक्तिभूते सनातनि"
41
+ expected: "saṛṣaṭaisathaitaivainaāśaānaāṃ śakataibhaūtae sanaātanai"
42
+ - source: "गुणाश्रये गुणमये नारायणि नमोऽस्तु ते"
43
+ expected: "gauṇaāśarayae gauṇamayae naāraāyaṇai namao’satau tae"
44
+
45
+ map:
46
+
47
+ inherit: "alalc-san-Deva-Latn-2012"
@@ -0,0 +1,225 @@
1
+ ---
2
+ authority_id: alalc
3
+ id: 1997
4
+ language: iso-639-2:rus
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: ALA-LC Romanization System 1997
8
+ alias:
9
+ ogc11122:
10
+ code: rus_Cyrl2Latn_ALA_1997
11
+ description: Russian ALA-Library of Congress 1997 System
12
+ url: https://en.wikipedia.org/wiki/ALA-LC_romanization_for_Russian
13
+ creation_date: 1997
14
+ description: |
15
+ The ALA-LC Romanization tables for Slavic alphabets are a set of standards for romanization of texts
16
+ in various writing systems used in North American libraries and publications.
17
+ This version was published by the American Library Association and the Library of Congress in 1997.
18
+ This map implements the ALA-LC method of transliteration of Russian-language text from Cyrillic script to Latin script.
19
+
20
+ The formal, unambiguous version of the system requires some diacritics and two-letter tie characters which are often omitted in practice.
21
+
22
+ notes:
23
+ - Pre-1918 letters skipped
24
+ - Pre-18th century letters skipped
25
+
26
+ tests:
27
+ - source: Азов
28
+ expected: Azov
29
+ - source: Тамбов
30
+ expected: Tambov
31
+ - source: Барнаул
32
+ expected: Barnaul
33
+ - source: Кубань
34
+ expected: Kubanʹ
35
+ - source: Владимир
36
+ expected: Vladimir
37
+ - source: Ульяновск
38
+ expected: Ulʹi͡anovsk
39
+ - source: Грозный
40
+ expected: Groznyǐ
41
+ - source: Волгодонск
42
+ expected: Volgodonsk
43
+ - source: Дзержинский
44
+ expected: Dzerzhinskiǐ
45
+ - source: Нелидово
46
+ expected: Nelidovo
47
+ - source: Елизово
48
+ expected: Elizovo
49
+ - source: Чебоксары
50
+ expected: Cheboksary
51
+ - source: Ёлкин
52
+ expected: Ëlkin
53
+ - source: Озёрный
54
+ expected: Ozërnyǐ
55
+ - source: Жуков
56
+ expected: Zhukov
57
+ - source: Лужники
58
+ expected: Luzhniki
59
+ - source: Звенигород
60
+ expected: Zvenigorod
61
+ - source: Вязьма
62
+ expected: Vi͡azʹma
63
+ - source: Иркутск
64
+ expected: Irkutsk
65
+ - source: Апатиты
66
+ expected: Apatity
67
+ - source: Йошкар-Ола
68
+ expected: Ǐoshkar-Ola
69
+ - source: Бийск
70
+ expected: Biǐsk
71
+ - source: Киров
72
+ expected: Kirov
73
+ - source: Енисейск
74
+ expected: Eniseǐsk
75
+ - source: Ломоносов
76
+ expected: Lomonosov
77
+ - source: Нелидово
78
+ expected: Nelidovo
79
+ - source: Менделеев
80
+ expected: Mendeleev
81
+ - source: Каменка
82
+ expected: Kamenka
83
+ - source: Новосибирск
84
+ expected: Novosibirsk
85
+ - source: Кандалакша
86
+ expected: Kandalaksha
87
+ - source: Омск
88
+ expected: Omsk
89
+ - source: Красноярск
90
+ expected: Krasnoi͡arsk
91
+ - source: Петрозаводск
92
+ expected: Petrozavodsk
93
+ - source: Серпухов
94
+ expected: Serpukhov
95
+ - source: Ростов
96
+ expected: Rostov
97
+ - source: Северобайкальск
98
+ expected: Severobaǐkalʹsk
99
+ - source: Сковородино
100
+ expected: Skovorodino
101
+ - source: Чайковский
102
+ expected: Chaǐkovskiǐ
103
+ - source: Тамбов
104
+ expected: Tambov
105
+ - source: Мытищи
106
+ expected: Mytishchi
107
+ - source: Углич
108
+ expected: Uglich
109
+ - source: Дудинка
110
+ expected: Dudinka
111
+ - source: Фурманов
112
+ expected: Furmanov
113
+ - source: Уфа
114
+ expected: Ufa
115
+ - source: Хабаровск
116
+ expected: Khabarovsk
117
+ - source: Прохладный
118
+ expected: Prokhladnyǐ
119
+ - source: Цимлянск
120
+ expected: T͡Simli͡ansk
121
+ - source: Ельцин
122
+ expected: Elʹt͡sin
123
+ - source: Чебоксары
124
+ expected: Cheboksary
125
+ - source: Печора
126
+ expected: Pechora
127
+ - source: Шахтёрск
128
+ expected: Shakhtërsk
129
+ - source: Мышкин
130
+ expected: Myshkin
131
+ - source: Щёлково
132
+ expected: Shchëlkovo
133
+ - source: Ртищево
134
+ expected: Rtishchevo
135
+ - source: Подъездной
136
+ expected: Podʺezdnoǐ
137
+ - source: Ыттык-Кёль
138
+ expected: Yttyk-Këlʹ
139
+ - source: Тында
140
+ expected: Tynda
141
+ - source: Тюмень
142
+ expected: Ti͡umenʹ
143
+ - source: Электрогорск
144
+ expected: Ėlektrogorsk
145
+ - source: Радиоэлектроника
146
+ expected: Radioėlektronika
147
+ - source: Юбилейный
148
+ expected: I͡Ubileǐnyǐ
149
+ - source: Ключевская
150
+ expected: Kli͡uchevskai͡a
151
+ - source: Якутск
152
+ expected: I͡Akutsk
153
+ - source: Брянск
154
+ expected: Bri͡ansk
155
+
156
+ map:
157
+ characters:
158
+ "\u0027": "" # '
159
+ "\u0410": "A" # А
160
+ "\u0411": "B" # Б
161
+ "\u0412": "V" # В
162
+ "\u0413": "G" # Г
163
+ "\u0414": "D" # Д
164
+ "\u0415": "E" # Е
165
+ "\u0401": "Ë" # Ё
166
+ "\u0416": "Zh" # Ж
167
+ "\u0417": "Z" # З
168
+ "\u0418": "I" # И
169
+ "\u0419": "\u01CF" # Й
170
+ "\u041A": "K" # К
171
+ "\u041B": "L" # Л
172
+ "\u041C": "M" # М
173
+ "\u041D": "N" # Н
174
+ "\u041E": "O" # О
175
+ "\u041F": "P" # П
176
+ "\u0420": "R" # Р
177
+ "\u0421": "S" # С
178
+ "\u0422": "T" # Т
179
+ "\u0423": "U" # У
180
+ "\u0424": "F" # Ф
181
+ "\u0425": "Kh" # Х
182
+ "\u0426": "T\u0361S" # Ц
183
+ "\u0427": "Ch" # Ч
184
+ "\u0428": "Sh" # Ш
185
+ "\u0429": "Shch" # Щ
186
+ "\u042A": "ʺ" # Ъ
187
+ "\u042B": "Y" # Ы
188
+ "\u042C": "ʹ" # Ь
189
+ "\u042D": "E\u0307" # Э
190
+ "\u042E": "I\u0361U" # Ю
191
+ "\u042F": "I\u0361A" # Я
192
+
193
+ "\u0430": "a" # а
194
+ "\u0431": "b" # б
195
+ "\u0432": "v" # в
196
+ "\u0433": "g" # г
197
+ "\u0434": "d" # д
198
+ "\u0435": "e" # e
199
+ "\u0451": "ë" # ё
200
+ "\u0436": "zh" # ж
201
+ "\u0437": "z" # з
202
+ "\u0438": "i" # и
203
+ "\u0439": "\u01d0" # й
204
+ "\u043A": "k" # к
205
+ "\u043B": "l" # л
206
+ "\u043C": "m" # м
207
+ "\u043D": "n" # н
208
+ "\u043E": "o" # о
209
+ "\u043F": "p" # п
210
+ "\u0440": "r" # р
211
+ "\u0441": "s" # с
212
+ "\u0442": "t" # т
213
+ "\u0443": "u" # у
214
+ "\u0444": "f" # ф
215
+ "\u0445": "kh" # х
216
+ "\u0446": "t\u0361s" # ц
217
+ "\u0447": "ch" # ч
218
+ "\u0448": "sh" # ш
219
+ "\u0449": "shch" # щ
220
+ "\u044A": "ʺ" # ъ
221
+ "\u044B": "y" # ы
222
+ "\u044C": "ʹ" # ь
223
+ "\u044D": "e\u0307" # э
224
+ "\u044E": "i\u0361u" # ю
225
+ "\u044F": "i\u0361a" # я
@@ -0,0 +1,162 @@
1
+ ---
2
+ authority_id: alalc
3
+ id: 2012
4
+ language: iso-639-2:rus
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: ALA-LC Romanization System 2012
8
+ url: https://www.loc.gov/catdir/cpso/romanization/russian.pdf
9
+ creation_date: 2012
10
+ description: |
11
+ The ALA-LC Romanization tables for Slavic alphabets are a set of standards for romanization of texts
12
+ in various writing systems used in North American libraries and publications.
13
+ The latest version was published by the American Library Association and the Library of Congress in 2012.
14
+
15
+ notes:
16
+ - The letters І, Ѣ, Ѳ and Ѵ were eliminated in the orthographic reform of 1918. For other obsolete letters appearing in Russian texts, consult the Church Slavic table.
17
+
18
+ tests:
19
+ - source: Азов
20
+ expected: Azov
21
+ - source: Тамбов
22
+ expected: Tambov
23
+ - source: Барнаул
24
+ expected: Barnaul
25
+ - source: Кубань
26
+ expected: Kubanʹ
27
+ - source: Владимир
28
+ expected: Vladimir
29
+ - source: Ульяновск
30
+ expected: Ulʹi͡anovsk
31
+ - source: Грозный
32
+ expected: Groznyǐ
33
+ - source: Волгодонск
34
+ expected: Volgodonsk
35
+ - source: Дзержинский
36
+ expected: Dzerzhinskiǐ
37
+ - source: Нелидово
38
+ expected: Nelidovo
39
+ - source: Елизово
40
+ expected: Elizovo
41
+ - source: Чебоксары
42
+ expected: Cheboksary
43
+ - source: Ёлкин
44
+ expected: Ëlkin
45
+ - source: Озёрный
46
+ expected: Ozërnyǐ
47
+ - source: Жуков
48
+ expected: Zhukov
49
+ - source: Лужники
50
+ expected: Luzhniki
51
+ - source: Звенигород
52
+ expected: Zvenigorod
53
+ - source: Вязьма
54
+ expected: Vi͡azʹma
55
+ - source: Иркутск
56
+ expected: Irkutsk
57
+ - source: Апатиты
58
+ expected: Apatity
59
+ - source: Йошкар-Ола
60
+ expected: Ǐoshkar-Ola
61
+ - source: Бийск
62
+ expected: Biǐsk
63
+ - source: Киров
64
+ expected: Kirov
65
+ - source: Енисейск
66
+ expected: Eniseǐsk
67
+ - source: Ломоносов
68
+ expected: Lomonosov
69
+ - source: Нелидово
70
+ expected: Nelidovo
71
+ - source: Менделеев
72
+ expected: Mendeleev
73
+ - source: Каменка
74
+ expected: Kamenka
75
+ - source: Новосибирск
76
+ expected: Novosibirsk
77
+ - source: Кандалакша
78
+ expected: Kandalaksha
79
+ - source: Омск
80
+ expected: Omsk
81
+ - source: Красноярск
82
+ expected: Krasnoi͡arsk
83
+ - source: Петрозаводск
84
+ expected: Petrozavodsk
85
+ - source: Серпухов
86
+ expected: Serpukhov
87
+ - source: Ростов
88
+ expected: Rostov
89
+ - source: Северобайкальск
90
+ expected: Severobaǐkalʹsk
91
+ - source: Сковородино
92
+ expected: Skovorodino
93
+ - source: Чайковский
94
+ expected: Chaǐkovskiǐ
95
+ - source: Тамбов
96
+ expected: Tambov
97
+ - source: Мытищи
98
+ expected: Mytishchi
99
+ - source: Углич
100
+ expected: Uglich
101
+ - source: Дудинка
102
+ expected: Dudinka
103
+ - source: Фурманов
104
+ expected: Furmanov
105
+ - source: Уфа
106
+ expected: Ufa
107
+ - source: Хабаровск
108
+ expected: Khabarovsk
109
+ - source: Прохладный
110
+ expected: Prokhladnyǐ
111
+ - source: Цимлянск
112
+ expected: T͡Simli͡ansk
113
+ - source: Ельцин
114
+ expected: Elʹt͡sin
115
+ - source: Чебоксары
116
+ expected: Cheboksary
117
+ - source: Печора
118
+ expected: Pechora
119
+ - source: Шахтёрск
120
+ expected: Shakhtërsk
121
+ - source: Мышкин
122
+ expected: Myshkin
123
+ - source: Щёлково
124
+ expected: Shchëlkovo
125
+ - source: Ртищево
126
+ expected: Rtishchevo
127
+ - source: Подъездной
128
+ expected: Podʺezdnoǐ
129
+ - source: Ыттык-Кёль
130
+ expected: Yttyk-Këlʹ
131
+ - source: Тында
132
+ expected: Tynda
133
+ - source: Тюмень
134
+ expected: Ti͡umenʹ
135
+ - source: Электрогорск
136
+ expected: Ėlektrogorsk
137
+ - source: Радиоэлектроника
138
+ expected: Radioėlektronika
139
+ - source: Юбилейный
140
+ expected: I͡Ubileǐnyǐ
141
+ - source: Ключевская
142
+ expected: Kli͡uchevskai͡a
143
+ - source: Якутск
144
+ expected: I͡Akutsk
145
+ - source: Брянск
146
+ expected: Bri͡ansk
147
+
148
+ map:
149
+ inherit: alalc-rus-Cyrl-Latn-1997
150
+
151
+ characters:
152
+ "\u0406": "\u012A" # І
153
+ "\u0456": "\u012B" # і
154
+
155
+ "\u0462": "I\u0361E" # Ѣ
156
+ "\u0463": "i\u0361e" # ѣ
157
+
158
+ "\u0472": "F\u0307" # Ѳ
159
+ "\u0473": "f\u0307" # ѳ
160
+
161
+ "\u0474": "Y\u0307" # Ѵ
162
+ "\u0475": "y\u0307" # ѵ