interscript 0.1.2 → 0.1.7

Sign up to get free protection for your applications and to get access to all the features.
Files changed (261) hide show
  1. checksums.yaml +4 -4
  2. data/README.adoc +250 -17
  3. data/lib/g2pwrapper.py +34 -0
  4. data/lib/interscript.rb +142 -20
  5. data/lib/interscript/command.rb +28 -0
  6. data/lib/interscript/fs.rb +69 -0
  7. data/lib/interscript/mapping.rb +142 -0
  8. data/lib/interscript/opal.rb +57 -0
  9. data/lib/interscript/opal/entrypoint.rb +12 -0
  10. data/lib/interscript/opal/map_translate.rb +7 -0
  11. data/lib/interscript/opal/maps.js.erb +10 -0
  12. data/lib/interscript/version.rb +1 -1
  13. data/lib/model-7 +0 -0
  14. data/lib/tha-pt-b-7 +0 -0
  15. data/maps/acadsin-zho-Hani-Latn-2002.yaml +38916 -0
  16. data/maps/alalc-amh-Ethi-Latn-1997.yaml +513 -0
  17. data/maps/alalc-amh-Ethi-Latn-2011.yaml +138 -0
  18. data/maps/alalc-ara-Arab-Latn-1997.yaml +1287 -0
  19. data/maps/alalc-asm-Deva-Latn-1997.yaml +165 -0
  20. data/maps/alalc-asm-Deva-Latn-2012.yaml +40 -0
  21. data/maps/alalc-aze-Cyrl-Latn-1997.yaml +145 -0
  22. data/maps/alalc-bel-Cyrl-Latn-1997.yaml +129 -0
  23. data/maps/alalc-ben-Beng-Latn-2017.yaml +130 -0
  24. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +98 -0
  25. data/maps/alalc-ell-Grek-Latn-1997.yaml +628 -0
  26. data/maps/alalc-ell-Grek-Latn-2010.yaml +626 -0
  27. data/maps/alalc-guj-Gujr-Latn-1997.yaml +266 -0
  28. data/maps/alalc-guj-Gujr-Latn-2011.yaml +64 -0
  29. data/maps/alalc-hin-Deva-Latn-1997.yaml +211 -0
  30. data/maps/alalc-hin-Deva-Latn-2011.yaml +47 -0
  31. data/maps/alalc-kat-Geok-Latn-1997.yaml +111 -0
  32. data/maps/alalc-kat-Geor-Latn-1997.yaml +150 -0
  33. data/maps/alalc-kor-Hang-Latn-1997.yaml +98 -0
  34. data/maps/alalc-mal-Mlym-Latn-1997.yaml +303 -0
  35. data/maps/alalc-mal-Mlym-Latn-2012.yaml +73 -0
  36. data/maps/alalc-mar-Deva-Latn-1997.yaml +189 -0
  37. data/maps/alalc-mar-Deva-Latn-2011.yaml +45 -0
  38. data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +114 -0
  39. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +103 -0
  40. data/maps/alalc-mon-Cyrl-Latn-1997.yaml +220 -0
  41. data/maps/alalc-pan-Guru-Latn-1997.yaml +256 -0
  42. data/maps/alalc-pan-Guru-Latn-2011.yaml +78 -0
  43. data/maps/alalc-per-Arab-Latn-1997.yaml +375 -0
  44. data/maps/alalc-pli-Deva-Latn-2012.yaml +144 -0
  45. data/maps/alalc-pra-Deva-Latn-2012.yaml +47 -0
  46. data/maps/alalc-rus-Cyrl-Latn-1997.yaml +225 -0
  47. data/maps/alalc-rus-Cyrl-Latn-2012.yaml +162 -0
  48. data/maps/alalc-san-Deva-Latn-2012.yaml +172 -0
  49. data/maps/alalc-sin-Sinh-Latn-1997.yaml +292 -0
  50. data/maps/alalc-sin-Sinh-Latn-2011.yaml +71 -0
  51. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +118 -0
  52. data/maps/alalc-srp-Cyrl-Latn-2013.yaml +135 -0
  53. data/maps/alalc-tam-Taml-Latn-1997.yaml +62 -0
  54. data/maps/alalc-tam-Taml-Latn-2011.yaml +58 -0
  55. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +145 -0
  56. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +16 -0
  57. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +283 -0
  58. data/maps/{bas-rus-Cyrl-Latn-bss.yaml → bas-rus-Cyrl-Latn-2017-bss.yaml} +58 -33
  59. data/maps/{bas-rus-Cyrl-Latn-oss.yaml → bas-rus-Cyrl-Latn-2017-oss.yaml} +55 -35
  60. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +292 -0
  61. data/maps/bgn-kor-Hang-Latn-1943.yaml +35 -0
  62. data/maps/bgn-kor-Kore-Latn-1943.yaml +31 -0
  63. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +208 -0
  64. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +208 -0
  65. data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +532 -0
  66. data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +596 -0
  67. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +2 -3
  68. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +104 -0
  69. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +188 -0
  70. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +289 -0
  71. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +119 -0
  72. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +15 -65
  73. data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +184 -0
  74. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +705 -0
  75. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +23 -0
  76. data/maps/{bgnpcgn-per-Arab-Latn-1956.yaml → bgnpcgn-fas-Arab-Latn-1956.yaml} +5 -2
  77. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +257 -0
  78. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +131 -0
  79. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +42 -0
  80. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +253 -0
  81. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +48 -0
  82. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +48 -0
  83. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +163 -0
  84. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +190 -0
  85. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +223 -0
  86. data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +230 -0
  87. data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +336 -0
  88. data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +639 -0
  89. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +459 -0
  90. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +168 -0
  91. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +150 -65
  92. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +170 -0
  93. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +220 -0
  94. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +240 -0
  95. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +80 -4
  96. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +119 -0
  97. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +127 -0
  98. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +82 -0
  99. data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +7456 -0
  100. data/maps/bis-asm-Beng-Latn-13194-1991.yaml +159 -0
  101. data/maps/bis-ben-Beng-Latn-13194-1991.yaml +156 -0
  102. data/maps/bis-dev-Deva-Latn-13194-1991.yaml +184 -0
  103. data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +181 -0
  104. data/maps/bis-knd-Knda-Latn-13194-1991.yaml +173 -0
  105. data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +176 -0
  106. data/maps/bis-ori-Orya-Latn-13194-1991.yaml +160 -0
  107. data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +175 -0
  108. data/maps/bis-tel-Telu-Latn-13194-1991.yaml +170 -0
  109. data/maps/bis-tml-Taml-Latn-13194-1991.yaml +155 -0
  110. data/maps/by-bel-Cyrl-Latn-1998.yaml +172 -0
  111. data/maps/by-bel-Cyrl-Latn-2007.yaml +115 -0
  112. data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +899 -0
  113. data/maps/din-hin-Deva-Latn-33904-2018.yaml +100 -0
  114. data/maps/din-kat-Geor-Latn-32707-2010.yaml +145 -0
  115. data/maps/din-mar-Deva-Latn-33904-2018.yaml +84 -0
  116. data/maps/din-nep-Deva-Latn-33904-2018.yaml +119 -0
  117. data/maps/din-pli-Deva-Latn-33904-2018.yaml +75 -0
  118. data/maps/din-pra-Deva-Latn-33904-2018.yaml +63 -0
  119. data/maps/din-san-Deva-Latn-33904-2018.yaml +338 -0
  120. data/maps/din-tam-Taml-Latn-33903-2016.yaml +213 -0
  121. data/maps/dos-nep-Deva-Latn-1997.yaml +47 -0
  122. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +684 -0
  123. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +680 -0
  124. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +19 -0
  125. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +31 -0
  126. data/maps/ggg-kat-Geor-Latn-2002.yaml +92 -0
  127. data/maps/gki-bel-Cyrl-Latn-1992.yaml +33 -0
  128. data/maps/gki-bel-Cyrl-Latn-2000.yaml +201 -0
  129. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +190 -0
  130. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +157 -0
  131. data/maps/hk-yue-Hani-Latn-1888.yaml +38497 -0
  132. data/maps/icao-bel-Cyrl-Latn-9303.yaml +109 -98
  133. data/maps/icao-bul-Cyrl-Latn-9303.yaml +2 -7
  134. data/maps/{icao-per-Arab-Latn-9303.yaml → icao-fas-Arab-Latn-9303.yaml} +6 -8
  135. data/maps/icao-heb-Hebr-Latn-9303.yaml +119 -125
  136. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +2 -3
  137. data/maps/icao-rus-Cyrl-Latn-9303.yaml +2 -4
  138. data/maps/icao-srp-Cyrl-Latn-9303.yaml +2 -3
  139. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +2 -4
  140. data/maps/iso-ara-Arab-Latn-233-1984.yaml +323 -0
  141. data/maps/iso-asm-Beng-Latn-15919-2001.yaml +75 -0
  142. data/maps/iso-ben-Beng-Latn-15919-2001.yaml +175 -0
  143. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +613 -0
  144. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +44 -0
  145. data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +220 -0
  146. data/maps/iso-hin-Deva-Latn-15919-2001.yaml +87 -0
  147. data/maps/iso-inc-Deva-Latn-15919-2001.yaml +61 -0
  148. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +66 -0
  149. data/maps/iso-kan-Knda-Latn-15919-2001.yaml +220 -0
  150. data/maps/iso-kat-Geor-Latn-9984-1996.yaml +145 -0
  151. data/maps/iso-kor-Hang-Latn-1996-method1.yaml +240 -0
  152. data/maps/iso-kor-Hang-Latn-1996-method2.yaml +226 -0
  153. data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +281 -0
  154. data/maps/iso-mar-Deva-Latn-15919-2001.yaml +75 -0
  155. data/maps/iso-nep-Deva-Latn-15919-2001.yaml +87 -0
  156. data/maps/iso-ori-Orya-Latn-15919-2001.yaml +193 -0
  157. data/maps/iso-pan-Guru-Latn-15919-2001.yaml +222 -0
  158. data/maps/iso-pli-Beng-Latn-15919-2001.yaml +73 -0
  159. data/maps/iso-pli-Deva-Latn-15919-2001.yaml +74 -0
  160. data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +219 -0
  161. data/maps/iso-pli-Thai-Latn-15919-2001.yaml +55 -0
  162. data/maps/iso-pra-Deva-Latn-15919-2001.yaml +59 -0
  163. data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +366 -0
  164. data/maps/{iso-rus-Cyrl-Latn-iso9.yaml → iso-rus-Cyrl-Latn-9-1995.yaml} +4 -6
  165. data/maps/iso-san-Deva-Latn-15919-2001.yaml +220 -0
  166. data/maps/iso-tam-Taml-Latn-15919-2001.yaml +159 -0
  167. data/maps/iso-tel-Telu-Latn-15919-2001.yaml +220 -0
  168. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +109 -0
  169. data/maps/kp-kor-Hang-Latn-2002.yaml +909 -0
  170. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +44820 -0
  171. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +411 -0
  172. data/maps/mns-mon-Cyrl-Latn-5217-2012.yaml +163 -0
  173. data/maps/mns-mon-Latn-Cyrl-5217-2012.yaml +200 -0
  174. data/maps/moct-kor-Hang-Latn-2000.yaml +807 -0
  175. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +541 -0
  176. data/maps/mvd-bel-Cyrl-Latn-2008.yaml +225 -0
  177. data/maps/mvd-bel-Cyrl-Latn-2010.yaml +63 -0
  178. data/maps/mvd-rus-Cyrl-Latn-2008.yaml +109 -0
  179. data/maps/mvd-rus-Cyrl-Latn-2010.yaml +37 -0
  180. data/maps/odni-ara-Arab-Latn-2015.yaml +425 -0
  181. data/maps/odni-aze-Cyrl-Latn-2015.yaml +144 -0
  182. data/maps/odni-bel-Cyrl-Latn-2015.yaml +148 -0
  183. data/maps/odni-bul-Cyrl-Latn-2015.yaml +96 -0
  184. data/maps/odni-che-Cyrl-Latn-2015.yaml +169 -0
  185. data/maps/odni-fas-Arab-Latn-2015.yaml +406 -0
  186. data/maps/odni-hin-Deva-Latn-2015.yaml +258 -0
  187. data/maps/odni-kat-Geor-Latn-2015.yaml +87 -0
  188. data/maps/odni-kaz-Cyrl-Latn-2015.yaml +148 -0
  189. data/maps/odni-kir-Cyrl-Latn-2015.yaml +136 -0
  190. data/maps/odni-kor-Hang-Latn-2015.yaml +375 -0
  191. data/maps/odni-mkd-Cyrl-Latn-2015.yaml +122 -0
  192. data/maps/odni-per-Arab-Latn-2015.yaml +228 -0
  193. data/maps/odni-rus-Cyrl-Latn-2015.yaml +77 -0
  194. data/maps/odni-srp-Cyrl-Latn-2015.yaml +129 -0
  195. data/maps/odni-tat-Cyrl-Latn-2015.yaml +142 -0
  196. data/maps/odni-tgk-Cyrl-Latn-2015.yaml +148 -0
  197. data/maps/odni-uig-Cyrl-Latn-2015.yaml +138 -0
  198. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +157 -0
  199. data/maps/odni-urd-Arab-Latn-2015.yaml +221 -0
  200. data/maps/odni-uzb-Cyrl-Latn-2015.yaml +166 -0
  201. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +90 -0
  202. data/maps/royin-tha-Thai-Latn-1968.yaml +183 -0
  203. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +180 -0
  204. data/maps/royin-tha-Thai-Latn-1999.yaml +80 -0
  205. data/maps/{cn-chn-Hans-Latn-pinyin.yaml → sac-zho-Hans-Latn-1979.yaml} +11 -8
  206. data/maps/sasm-mon-Mong-Latn-general-1978.yaml +389 -0
  207. data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +354 -0
  208. data/maps/ses-ara-Arab-Latn-1930.yaml +283 -0
  209. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +222 -0
  210. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +197 -0
  211. data/maps/ua-ukr-Cyrl-Latn-2007.yaml +75 -0
  212. data/maps/ua-ukr-Cyrl-Latn-2010.yaml +192 -0
  213. data/maps/un-amh-Ethi-Latn-2016.yaml +602 -0
  214. data/maps/un-ara-Arab-Latn-1971.yaml +139 -0
  215. data/maps/un-ara-Arab-Latn-1972.yaml +159 -0
  216. data/maps/un-ara-Arab-Latn-2017.yaml +420 -0
  217. data/maps/un-bel-Cyrl-Latn-2007.yaml +114 -0
  218. data/maps/un-ben-Beng-Latn-2016.yaml +534 -0
  219. data/maps/un-ell-Grek-Latn-1987-phonetic.yaml +780 -0
  220. data/maps/un-ell-Grek-Latn-1987-tl.yaml +31 -0
  221. data/maps/un-ell-Grek-Latn-1987-ts.yaml +19 -0
  222. data/maps/un-hin-Deva-Latn-2016.yaml +222 -0
  223. data/maps/un-mar-Deva-Latn-2016.yaml +91 -0
  224. data/maps/un-mon-Mong-Latn-general-2013.yaml +264 -0
  225. data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +264 -0
  226. data/maps/un-nep-Deva-Latn-1972.yaml +350 -0
  227. data/maps/un-nep-Deva-Latn-2013.yaml +74 -0
  228. data/maps/un-rus-Cyrl-Latn-1987.yaml +166 -0
  229. data/maps/un-ukr-Cyrl-Latn-1998.yaml +53 -0
  230. data/maps/un-ukr-Cyrl-Latn-2012.yaml +162 -0
  231. data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +221 -0
  232. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +406 -0
  233. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +386 -0
  234. data/maps/var-kor-Hang-Hang-jamo.yaml +11193 -0
  235. data/maps/var-kor-Hang-Latn-mr-1939.yaml +1054 -0
  236. data/maps/var-kor-Kore-Hang-2013.yaml +59754 -0
  237. data/maps/var-kor-Kore-Latn-mr-1939.yaml +36 -0
  238. data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +43 -0
  239. data/maps/var-mon-Mong-Latn-1930.yaml +102 -0
  240. data/maps/var-mon-Mong-Latn-lessing.yaml +272 -0
  241. data/maps/var-mon-Mong-Latn-vpmc.yaml +274 -0
  242. data/maps/var-pra-Deva-Latn-iast-1912.yaml +30 -0
  243. data/maps/var-san-Deva-Latn-iast-1912.yaml +149 -0
  244. data/maps/var-tha-Thai-Thai-phonemic.yaml +59 -0
  245. data/maps/var-tha-Thai-Zsym-ipa.yaml +301 -0
  246. data/maps/var-zho-Hani-Latn-wd-1979.yaml +38912 -0
  247. data/spec/interscript/filenames_spec.rb +384 -0
  248. data/spec/interscript/mapping_spec.rb +42 -0
  249. data/spec/interscript_spec.rb +23 -5
  250. data/spec/spec_helper.rb +3 -1
  251. metadata +364 -34
  252. data/bin/interscript +0 -20
  253. data/bin/rspec +0 -29
  254. data/maps/bgnpcgn-chn-Hans-Latn-pinyin.yaml +0 -7503
  255. data/maps/historic-jpn-Hrkt-Latn-hepburn.yaml +0 -336
  256. data/maps/icao-gre-Grek-Latn-9303.yaml +0 -101
  257. data/maps/mext-jpn-Hrkt-Latn-hepburn.yaml +0 -330
  258. data/maps/mext-jpn-Hrkt-Latn-kunrei.yaml +0 -308
  259. data/maps/un-jpn-Hrkt-Latn-hepburn.yaml +0 -313
  260. data/maps/un-jpn-Hrkt-Latn-kunrei.yaml +0 -354
  261. data/maps/un-mon-Mong-Latn-2013.yaml +0 -80
@@ -0,0 +1,19 @@
1
+ ---
2
+ authority_id: elot
3
+ id: 2001-tl
4
+ language: iso-639-2:ell
5
+ source_script: Grek
6
+ destination_script: Latn
7
+ name: ELOT 743:2001
8
+ url: https://docplayer.gr/docview/18/849832/#file=/storage/18/849832/849832.pdf
9
+ creation_date: 2001
10
+ description: |
11
+ Reversible transliteration standard, ELOT
12
+
13
+ note:
14
+ - Transliteration standard (reversible): Clause 3.1, Table 1
15
+
16
+ map:
17
+ character_separator: ""
18
+ word_separator: " "
19
+ inherit: "iso-ell-Grek-Latn-843-1997-t1"
@@ -0,0 +1,31 @@
1
+ ---
2
+ authority_id: elot
3
+ id: 2001-ts
4
+ language: iso-639-2:ell
5
+ source_script: Grek
6
+ destination_script: Latn
7
+ name: ELOT 743:2001
8
+ url: https://docplayer.gr/docview/18/849832/#file=/storage/18/849832/849832.pdf
9
+ creation_date: 2001
10
+ description: |
11
+ Reversible transliteration standard, ELOT
12
+
13
+ note:
14
+ - Transcription standard (reversible): Clause 3.1, Table 2
15
+
16
+ tests:
17
+
18
+ - source: |
19
+ Ένα πράμα μόνον με παρακίνησε κι εμένα να γράψω ότι τούτην την πατρίδα την έχομεν όλοι μαζί, και σοφοί κι αμαθείς και πλούσιοι και φτωχοί και πολιτικοί και στρατιωτικοί και οι πλέον μικρότεροι άνθρωποι· όσοι αγωνιστήκαμεν, αναλόγως ο καθείς, έχομεν να ζήσομεν εδώ. Το λοιπόν δουλέψαμεν όλοι μαζί, να την φυλάμεν κι όλοι μαζί και να μην λέγει ούτε ο δυνατός «εγώ» ούτε ο αδύνατος. Ξέρετε πότε να λέγει ο καθείς «εγώ»; Όταν αγωνιστεί μόνος του και φκιάσει ή χαλάσει, να λέγει «εγώ»· όταν όμως αγωνίζονται πολλοί και φκιάνουν, τότε να λένε «εμείς». Είμαστε εις το «εμείς» κι όχι εις το «εγώ». Και εις το εξής να μάθομεν γνώση, αν θέλομεν να φκιάσομεν χωριόν, να ζήσομεν όλοι μαζί.
20
+
21
+ Γιάννης Μακρυγιάννης.
22
+
23
+ expected: |
24
+ Éna práma mónon me parakínise ki eména na grápso óti toútin tin patrída tin échomen óloi mazí, kai sofoí ki amatheís kai ploúsioi kai ftochoí kai politikoí kai stratiotikoí kai oi pléon mikróteroi ánthropoi; ósoi agonistíkamen, analógos o katheís, échomen na zísomen edó. To loipón doulépsamen óloi mazí, na tin fylámen ki óloi mazí kai na min légei oúte o dynatós «egó» oúte o adýnatos. Xérete póte na légei o katheís «egó»? Ótan agonisteí mónos tou kai fkiásei í chalásei, na légei «egó»; ótan ómos agonízontai polloí kai fkiánoun, tóte na léne «emeís». Eímaste eis to «emeís» ki óchi eis to «egó». Kai eis to exís na máthomen gnósi, an thélomen na fkiásomen chorión, na zísomen óloi mazí.
25
+
26
+ Giánnis Makrygiánnis.
27
+
28
+ map:
29
+ character_separator: ""
30
+ word_separator: " "
31
+ inherit: "iso-ell-Grek-Latn-843-1997-t2"
@@ -0,0 +1,92 @@
1
+ ---
2
+ authority_id: ggg
3
+ id: 2002
4
+ language: iso-639-2:kat
5
+ source_script: Geor
6
+ destination_script: Latn
7
+ name: Georgian State Department of Geodesy and Cartography 2002 System
8
+ alias:
9
+ ogc11122:
10
+ code: kat_Geor2Latn_GGG_2002
11
+ description: Georgian State Department of Geodesy and Cartography 2002 System
12
+ url: https://transliteration.eki.ee/pdf/Georgian.pdf
13
+ creation_date: 1998
14
+ confirmation_date: 2002
15
+ description: |
16
+ The national system of romanization adopted in February 2002 by the State
17
+ Department of Geodesy and Cartography of Georgia and the Institute
18
+ of Linguistics, Georgian Academy of Sciences.
19
+
20
+ notes:
21
+ - Georgian script refers in this document to the Mkhedruli alphabet.
22
+
23
+ - There is no case in Georgian.
24
+
25
+ tests:
26
+ - source: თბილისი
27
+ expected: tbilisi
28
+
29
+ - source: მეღვინეთუხუცესი
30
+ expected: meghvinetukhutsesi
31
+
32
+ - source: ჭიანჭველა
33
+ expected: ch’ianch’vela
34
+
35
+ - source: ბაყაყი
36
+ expected: baq’aq’i
37
+
38
+ - source: ჩხალთის ქედი
39
+ expected: chkhaltis kedi
40
+
41
+ - source: აბჟააფთრა
42
+ expected: abzhaaptra
43
+
44
+ - source: ამბროლაურის მუნიციპალიტეტი
45
+ expected: ambrolauris munitsip’alit’et’i
46
+
47
+ - source: მარტვილის მუნიციპალიტეტი
48
+ expected: mart’vilis munitsip’alit’et’i
49
+
50
+ - source: ლეკუხონა
51
+ expected: lek’ukhona
52
+
53
+ - source: მყინვარი აღმოსავლეთი მაგუაშირხა
54
+ expected: mq’invari aghmosavleti maguashirkha
55
+
56
+
57
+
58
+ map:
59
+ characters:
60
+ '\u10d0' : 'a' # ა
61
+ '\u10d1' : 'b' # ბ
62
+ '\u10d2' : 'g' # გ
63
+ '\u10d3' : 'd' # დ
64
+ '\u10d4' : 'e' # ე
65
+ '\u10d5' : 'v' # ვ
66
+ '\u10d6' : 'z' # ზ
67
+ '\u10d7' : 't' # თ
68
+ '\u10d8' : 'i' # ი
69
+ '\u10d9' : 'k’' # კ
70
+ '\u10da' : 'l' # ლ
71
+ '\u10db' : 'm' # მ
72
+ '\u10dc' : 'n' # ნ
73
+ '\u10dd' : 'o' # ო
74
+ '\u10de' : 'p’' # პ
75
+ '\u10df' : 'zh' # ჟ
76
+ '\u10e0' : 'r' # რ
77
+ '\u10e1' : 's' # ს
78
+ '\u10e2' : 't’' # ტ
79
+ '\u10e3' : 'u' # უ
80
+ '\u10e4' : 'p' # ფ
81
+ '\u10e5' : 'k' # ქ
82
+ '\u10e6' : 'gh' # ღ
83
+ '\u10e7' : 'q’' # ყ
84
+ '\u10e8' : 'sh' # შ
85
+ '\u10e9' : 'ch' # ჩ
86
+ '\u10ea' : 'ts' # ც
87
+ '\u10eb' : 'dz' # ძ
88
+ '\u10ec' : 'ts’' # წ
89
+ '\u10ed' : 'ch’' # ჭ
90
+ '\u10ee' : 'kh' # ხ
91
+ '\u10ef' : 'j' # ჯ
92
+ '\u10f0' : 'h' # ჰ
@@ -0,0 +1,33 @@
1
+ ---
2
+ authority_id: gki
3
+ id: 1992
4
+ language: iso-639-2:bel
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: Byelorussian National Cartographic Authority 1992-3 System (based on GOST 1983)
8
+ url: https://unstats.un.org/unsd/geoinfo/UNGEGN/docs/7th-uncsgn-docs/econf/7th_UNCSGN_econf.91_3_Add1.pdf
9
+ creation_date: 1992
10
+
11
+ tests:
12
+ - source: 'Сямашкі'
13
+ expected: 'Sjamaški'
14
+ # "Syamashki" in GNDB `bel_Cyrl2Latn_GBO_1992`, but that is clearly bgnpcgn-ukr-Cyrl-Latn-1965
15
+ - source: 'Старадворцы'
16
+ expected: 'Staradvorcy'
17
+ # "Staradvortsy" in GNDB `bel_Cyrl2Latn_GBO_1992`, but that is clearly bgnpcgn-ukr-Cyrl-Latn-1965
18
+ - source: 'Канюхі'
19
+ expected: 'Kanjuhi'
20
+ # "Kanyukhi" in GNDB `bel_Cyrl2Latn_GBO_1992`, but that is clearly bgnpcgn-ukr-Cyrl-Latn-1965
21
+
22
+ map:
23
+ inherit: gost-rus-Cyrl-Latn-16876-71-1983
24
+
25
+ characters:
26
+ '\u0406' : 'I' # І
27
+ '\u0456' : 'i' # і
28
+
29
+ '\u0413' : 'G' # Г
30
+ '\u0433' : 'g' # г
31
+
32
+ '\U040E' : 'Ŭ' # Ў
33
+ '\u045E' : 'ŭ' # ў
@@ -0,0 +1,201 @@
1
+ ---
2
+ authority_id: gki
3
+ id: 2000
4
+ language: iso-639-2:bel
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: On approval of the Instructions for the transliteration of geographical names of the Republic of Belarus with letters of the Latin alphabet
8
+ url: https://registr.by/doc/103003
9
+ creation_date: 2000
10
+ description: |
11
+ Act name:
12
+ On approval of the Instructions for the transliteration of geographical names of
13
+ the Republic of Belarus in letters of the Latin alphabet
14
+ Type of act, adoption authority, date and number of adoption (publication):
15
+ Resolution of the State Committee for Land Resources, Geodesy and Cartography of
16
+ the Republic of Belarus of November 23, 2000 No. 15
17
+ National Registry Registration Number: 8/4488
18
+ Date of inclusion in the National Register: 11/30/2000
19
+ Source (s) of official publication:
20
+ National Register of Legal Acts of the Republic of Belarus, 2001,
21
+ No. 3, 8/4488 (published - January 11, 2001)
22
+ tests:
23
+ - source: Аршанскi
24
+ expected: Aršanski
25
+ - source: Бешанковічы
26
+ expected: Biešankovičy
27
+ - source: Віцебск
28
+ expected: Viciebsk
29
+ - source: Гомель
30
+ expected: Homiel'
31
+ - source: Гаўя
32
+ expected: Haŭja
33
+ - source: Добруш
34
+ expected: Dobruš
35
+ - source: Ельск
36
+ expected: Jel'sk
37
+ - source: Бабаедава
38
+ expected: Babajedava
39
+ - source: Лепель
40
+ expected: Liepiel'
41
+ - source: Ёды
42
+ expected: Jody
43
+ - source: Вераб'ёвічы
44
+ expected: Vierabjovičy
45
+ - source: Мёры
46
+ expected: Miory
47
+ - source: Жодзiшкi
48
+ expected: Žodziški
49
+ - source: Зэльва
50
+ expected: Zel'va
51
+ - source: Iванава
52
+ expected: Ivanava
53
+ - source: Iўе
54
+ expected: Iŭje
55
+ - source: Лагойск
56
+ expected: Lahojsk
57
+ - source: Круглае
58
+ expected: Kruhlaje
59
+ - source: Любань
60
+ expected: Liuban'
61
+ - source: Магілёў
62
+ expected: Mahilioŭ
63
+ - source: Нясвіж
64
+ expected: Niasviž
65
+ - source: Орша
66
+ expected: Orša
67
+ - source: Паставы
68
+ expected: Pastavy
69
+ - source: Рагачоў
70
+ expected: Rahačoŭ
71
+ - source: Светлагорск
72
+ expected: Svietlahorsk # the original document has "Svetlahorsk", which looks like a mistake; see https://en.wikipedia.org/wiki/Svietlahorsk
73
+ - source: Талачын
74
+ expected: Talačyn
75
+ - source: Узда
76
+ expected: Uzda
77
+ - source: Шаркаўшчына
78
+ expected: Šarkaŭščyna
79
+ - source: Фаніпаль
80
+ expected: Fanipal'
81
+ - source: Хоцімск
82
+ expected: Chocimsk
83
+ - source: Цёмны Лес
84
+ expected: Ciomny Lies
85
+ - source: Чавусы
86
+ expected: Čavusy
87
+ - source: Шумілiна
88
+ expected: Šumilina
89
+ - source: Раз'езд
90
+ expected: Razjezd
91
+ - source: Чыгірынка
92
+ expected: Čyhirynka
93
+ - source: Чэрвень
94
+ expected: Červien'
95
+ - source: Чачэрск
96
+ expected: Čačersk
97
+ - source: Юхнаўка
98
+ expected: Juchnaŭka
99
+ - source: Гаюціна
100
+ expected: Hajucina
101
+ - source: Любонічы
102
+ expected: Liuboničy
103
+ - source: Ямнае
104
+ expected: Jamnaje
105
+ - source: Баяры
106
+ expected: Bajary
107
+ - source: Вязынка
108
+ expected: Viazynka
109
+ - source: Валяр'яны
110
+ expected: Valiarjany
111
+
112
+ map:
113
+ rules:
114
+ - pattern: (?<=[БбВвГгДдЖжЗзЙйКкЛлМмНнПпРрСсТтФфХхЦцЧчШш])\u0415 # Е after consonants
115
+ result: IE
116
+ - pattern: (?<=[БбВвГгДдЖжЗзЙйКкЛлМмНнПпРрСсТтФфХхЦцЧчШш])\u0435 # е after consonants
117
+ result: ie
118
+ - pattern: (?<=[БбВвГгДдЖжЗзЙйКкЛлМмНнПпРрСсТтФфХхЦцЧчШш])\u0401 # Ё after consonants
119
+ result: IO
120
+ - pattern: (?<=[БбВвГгДдЖжЗзЙйКкЛлМмНнПпРрСсТтФфХхЦцЧчШш])\u0451 # ё after consonants
121
+ result: io
122
+ - pattern: (?<=[БбВвГгДдЖжЗзЙйКкЛлМмНнПпРрСсТтФфХхЦцЧчШш])\u042E # Ю after consonants
123
+ result: IU
124
+ - pattern: (?<=[БбВвГгДдЖжЗзЙйКкЛлМмНнПпРрСсТтФфХхЦцЧчШш])\u044E # ю after consonants
125
+ result: iu
126
+ - pattern: (?<=[БбВвГгДдЖжЗзЙйКкЛлМмНнПпРрСсТтФфХхЦцЧчШш])\u042F # Я after consonants
127
+ result: IA
128
+ - pattern: (?<=[БбВвГгДдЖжЗзЙйКкЛлМмНнПпРрСсТтФфХхЦцЧчШш])\u044F # я after consonants
129
+ result: ia
130
+ postrules:
131
+ - pattern: '\u042C' # Ь
132
+ result: "'"
133
+ - pattern: '\u044C' # ь
134
+ result: "'"
135
+
136
+ characters:
137
+ '\u0027' : '' # '
138
+
139
+ '\u0410' : 'A' # A
140
+ '\u0411' : 'B' # Б
141
+ '\u0412' : 'V' # B
142
+ '\u0413' : 'H' # Г
143
+ '\u0414' : 'D' # Д
144
+ '\u0415' : 'Je' # Е
145
+ '\u0401' : 'Jo' # Ё
146
+ '\u0416' : 'Ž' # Ж
147
+ '\u0417' : 'Z' # З
148
+ '\u0406' : 'I' # І
149
+ '\u0419' : 'J' # Й
150
+ '\u041A' : 'K' # К
151
+ '\u041B' : 'L' # Л
152
+ '\u041C' : 'M' # М
153
+ '\u041D' : 'N' # Н
154
+ '\u041E' : 'O' # О
155
+ '\u041F' : 'P' # П
156
+ '\u0420' : 'R' # Р
157
+ '\u0421' : 'S' # С
158
+ '\u0422' : 'T' # Т
159
+ '\u0423' : 'U' # У
160
+ '\U040E' : 'Ŭ' # Ў
161
+ '\u0424' : 'F' # Ф
162
+ '\u0425' : 'Ch' # Х
163
+ '\u0426' : 'C' # Ц
164
+ '\u0427' : 'Č' # Ч
165
+ '\u0428' : 'Š' # Ш
166
+ '\u042B' : 'Y' # Ы
167
+ '\u042D' : 'E' # Э
168
+ '\u042E' : 'Ju' # Ю
169
+ '\u042F' : 'Ja' # Я
170
+
171
+ '\u0430' : 'a' # а
172
+ '\u0431' : 'b' # б
173
+ '\u0432' : 'v' # в
174
+ '\u0433' : 'h' # г
175
+ '\u0434' : 'd' # д
176
+ '\u0435' : 'je' # е
177
+ '\u0451' : 'jo' # ё
178
+ '\u0436' : 'ž' # ж
179
+ '\u0437' : 'z' # з
180
+ '\u0456' : 'i' # і
181
+ '\u0439' : 'j' # й
182
+ '\u043A' : 'k' # к
183
+ '\u043B' : 'l' # л
184
+ '\u043C' : 'm' # м
185
+ '\u043D' : 'n' # н
186
+ '\u043E' : 'o' # о
187
+ '\u043F' : 'p' # п
188
+ '\u0440' : 'r' # р
189
+ '\u0441' : 's' # с
190
+ '\u0442' : 't' # т
191
+ '\u0443' : 'u' # у
192
+ '\u045E' : 'ŭ' # ў
193
+ '\u0444' : 'f' # ф
194
+ '\u0445' : 'ch' # х
195
+ '\u0446' : 'c' # ц
196
+ '\u0447' : 'č' # ч
197
+ '\u0448' : 'š' # ш
198
+ '\u044B' : 'y' # ы
199
+ '\u044D' : 'e' # э
200
+ '\u044E' : 'ju' # ю
201
+ '\u044F' : 'ja' # я
@@ -0,0 +1,190 @@
1
+ ---
2
+ authority_id: gost
3
+ id: 1983
4
+ language: iso-639-2:rus
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: LETTERS TRANSLATION RULES OF KIRILLOVSKY ALPHABET WITH LETTERS OF LATIN ALPHABET GOST 16876-71
8
+ alias:
9
+ ogc11122:
10
+ code: rus_Cyrl2Latn_GOST_1983
11
+ description: Russian GOST 1983 System, Main Administration of Geodesy and Cartography of the Former Soviet Union
12
+ url: https://unstats.un.org/unsd/geoinfo/UNGEGN/docs/7th-uncsgn-docs/econf/7th_UNCSGN_econf.91_3_Add1.pdf
13
+ creation_date: 1978
14
+ confirmation_date: 1982-04-16
15
+ adoption_date: 1983-05-13
16
+ description: |
17
+ GOST 16876-71 (Russian: ГОСТ 16876-71) is a romanization system (for transliteration of Russian Cyrillic alphabet texts into the Latin alphabet)
18
+ devised by the National Administration for Geodesy and Cartography of the Soviet Union.
19
+ It is based on the scientific transliteration system used in linguistics.
20
+ GOST was an international standard so it included provision for a number of the languages
21
+ of the Soviet Union.
22
+
23
+ GOST 16876-71 was used by the United Nations to develop its romanization system for geographical names,
24
+ which was adopted for official use by the United Nations at the Fifth United Nations Conference
25
+ on the Standardization of Geographical Names in Montreal, Quebec, Canada, in 1987.
26
+ The UN system relies on diacritics to compensate for non-Russian Cyrillic alphabets.
27
+
28
+ In 1978, COMECON adopted GOST 16876-71 with minor modifications as its official transliteration standard,
29
+ under the name of SEV 1362-78 (Russian: СЭВ 1362-78).
30
+
31
+ In 1982, in accordance with Order No. 169 of April 16, 1982, GOST 16876-71 / ST SEV 1362-78 was put into effect on May 1, 1982.
32
+
33
+ In 1983, in accordance with Order No. 231 of May 16, 1983, additional guidelines were released (check notes[2])
34
+
35
+ In 2002, the Russian Federation along with a number of CIS countries abandoned the use of GOST 16876
36
+ in favor of ISO 9:1995, which was adopted as GOST 7.79-2000.
37
+
38
+ notes:
39
+ - http://vsegost.com/Catalog/45/45002.shtml - original GOST
40
+ - https://rosreestr.ru/upload/documenty/doc_169.doc - orders for entry into force (with changes)
41
+
42
+ tests:
43
+ - source: Анапа
44
+ expected: Anapa
45
+ - source: Бабушкин
46
+ expected: Babuškin
47
+ - source: Вавилово
48
+ expected: Vavilovo
49
+ - source: Гагарин
50
+ expected: Gagarin
51
+ - source: Дудинка
52
+ expected: Dudinka
53
+ - source: Елисеевка
54
+ expected: Eliseevka
55
+ - source: Ёлкино
56
+ expected: Ëlkino
57
+ - source: Псёл
58
+ expected: Psël
59
+ - source: Жужа
60
+ expected: Žuža
61
+ - source: Звёздный
62
+ expected: Zvëzdnyj
63
+ - source: Идрица
64
+ expected: Idrica
65
+ - source: Зарайск
66
+ expected: Zarajsk
67
+ - source: Коканд
68
+ expected: Kokand
69
+ - source: Лалвар
70
+ expected: Lalvar
71
+ - source: Маймак
72
+ expected: Majmak
73
+ - source: Нежин
74
+ expected: Nežin
75
+ - source: Ободовка
76
+ expected: Obodovka
77
+ - source: Пап
78
+ expected: Pap
79
+ - source: Ребриха
80
+ expected: Rebriha
81
+ - source: Сасово
82
+ expected: Sasovo
83
+ - source: Татта
84
+ expected: Tatta
85
+ - source: Уржум
86
+ expected: Uržum
87
+ - source: Фофаново
88
+ expected: Fofanovo
89
+ - source: Хохлома
90
+ expected: Hohloma
91
+ - source: Цветково
92
+ expected: Cvetkovo
93
+ - source: Чечельник
94
+ expected: Čečel´nik
95
+ - source: Шишкино
96
+ expected: Šiškino
97
+ - source: Щукино
98
+ expected: Ščukino
99
+ - source: Подъячево
100
+ expected: Pod"jačevo
101
+ - source: Ыныкчанский
102
+ expected: Ynykčanskij
103
+ - source: Параньга
104
+ expected: Paran´ga
105
+ - source: Щучье
106
+ expected: Ščuč´e
107
+ - source: Элиста
108
+ expected: Èlista
109
+ - source: Юрино
110
+ expected: Jurino
111
+ - source: Юхнов
112
+ expected: Juhnov
113
+ - source: Юрюзань
114
+ expected: Jurjuzan´
115
+ - source: Ямал
116
+ expected: Jamal
117
+ - source: Язъяван
118
+ expected: Jaz"javan
119
+ - source: Яя
120
+ expected: Jaja
121
+
122
+ map:
123
+ characters:
124
+ '\u0410' : 'A' # A
125
+ '\u0411' : 'B' # Б
126
+ '\u0412' : 'V' # B
127
+ '\u0413' : 'G' # Г
128
+ '\u0414' : 'D' # Д
129
+ '\u0415' : 'E' # Е
130
+ '\u0401' : "\u00CB" # Ё
131
+ '\u0416' : 'Ž' # Ж
132
+ '\u0417' : 'Z' # З
133
+ '\u0418' : "I" # И
134
+ '\u0419' : 'J' # Й
135
+ '\u041A' : 'K' # К
136
+ '\u041B' : 'L' # Л
137
+ '\u041C' : 'M' # М
138
+ '\u041D' : 'N' # Н
139
+ '\u041E' : 'O' # О
140
+ '\u041F' : 'P' # П
141
+ '\u0420' : 'R' # Р
142
+ '\u0421' : 'S' # С
143
+ '\u0422' : 'T' # Т
144
+ '\u0423' : 'U' # У
145
+ '\u0424' : 'F' # Ф
146
+ '\u0425' : 'H' # Х
147
+ '\u0426' : 'C' # Ц
148
+ '\u0427' : 'Č' # Ч
149
+ '\u0428' : 'Š' # Ш
150
+ '\u0429' : 'Šč' # Щ
151
+ '\u042a' : '"' # Ъ
152
+ '\u042B' : 'Y' # Ы
153
+ '\u042C' : "\u00B4" # Ь => ´
154
+ '\u042D' : "E\u0300" # Э => È
155
+ '\u042E' : 'Ju' # Ю
156
+ '\u042F' : 'Ja' # Я
157
+
158
+ '\u0430' : 'a' # а
159
+ '\u0431' : 'b' # б
160
+ '\u0432' : 'v' # в
161
+ '\u0433' : 'g' # г
162
+ '\u0434' : 'd' # д
163
+ '\u0435' : 'e' # е
164
+ '\u0451' : "\u00EB" # ё
165
+ '\u0436' : 'ž' # ж
166
+ '\u0437' : 'z' # з
167
+ '\u0438' : 'i' # и
168
+ '\u0439' : 'j' # й
169
+ '\u043A' : 'k' # к
170
+ '\u043B' : 'l' # л
171
+ '\u043C' : 'm' # м
172
+ '\u043D' : 'n' # н
173
+ '\u043E' : 'o' # о
174
+ '\u043F' : 'p' # п
175
+ '\u0440' : 'r' # р
176
+ '\u0441' : 's' # с
177
+ '\u0442' : 't' # т
178
+ '\u0443' : 'u' # у
179
+ '\u0444' : 'f' # ф
180
+ '\u0445' : 'h' # х
181
+ '\u0446' : 'c' # ц
182
+ '\u0447' : 'č' # ч
183
+ '\u0448' : 'š' # ш
184
+ '\u0449' : 'šč' # щ
185
+ '\u044A' : '"' # ъ
186
+ '\u044B' : 'y' # ы
187
+ '\u044C' : "\u00B4" # ь => ´
188
+ '\u044D' : "e\u0300" # э => è
189
+ '\u044E' : 'ju' # ю
190
+ '\u044F' : 'ja' # я