interscript 0.1.2 → 0.1.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (261) hide show
  1. checksums.yaml +4 -4
  2. data/README.adoc +250 -17
  3. data/lib/g2pwrapper.py +34 -0
  4. data/lib/interscript.rb +142 -20
  5. data/lib/interscript/command.rb +28 -0
  6. data/lib/interscript/fs.rb +69 -0
  7. data/lib/interscript/mapping.rb +142 -0
  8. data/lib/interscript/opal.rb +57 -0
  9. data/lib/interscript/opal/entrypoint.rb +12 -0
  10. data/lib/interscript/opal/map_translate.rb +7 -0
  11. data/lib/interscript/opal/maps.js.erb +10 -0
  12. data/lib/interscript/version.rb +1 -1
  13. data/lib/model-7 +0 -0
  14. data/lib/tha-pt-b-7 +0 -0
  15. data/maps/acadsin-zho-Hani-Latn-2002.yaml +38916 -0
  16. data/maps/alalc-amh-Ethi-Latn-1997.yaml +513 -0
  17. data/maps/alalc-amh-Ethi-Latn-2011.yaml +138 -0
  18. data/maps/alalc-ara-Arab-Latn-1997.yaml +1287 -0
  19. data/maps/alalc-asm-Deva-Latn-1997.yaml +165 -0
  20. data/maps/alalc-asm-Deva-Latn-2012.yaml +40 -0
  21. data/maps/alalc-aze-Cyrl-Latn-1997.yaml +145 -0
  22. data/maps/alalc-bel-Cyrl-Latn-1997.yaml +129 -0
  23. data/maps/alalc-ben-Beng-Latn-2017.yaml +130 -0
  24. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +98 -0
  25. data/maps/alalc-ell-Grek-Latn-1997.yaml +628 -0
  26. data/maps/alalc-ell-Grek-Latn-2010.yaml +626 -0
  27. data/maps/alalc-guj-Gujr-Latn-1997.yaml +266 -0
  28. data/maps/alalc-guj-Gujr-Latn-2011.yaml +64 -0
  29. data/maps/alalc-hin-Deva-Latn-1997.yaml +211 -0
  30. data/maps/alalc-hin-Deva-Latn-2011.yaml +47 -0
  31. data/maps/alalc-kat-Geok-Latn-1997.yaml +111 -0
  32. data/maps/alalc-kat-Geor-Latn-1997.yaml +150 -0
  33. data/maps/alalc-kor-Hang-Latn-1997.yaml +98 -0
  34. data/maps/alalc-mal-Mlym-Latn-1997.yaml +303 -0
  35. data/maps/alalc-mal-Mlym-Latn-2012.yaml +73 -0
  36. data/maps/alalc-mar-Deva-Latn-1997.yaml +189 -0
  37. data/maps/alalc-mar-Deva-Latn-2011.yaml +45 -0
  38. data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +114 -0
  39. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +103 -0
  40. data/maps/alalc-mon-Cyrl-Latn-1997.yaml +220 -0
  41. data/maps/alalc-pan-Guru-Latn-1997.yaml +256 -0
  42. data/maps/alalc-pan-Guru-Latn-2011.yaml +78 -0
  43. data/maps/alalc-per-Arab-Latn-1997.yaml +375 -0
  44. data/maps/alalc-pli-Deva-Latn-2012.yaml +144 -0
  45. data/maps/alalc-pra-Deva-Latn-2012.yaml +47 -0
  46. data/maps/alalc-rus-Cyrl-Latn-1997.yaml +225 -0
  47. data/maps/alalc-rus-Cyrl-Latn-2012.yaml +162 -0
  48. data/maps/alalc-san-Deva-Latn-2012.yaml +172 -0
  49. data/maps/alalc-sin-Sinh-Latn-1997.yaml +292 -0
  50. data/maps/alalc-sin-Sinh-Latn-2011.yaml +71 -0
  51. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +118 -0
  52. data/maps/alalc-srp-Cyrl-Latn-2013.yaml +135 -0
  53. data/maps/alalc-tam-Taml-Latn-1997.yaml +62 -0
  54. data/maps/alalc-tam-Taml-Latn-2011.yaml +58 -0
  55. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +145 -0
  56. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +16 -0
  57. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +283 -0
  58. data/maps/{bas-rus-Cyrl-Latn-bss.yaml → bas-rus-Cyrl-Latn-2017-bss.yaml} +58 -33
  59. data/maps/{bas-rus-Cyrl-Latn-oss.yaml → bas-rus-Cyrl-Latn-2017-oss.yaml} +55 -35
  60. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +292 -0
  61. data/maps/bgn-kor-Hang-Latn-1943.yaml +35 -0
  62. data/maps/bgn-kor-Kore-Latn-1943.yaml +31 -0
  63. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +208 -0
  64. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +208 -0
  65. data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +532 -0
  66. data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +596 -0
  67. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +2 -3
  68. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +104 -0
  69. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +188 -0
  70. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +289 -0
  71. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +119 -0
  72. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +15 -65
  73. data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +184 -0
  74. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +705 -0
  75. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +23 -0
  76. data/maps/{bgnpcgn-per-Arab-Latn-1956.yaml → bgnpcgn-fas-Arab-Latn-1956.yaml} +5 -2
  77. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +257 -0
  78. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +131 -0
  79. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +42 -0
  80. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +253 -0
  81. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +48 -0
  82. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +48 -0
  83. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +163 -0
  84. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +190 -0
  85. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +223 -0
  86. data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +230 -0
  87. data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +336 -0
  88. data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +639 -0
  89. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +459 -0
  90. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +168 -0
  91. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +150 -65
  92. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +170 -0
  93. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +220 -0
  94. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +240 -0
  95. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +80 -4
  96. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +119 -0
  97. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +127 -0
  98. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +82 -0
  99. data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +7456 -0
  100. data/maps/bis-asm-Beng-Latn-13194-1991.yaml +159 -0
  101. data/maps/bis-ben-Beng-Latn-13194-1991.yaml +156 -0
  102. data/maps/bis-dev-Deva-Latn-13194-1991.yaml +184 -0
  103. data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +181 -0
  104. data/maps/bis-knd-Knda-Latn-13194-1991.yaml +173 -0
  105. data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +176 -0
  106. data/maps/bis-ori-Orya-Latn-13194-1991.yaml +160 -0
  107. data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +175 -0
  108. data/maps/bis-tel-Telu-Latn-13194-1991.yaml +170 -0
  109. data/maps/bis-tml-Taml-Latn-13194-1991.yaml +155 -0
  110. data/maps/by-bel-Cyrl-Latn-1998.yaml +172 -0
  111. data/maps/by-bel-Cyrl-Latn-2007.yaml +115 -0
  112. data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +899 -0
  113. data/maps/din-hin-Deva-Latn-33904-2018.yaml +100 -0
  114. data/maps/din-kat-Geor-Latn-32707-2010.yaml +145 -0
  115. data/maps/din-mar-Deva-Latn-33904-2018.yaml +84 -0
  116. data/maps/din-nep-Deva-Latn-33904-2018.yaml +119 -0
  117. data/maps/din-pli-Deva-Latn-33904-2018.yaml +75 -0
  118. data/maps/din-pra-Deva-Latn-33904-2018.yaml +63 -0
  119. data/maps/din-san-Deva-Latn-33904-2018.yaml +338 -0
  120. data/maps/din-tam-Taml-Latn-33903-2016.yaml +213 -0
  121. data/maps/dos-nep-Deva-Latn-1997.yaml +47 -0
  122. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +684 -0
  123. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +680 -0
  124. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +19 -0
  125. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +31 -0
  126. data/maps/ggg-kat-Geor-Latn-2002.yaml +92 -0
  127. data/maps/gki-bel-Cyrl-Latn-1992.yaml +33 -0
  128. data/maps/gki-bel-Cyrl-Latn-2000.yaml +201 -0
  129. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +190 -0
  130. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +157 -0
  131. data/maps/hk-yue-Hani-Latn-1888.yaml +38497 -0
  132. data/maps/icao-bel-Cyrl-Latn-9303.yaml +109 -98
  133. data/maps/icao-bul-Cyrl-Latn-9303.yaml +2 -7
  134. data/maps/{icao-per-Arab-Latn-9303.yaml → icao-fas-Arab-Latn-9303.yaml} +6 -8
  135. data/maps/icao-heb-Hebr-Latn-9303.yaml +119 -125
  136. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +2 -3
  137. data/maps/icao-rus-Cyrl-Latn-9303.yaml +2 -4
  138. data/maps/icao-srp-Cyrl-Latn-9303.yaml +2 -3
  139. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +2 -4
  140. data/maps/iso-ara-Arab-Latn-233-1984.yaml +323 -0
  141. data/maps/iso-asm-Beng-Latn-15919-2001.yaml +75 -0
  142. data/maps/iso-ben-Beng-Latn-15919-2001.yaml +175 -0
  143. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +613 -0
  144. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +44 -0
  145. data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +220 -0
  146. data/maps/iso-hin-Deva-Latn-15919-2001.yaml +87 -0
  147. data/maps/iso-inc-Deva-Latn-15919-2001.yaml +61 -0
  148. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +66 -0
  149. data/maps/iso-kan-Knda-Latn-15919-2001.yaml +220 -0
  150. data/maps/iso-kat-Geor-Latn-9984-1996.yaml +145 -0
  151. data/maps/iso-kor-Hang-Latn-1996-method1.yaml +240 -0
  152. data/maps/iso-kor-Hang-Latn-1996-method2.yaml +226 -0
  153. data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +281 -0
  154. data/maps/iso-mar-Deva-Latn-15919-2001.yaml +75 -0
  155. data/maps/iso-nep-Deva-Latn-15919-2001.yaml +87 -0
  156. data/maps/iso-ori-Orya-Latn-15919-2001.yaml +193 -0
  157. data/maps/iso-pan-Guru-Latn-15919-2001.yaml +222 -0
  158. data/maps/iso-pli-Beng-Latn-15919-2001.yaml +73 -0
  159. data/maps/iso-pli-Deva-Latn-15919-2001.yaml +74 -0
  160. data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +219 -0
  161. data/maps/iso-pli-Thai-Latn-15919-2001.yaml +55 -0
  162. data/maps/iso-pra-Deva-Latn-15919-2001.yaml +59 -0
  163. data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +366 -0
  164. data/maps/{iso-rus-Cyrl-Latn-iso9.yaml → iso-rus-Cyrl-Latn-9-1995.yaml} +4 -6
  165. data/maps/iso-san-Deva-Latn-15919-2001.yaml +220 -0
  166. data/maps/iso-tam-Taml-Latn-15919-2001.yaml +159 -0
  167. data/maps/iso-tel-Telu-Latn-15919-2001.yaml +220 -0
  168. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +109 -0
  169. data/maps/kp-kor-Hang-Latn-2002.yaml +909 -0
  170. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +44820 -0
  171. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +411 -0
  172. data/maps/mns-mon-Cyrl-Latn-5217-2012.yaml +163 -0
  173. data/maps/mns-mon-Latn-Cyrl-5217-2012.yaml +200 -0
  174. data/maps/moct-kor-Hang-Latn-2000.yaml +807 -0
  175. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +541 -0
  176. data/maps/mvd-bel-Cyrl-Latn-2008.yaml +225 -0
  177. data/maps/mvd-bel-Cyrl-Latn-2010.yaml +63 -0
  178. data/maps/mvd-rus-Cyrl-Latn-2008.yaml +109 -0
  179. data/maps/mvd-rus-Cyrl-Latn-2010.yaml +37 -0
  180. data/maps/odni-ara-Arab-Latn-2015.yaml +425 -0
  181. data/maps/odni-aze-Cyrl-Latn-2015.yaml +144 -0
  182. data/maps/odni-bel-Cyrl-Latn-2015.yaml +148 -0
  183. data/maps/odni-bul-Cyrl-Latn-2015.yaml +96 -0
  184. data/maps/odni-che-Cyrl-Latn-2015.yaml +169 -0
  185. data/maps/odni-fas-Arab-Latn-2015.yaml +406 -0
  186. data/maps/odni-hin-Deva-Latn-2015.yaml +258 -0
  187. data/maps/odni-kat-Geor-Latn-2015.yaml +87 -0
  188. data/maps/odni-kaz-Cyrl-Latn-2015.yaml +148 -0
  189. data/maps/odni-kir-Cyrl-Latn-2015.yaml +136 -0
  190. data/maps/odni-kor-Hang-Latn-2015.yaml +375 -0
  191. data/maps/odni-mkd-Cyrl-Latn-2015.yaml +122 -0
  192. data/maps/odni-per-Arab-Latn-2015.yaml +228 -0
  193. data/maps/odni-rus-Cyrl-Latn-2015.yaml +77 -0
  194. data/maps/odni-srp-Cyrl-Latn-2015.yaml +129 -0
  195. data/maps/odni-tat-Cyrl-Latn-2015.yaml +142 -0
  196. data/maps/odni-tgk-Cyrl-Latn-2015.yaml +148 -0
  197. data/maps/odni-uig-Cyrl-Latn-2015.yaml +138 -0
  198. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +157 -0
  199. data/maps/odni-urd-Arab-Latn-2015.yaml +221 -0
  200. data/maps/odni-uzb-Cyrl-Latn-2015.yaml +166 -0
  201. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +90 -0
  202. data/maps/royin-tha-Thai-Latn-1968.yaml +183 -0
  203. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +180 -0
  204. data/maps/royin-tha-Thai-Latn-1999.yaml +80 -0
  205. data/maps/{cn-chn-Hans-Latn-pinyin.yaml → sac-zho-Hans-Latn-1979.yaml} +11 -8
  206. data/maps/sasm-mon-Mong-Latn-general-1978.yaml +389 -0
  207. data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +354 -0
  208. data/maps/ses-ara-Arab-Latn-1930.yaml +283 -0
  209. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +222 -0
  210. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +197 -0
  211. data/maps/ua-ukr-Cyrl-Latn-2007.yaml +75 -0
  212. data/maps/ua-ukr-Cyrl-Latn-2010.yaml +192 -0
  213. data/maps/un-amh-Ethi-Latn-2016.yaml +602 -0
  214. data/maps/un-ara-Arab-Latn-1971.yaml +139 -0
  215. data/maps/un-ara-Arab-Latn-1972.yaml +159 -0
  216. data/maps/un-ara-Arab-Latn-2017.yaml +420 -0
  217. data/maps/un-bel-Cyrl-Latn-2007.yaml +114 -0
  218. data/maps/un-ben-Beng-Latn-2016.yaml +534 -0
  219. data/maps/un-ell-Grek-Latn-1987-phonetic.yaml +780 -0
  220. data/maps/un-ell-Grek-Latn-1987-tl.yaml +31 -0
  221. data/maps/un-ell-Grek-Latn-1987-ts.yaml +19 -0
  222. data/maps/un-hin-Deva-Latn-2016.yaml +222 -0
  223. data/maps/un-mar-Deva-Latn-2016.yaml +91 -0
  224. data/maps/un-mon-Mong-Latn-general-2013.yaml +264 -0
  225. data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +264 -0
  226. data/maps/un-nep-Deva-Latn-1972.yaml +350 -0
  227. data/maps/un-nep-Deva-Latn-2013.yaml +74 -0
  228. data/maps/un-rus-Cyrl-Latn-1987.yaml +166 -0
  229. data/maps/un-ukr-Cyrl-Latn-1998.yaml +53 -0
  230. data/maps/un-ukr-Cyrl-Latn-2012.yaml +162 -0
  231. data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +221 -0
  232. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +406 -0
  233. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +386 -0
  234. data/maps/var-kor-Hang-Hang-jamo.yaml +11193 -0
  235. data/maps/var-kor-Hang-Latn-mr-1939.yaml +1054 -0
  236. data/maps/var-kor-Kore-Hang-2013.yaml +59754 -0
  237. data/maps/var-kor-Kore-Latn-mr-1939.yaml +36 -0
  238. data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +43 -0
  239. data/maps/var-mon-Mong-Latn-1930.yaml +102 -0
  240. data/maps/var-mon-Mong-Latn-lessing.yaml +272 -0
  241. data/maps/var-mon-Mong-Latn-vpmc.yaml +274 -0
  242. data/maps/var-pra-Deva-Latn-iast-1912.yaml +30 -0
  243. data/maps/var-san-Deva-Latn-iast-1912.yaml +149 -0
  244. data/maps/var-tha-Thai-Thai-phonemic.yaml +59 -0
  245. data/maps/var-tha-Thai-Zsym-ipa.yaml +301 -0
  246. data/maps/var-zho-Hani-Latn-wd-1979.yaml +38912 -0
  247. data/spec/interscript/filenames_spec.rb +384 -0
  248. data/spec/interscript/mapping_spec.rb +42 -0
  249. data/spec/interscript_spec.rb +23 -5
  250. data/spec/spec_helper.rb +3 -1
  251. metadata +364 -34
  252. data/bin/interscript +0 -20
  253. data/bin/rspec +0 -29
  254. data/maps/bgnpcgn-chn-Hans-Latn-pinyin.yaml +0 -7503
  255. data/maps/historic-jpn-Hrkt-Latn-hepburn.yaml +0 -336
  256. data/maps/icao-gre-Grek-Latn-9303.yaml +0 -101
  257. data/maps/mext-jpn-Hrkt-Latn-hepburn.yaml +0 -330
  258. data/maps/mext-jpn-Hrkt-Latn-kunrei.yaml +0 -308
  259. data/maps/un-jpn-Hrkt-Latn-hepburn.yaml +0 -313
  260. data/maps/un-jpn-Hrkt-Latn-kunrei.yaml +0 -354
  261. data/maps/un-mon-Mong-Latn-2013.yaml +0 -80
@@ -0,0 +1,23 @@
1
+ ---
2
+ authority_id: bgnpcgn
3
+ id: 1996
4
+ language: iso-639-2:ell
5
+ source_script: Grek
6
+ destination_script: Latn
7
+ name: BGN/PCGN 1996 System
8
+ alias:
9
+ ogc11122:
10
+ code: ell_Grek2Latn_ELOT743_1996
11
+ description: Greek ELOT 743 System, US Board on Geographic Names(BGN)/Permanent Committee on Geographical Names for British Official Use(PCGN) 1996 agreement
12
+ url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/693694/ROMANIZATION_OF_GREEK.pdf
13
+ creation_date: 1996
14
+ description: |
15
+ BGN/PCGN Romanization table for Greek
16
+
17
+ notes:
18
+ - Identical to ELOT 743:1982, which is also adopted as ISO 843:1997 and by UNGEGN
19
+
20
+ map:
21
+ character_separator: ""
22
+ word_separator: " "
23
+ inherit: "elot-ell-Grek-Latn-743-1982-ts"
@@ -3,10 +3,14 @@
3
3
  # TODO: Add tests from PDF
4
4
  authority_id: bgnpcgn
5
5
  id: 1956
6
- language: per
6
+ language: iso-639-2:fas
7
7
  source_script: Arab
8
8
  destination_script: Latn
9
9
  name: BGN/PCGN 1956 System
10
+ alias:
11
+ ogc11122:
12
+ code: fas_Arab2Latn_BGN_1958
13
+ description: Persian (Afghan and Iranian) BGN/Permanent Committee on Geographical Names for British Official Use(PCGN) 1958 System
10
14
  url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/320079/Arabic_Romanization.pdf
11
15
  creation_date: 1947
12
16
  confirmation_date: 2019-06
@@ -90,4 +94,3 @@ map:
90
94
  '\u0647' : 'h'
91
95
  '\u0648' : 'v'
92
96
  '\u0649' : 'y'
93
-
@@ -0,0 +1,257 @@
1
+ ---
2
+ authority_id: bgnpcgn
3
+ id: 1930
4
+ language: iso-639-2:jpn
5
+ source_script: Hrkt
6
+ destination_script: Latn
7
+ name: Japanese Kana Modified Hepburn 1930 System
8
+ url:
9
+ creation_date:
10
+ adoption_date:
11
+ description:
12
+
13
+ notes:
14
+ - Segmentation needs to be done before using this map
15
+ - Note 5 in the specification states that when identical repeating vowels
16
+ belong to different kanji characters, they shall be romanized
17
+ individually and an apostrophe (’) shall be placed between the vowels.
18
+ However since this is a map from Kana to Hepburn, there is no way to
19
+ implement this feature.
20
+ - The documentation did not specify how the hyphen should be used.
21
+
22
+ tests:
23
+
24
+ - source: てがた-からみでん
25
+ expected: "Tegata-karamiden"
26
+ - source: てがた-すみよしちょう
27
+ expected: "Tegata-sumiyoshichō"
28
+ - source: さいのはま
29
+ expected: "Sainohama"
30
+ - source: てがた-たなか
31
+ expected: "Tegata-tanaka"
32
+ - source: ほりおでん
33
+ expected: "Horioden"
34
+ - source: そえがわ
35
+ expected: "Soegawa"
36
+ - source: ふねがさわ
37
+ expected: "Funegasawa"
38
+ - source: とくまんだて
39
+ expected: "Tokumandate"
40
+ - source: たてない
41
+ expected: "Tatenai"
42
+ - source: つるがさき
43
+ expected: "Tsurugasaki"
44
+ - source: しもやつせ
45
+ expected: "Shimoyatsuse"
46
+ - source: かみやつせ
47
+ expected: "Kamiyatsuse"
48
+ - source: しんとうだ
49
+ expected: "Shintōda"
50
+ - source: かじのめ
51
+ expected: "Kajinome"
52
+ - source: まえぎ
53
+ expected: "Maegi"
54
+ - source: くろさわ やま
55
+ expected: "Kurosawa Yama"
56
+ - source: いちのさわ がわ
57
+ expected: "Ichinosawa Gawa"
58
+ - source: はちやまえ
59
+ expected: "Hachiyamae"
60
+ - source: やち
61
+ expected: "Yachi"
62
+ - source: たてぬま
63
+ expected: "Tatenuma"
64
+ - source: しらはま
65
+ expected: "Shirahama"
66
+ - source: けせんまち
67
+ expected: "Kesenmachi"
68
+ - source: けいだい-かわら
69
+ expected: "Keidai-kawara"
70
+ - source: いしやました
71
+ expected: "Ishiyamashita"
72
+ - source: なえひら-やち
73
+ expected: "Naehira-yachi"
74
+ - source: とみの
75
+ expected: "Tomino"
76
+ - source: あらや-たかみまち
77
+ expected: "Araya-takamimachi"
78
+ - source: ながた
79
+ expected: "Nagata"
80
+ - source: とどろき おんせん
81
+ expected: "Todoroki Onsen"
82
+ - source: かしわぎはら
83
+ expected: "Kashiwagihara"
84
+ - source: とやけもり やま
85
+ expected: "Toyakemori Yama"
86
+ - source: なかさい
87
+ expected: "Nakasai"
88
+ - source: たけした
89
+ expected: "Takeshita"
90
+ - source: みと
91
+ expected: "Mito"
92
+ - source: みなみなかさと
93
+ expected: "Minaminakasato"
94
+ - source: みずおし
95
+ expected: "Mizuoshi"
96
+ - source: なかさと
97
+ expected: "Nakasato"
98
+ - source: しんかりば
99
+ expected: "Shinkariba"
100
+ - source: しんかみぬま
101
+ expected: "Shinkaminuma"
102
+ - source: しんばし
103
+ expected: "Shinbashi"
104
+ - source: りくぜんやました えき
105
+ expected: "Rikuzen’yamashita Eki"
106
+ - source: うしじまにし
107
+ expected: "Ushijimanishi"
108
+ - source: はまえば
109
+ expected: "Hamaeba"
110
+ - source: ぬまむかい
111
+ expected: "Numamukai"
112
+ - source: さんげんやち
113
+ expected: "Sangen’yachi"
114
+ - source: にけんやち
115
+ expected: "Niken’yachi"
116
+ - source: やちなか
117
+ expected: "Yachinaka"
118
+ - source: なす がわ
119
+ expected: "Nasu Gawa"
120
+ - source: おおはらはま
121
+ expected: "Ōharahama"
122
+ - source: うるご がわ
123
+ expected: "Urugo Gawa"
124
+ - source: なかばせ
125
+ expected: "Nakabase"
126
+ - source: うと えき
127
+ expected: "Uto Eki"
128
+ - source: みずまち
129
+ expected: "Mizumachi"
130
+ - source: ごんげんどう
131
+ expected: "Gongendō"
132
+ - source: いとひさ
133
+ expected: "Itohisa"
134
+ - source: あらおい
135
+ expected: "Araoi"
136
+ - source: わんめ
137
+ expected: "Wanme"
138
+ - source: かじろ
139
+ expected: "Kajiro"
140
+ - source: みやばら
141
+ expected: "Miyabara"
142
+ - source: いまどみ
143
+ expected: "Imadomi"
144
+ - source: かいほ
145
+ expected: "Kaiho"
146
+ - source: かいほ ぼえん
147
+ expected: "Kaiho Boen"
148
+ - source: ひきだ
149
+ expected: "Hikida"
150
+ - source: あさい-こむかい
151
+ expected: "Asai-komukai"
152
+ - source: こうざか
153
+ expected: "Kōzaka"
154
+ - source: こうふうだい
155
+ expected: "Kōfūdai"
156
+ - source: たての
157
+ expected: "Tateno"
158
+ - source: センター
159
+ expected: "Sentā"
160
+ - source: フィリピン
161
+ expected: "Firipin"
162
+ - source: ヴィオリン
163
+ expected: "Viorin"
164
+ - source: クォーター
165
+ expected: "Kwōtā"
166
+ - source: パッチリ
167
+ expected: "Patchiri"
168
+ - source: ぽっぽっや
169
+ expected: "Poppoyya"
170
+
171
+ map:
172
+ character_separator: ""
173
+ word_separator: " "
174
+ title_case: True
175
+ inherit: var-jpn-Hrkt-Latn-hepburn-1954
176
+
177
+ characters:
178
+ # Rare sounds, Table 2 & 4
179
+
180
+ "くぁ": "kwa"
181
+ "クァ": "kwa"
182
+ "ぐぁ": "gwa"
183
+ "グァ": "gwa"
184
+ "くぃ": "kwi"
185
+ "クィ": "kwi"
186
+ "ぐぃ": "gwi"
187
+ "グィ": "gwi"
188
+ "きぇ": "kye"
189
+ "キェ": "kye"
190
+ "ぎぇ": "gye"
191
+ "ギェ": "gye"
192
+ "くぇ": "kwe"
193
+ "クェ": "kwe"
194
+ "ぐぇ": "gwe"
195
+ "グェ": "gwe"
196
+ "くぉ": "kwo"
197
+ "クォ": "kwo"
198
+ "ぐぉ": "gwo"
199
+ "グォ": "gwo"
200
+ "しぇ": "she"
201
+ "シェ": "she"
202
+ "じぇ": "je"
203
+ "ジェ": "je"
204
+ "つぁ": "tsa"
205
+ "ツァ": "tsa"
206
+ "てぃ": "ti"
207
+ "ティ": "ti"
208
+ "でぃ": "di"
209
+ "ディ": "di"
210
+ "てゅ": "tyu"
211
+ "テュ": "tyu"
212
+ "でゅ": "dyu"
213
+ "デュ": "dyu"
214
+ "とゅ": "tu"
215
+ "トュ": "tu"
216
+ "どゅ": "du"
217
+ "ドュ": "du"
218
+ "ちぇ": "che"
219
+ "チェ": "che"
220
+ "ぢぇ": "je"
221
+ "ヂェ": "je"
222
+ "つぇ": "tse"
223
+ "ツェ": "tse"
224
+ "つぉ": "tso"
225
+ "ツォ": "tso"
226
+ "にぇ": "nye"
227
+ "ニェ": "nye"
228
+ "ふぁ": "fa"
229
+ "ファ": "fa"
230
+ "ふぃ": "fi"
231
+ "フィ": "fi"
232
+ "ふぇ": "fe"
233
+ "フェ": "fe"
234
+ "ふぉ": "fo"
235
+ "フォ": "fo"
236
+ "みぇ": "mye"
237
+ "ミェ": "mye"
238
+ "ぃぇ": "ye"
239
+ "ィェ": "ye"
240
+ "りぇ": "rye"
241
+ "リェ": "rye"
242
+ "ゔぁ": "va"
243
+ "ヴァ": "va"
244
+ "うぃ": "wi"
245
+ "ウィ": "wi"
246
+ "ゔぃ": "vi"
247
+ "ヴィ": "vi"
248
+ "うぇ": "we"
249
+ "ウェ": "we"
250
+ "ゔぇ": "ve"
251
+ "ヴェ": "ve"
252
+ "うぉ": "wo"
253
+ "ウォ": "wo"
254
+ "ゔぉ": "vo"
255
+ "ヴォ": "vo"
256
+ "ゔ": "vu"
257
+ "ヴ": "vu"
@@ -0,0 +1,131 @@
1
+ ---
2
+ authority_id: bgnpcgn
3
+ id: 1981
4
+ language: iso-639-2:kat
5
+ source_script: Geor
6
+ destination_script: Latn
7
+ name: ROMANIZATION OF GEORGIAN; BGN/PCGN 1981 System
8
+ alias:
9
+ ogc11122:
10
+ code: kat_Geor2Latn_BGN_1981
11
+ description: Georgian US Board on Geographic Names(BGN)/Permanent Committee on Geographical Names for British Official Use(PCGN) 1981 System
12
+ url: https://transliteration.eki.ee/pdf/Georgian.pdf
13
+ creation_date: 1981
14
+ confirmation_date: 1981
15
+ description: |
16
+ BGN/PCGN system of 1981.
17
+
18
+ notes:
19
+
20
+ tests:
21
+ - source: ჰებუდი
22
+ expected: hebudi
23
+
24
+ - source: ჯვრის წყალსაცავი
25
+ expected: jvris tsqalsats’avi
26
+
27
+ - source: ჯვავიაკვარა
28
+ expected: jvaviak’vara
29
+
30
+ - source: ჯობრია
31
+ expected: jobria
32
+
33
+ - source: ძულუხირა
34
+ expected: dzulukhira
35
+
36
+ - source: ლეკუხონა
37
+ expected: lek’ukhona
38
+
39
+ - source: აბაშა
40
+ expected: abasha
41
+
42
+ - source: ააცი
43
+ expected: aats’i
44
+
45
+ # TODO: This belongs to which system?!
46
+ # - source: აბააჟახვუ
47
+ # expected: abaazhvakhu
48
+
49
+ # TODO: These examples from GNDB are clearly using the BGNPCGN 2009 system
50
+ #
51
+ # - source: ხობის მუნიციპალიტეტი
52
+ # expected: khobis munitsip’alit’et’i
53
+ #
54
+ # - source: მყინვარი ჩრდილოეთი ლეადაშატი
55
+ # expected: mq’invari chrdiloeti leadashat’i
56
+ #
57
+ # - source: ხეწკვარა
58
+ # expected: khets’k’vara
59
+ #
60
+ # - source: ჯამპალი
61
+ # expected: jamp’ali
62
+ #
63
+ # - source: ჯავის მუნიციპალიტეტი
64
+ # expected: javis munitsip’alit’et’i
65
+ #
66
+ # - source: ხოიჯგეთა
67
+ # expected: khoijgeta
68
+ #
69
+ # - source: ხობის მუნიციპალიტეტი
70
+ # expected: khobis munitsip’alit’et’i
71
+ #
72
+ # - source: წვიშარხუ
73
+ # expected: ts’visharkhu
74
+ # - source: აღმოსავლეთი გუმისთა
75
+ # expected: aghmosavleti gumista
76
+ #
77
+ # - source: ქვემო ბირცხა
78
+ # expected: kvemo birtskha
79
+ #
80
+ # - source: ზემო ბირცხა
81
+ # expected: zemo birtskha
82
+ #
83
+ # - source: აბჟაყვა
84
+ # expected: abzhaq’va
85
+
86
+
87
+
88
+ map:
89
+ characters:
90
+ '\u10d0' : 'a' # ა
91
+ '\u10d1' : 'b' # ბ
92
+ '\u10d2' : 'g' # გ
93
+ '\u10d3' : 'd' # დ
94
+ '\u10d4' : 'e' # ე
95
+ '\u10d5' : 'v' # ვ
96
+ '\u10d6' : 'z' # ზ
97
+
98
+ '\u10f1' : 'ey' # ჱ
99
+
100
+ '\u10d7' : 't’' # თ
101
+ '\u10d8' : 'i' # ი
102
+ '\u10d9' : 'k’' # კ
103
+ '\u10da' : 'l' # ლ
104
+ '\u10db' : 'm' # მ
105
+ '\u10dc' : 'n' # ნ
106
+
107
+ '\u10f2' : 'j' # ჲ
108
+
109
+ '\u10dd' : 'o' # ო
110
+ '\u10de' : 'p' # პ
111
+ '\u10df' : 'zh' # ჟ
112
+ '\u10e0' : 'r' # რ
113
+ '\u10e1' : 's' # ს
114
+ '\u10e2' : 't' # ტ
115
+ '\u10e3' : 'u' # უ
116
+ '\u10e4' : 'p’' # ფ
117
+ '\u10e5' : 'k’' # ქ
118
+ '\u10e6' : 'gh' # ღ
119
+ '\u10e7' : 'q' # ყ
120
+ '\u10e8' : 'sh' # შ
121
+ '\u10e9' : 'ch’' # ჩ
122
+ '\u10ea' : 'ts’' # ც
123
+ '\u10eb' : 'dz' # ძ
124
+ '\u10ec' : 'ts' # წ
125
+ '\u10ed' : 'ch' # ჭ
126
+ '\u10ee' : 'kh' # ხ
127
+
128
+ '\u10f4' : 'q’' # ჴ
129
+
130
+ '\u10ef' : 'j' # ჯ
131
+ '\u10f0' : 'h' # ჰ
@@ -0,0 +1,42 @@
1
+ ---
2
+ authority_id: bgnpcgn
3
+ id: 2009
4
+ language: iso-639-2:kat
5
+ source_script: Geor
6
+ destination_script: Latn
7
+ name: ROMANIZATION OF GEORGIAN; Georgia 2011 national system; BGN/PCGN 2009 Agreement
8
+ url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/810202/ROMANIZATION_OF_GEORGIAN.pdf
9
+ creation_date: 2009
10
+ confirmation_date: 2011
11
+ description: |
12
+ This romanization system corresponds to that devised in 2002 by the
13
+ State Department of Geodesy and Cartography of Georgia and the
14
+ Institute of Linguistics of the Georgian Academy of Sciences, and
15
+ approved by Presidential Decree 109 of 24 February 2011. It represents
16
+ the Mkhedruli alphabet, as presently used in Georgia. This system was
17
+ adopted by BGN and PCGN in 2009, superseding the BGN/PCGN system of
18
+ 1981.
19
+
20
+ notes:
21
+ - This system denotes ejective (glottalised) consonants by means of
22
+ an apostrophe. The BGN/PCGN 1981 system instead used the apostrophe to
23
+ denote aspirated consonants (letters 8, 21, 22, 26 & 27).
24
+ - The Romanization columns show only lowercase forms but, when
25
+ romanizing, uppercase and lowercase Roman letters as appropriate should
26
+ be used.
27
+
28
+ tests:
29
+ - source: თბილისი
30
+ expected: tbilisi
31
+
32
+ - source: მეღვინეთუხუცესი
33
+ expected: meghvinetukhutsesi
34
+
35
+ - source: ჭიანჭველა
36
+ expected: ch’ianch’vela
37
+
38
+ - source: ბაყაყი
39
+ expected: baq’aq’i
40
+
41
+ map:
42
+ inherit: "ggg-kat-Geor-Latn-2002"