interscript 0.1.6 → 0.1.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (251) hide show
  1. checksums.yaml +4 -4
  2. data/lib/interscript.rb +10 -6
  3. data/lib/interscript/fs.rb +0 -2
  4. data/lib/interscript/mapping.rb +1 -1
  5. data/lib/interscript/opal.rb +38 -8
  6. data/lib/interscript/opal/entrypoint.rb +12 -0
  7. data/lib/interscript/opal/map_translate.rb +7 -0
  8. data/lib/interscript/version.rb +1 -1
  9. data/maps/acadsin-zho-Hani-Latn-2002.yaml +5 -1
  10. data/maps/alalc-amh-Ethi-Latn-1997.yaml +5 -1
  11. data/maps/alalc-amh-Ethi-Latn-2011.yaml +1 -1
  12. data/maps/alalc-ara-Arab-Latn-1997.yaml +5 -1
  13. data/maps/alalc-asm-Deva-Latn-1997.yaml +9 -3
  14. data/maps/alalc-asm-Deva-Latn-2012.yaml +40 -0
  15. data/maps/alalc-aze-Cyrl-Latn-1997.yaml +5 -1
  16. data/maps/alalc-bel-Cyrl-Latn-1997.yaml +5 -1
  17. data/maps/alalc-ben-Beng-Latn-2017.yaml +1 -1
  18. data/maps/alalc-bul-Cyrl-Latn-1997.yaml +5 -1
  19. data/maps/alalc-ell-Grek-Latn-1997.yaml +5 -1
  20. data/maps/alalc-ell-Grek-Latn-2010.yaml +1 -2
  21. data/maps/alalc-guj-Gujr-Latn-1997.yaml +266 -0
  22. data/maps/alalc-guj-Gujr-Latn-2011.yaml +64 -0
  23. data/maps/alalc-hin-Deva-Latn-1997.yaml +211 -0
  24. data/maps/alalc-hin-Deva-Latn-2011.yaml +47 -0
  25. data/maps/alalc-kat-Geok-Latn-1997.yaml +1 -1
  26. data/maps/alalc-kat-Geor-Latn-1997.yaml +5 -1
  27. data/maps/alalc-kor-Hang-Latn-1997.yaml +5 -1
  28. data/maps/alalc-mal-Mlym-Latn-1997.yaml +303 -0
  29. data/maps/alalc-mal-Mlym-Latn-2012.yaml +73 -0
  30. data/maps/alalc-mar-Deva-Latn-1997.yaml +21 -2
  31. data/maps/alalc-mar-Deva-Latn-2011.yaml +45 -0
  32. data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +1 -1
  33. data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +1 -1
  34. data/maps/alalc-mon-Cyrl-Latn-1997.yaml +220 -0
  35. data/maps/{alalc-pan-Deva-Latn-1997.yaml → alalc-pan-Guru-Latn-1997.yaml} +23 -4
  36. data/maps/alalc-pan-Guru-Latn-2011.yaml +78 -0
  37. data/maps/alalc-per-Arab-Latn-1997.yaml +375 -0
  38. data/maps/alalc-pli-Deva-Latn-2012.yaml +144 -0
  39. data/maps/alalc-pra-Deva-Latn-2012.yaml +47 -0
  40. data/maps/alalc-rus-Cyrl-Latn-1997.yaml +5 -1
  41. data/maps/alalc-rus-Cyrl-Latn-2012.yaml +1 -1
  42. data/maps/alalc-san-Deva-Latn-2012.yaml +172 -0
  43. data/maps/alalc-sin-Sinh-Latn-1997.yaml +292 -0
  44. data/maps/alalc-sin-Sinh-Latn-2011.yaml +71 -0
  45. data/maps/alalc-srp-Cyrl-Latn-1997.yaml +5 -1
  46. data/maps/alalc-srp-Cyrl-Latn-2013.yaml +1 -1
  47. data/maps/alalc-tam-Taml-Latn-1997.yaml +62 -0
  48. data/maps/alalc-tam-Taml-Latn-2011.yaml +58 -0
  49. data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +5 -1
  50. data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +1 -1
  51. data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +1 -1
  52. data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +1 -1
  53. data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +1 -1
  54. data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +1 -1
  55. data/maps/bgn-kor-Hang-Latn-1943.yaml +7 -3
  56. data/maps/bgn-kor-Kore-Latn-1943.yaml +3 -3
  57. data/maps/bgna-bul-Cyrl-Latn-2006.yaml +1 -1
  58. data/maps/bgna-bul-Cyrl-Latn-2009.yaml +1 -1
  59. data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +5 -1
  60. data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +5 -1
  61. data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +1 -1
  62. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +2 -2
  63. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +6 -2
  64. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +5 -1
  65. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +5 -1
  66. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +5 -1
  67. data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +184 -0
  68. data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +5 -1
  69. data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +5 -1
  70. data/maps/{bgnpcgn-per-Arab-Latn-1956.yaml → bgnpcgn-fas-Arab-Latn-1956.yaml} +5 -1
  71. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +1 -1
  72. data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +5 -1
  73. data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +1 -1
  74. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +1 -1
  75. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +1 -1
  76. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +1 -1
  77. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +5 -1
  78. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +1 -1
  79. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +223 -0
  80. data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +31 -1
  81. data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +336 -0
  82. data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +639 -0
  83. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +459 -0
  84. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +168 -0
  85. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +5 -1
  86. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +5 -1
  87. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +220 -0
  88. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +240 -0
  89. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +5 -1
  90. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +3 -92
  91. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +127 -0
  92. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +82 -0
  93. data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +1 -1
  94. data/maps/bis-asm-Beng-Latn-13194-1991.yaml +1 -1
  95. data/maps/bis-ben-Beng-Latn-13194-1991.yaml +1 -1
  96. data/maps/bis-dev-Deva-Latn-13194-1991.yaml +1 -1
  97. data/maps/{bis-gjr-Gujr-Latn-13194-1991.yaml → bis-guj-Gujr-Latn-13194-1991.yaml} +17 -2
  98. data/maps/bis-knd-Knda-Latn-13194-1991.yaml +1 -1
  99. data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +1 -1
  100. data/maps/bis-ori-Orya-Latn-13194-1991.yaml +1 -1
  101. data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +1 -1
  102. data/maps/bis-tel-Telu-Latn-13194-1991.yaml +1 -1
  103. data/maps/bis-tml-Taml-Latn-13194-1991.yaml +1 -1
  104. data/maps/by-bel-Cyrl-Latn-1998.yaml +5 -1
  105. data/maps/by-bel-Cyrl-Latn-2007.yaml +1 -1
  106. data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +899 -0
  107. data/maps/din-hin-Deva-Latn-33904-2018.yaml +100 -0
  108. data/maps/din-kat-Geor-Latn-32707-2010.yaml +145 -0
  109. data/maps/din-mar-Deva-Latn-33904-2018.yaml +84 -0
  110. data/maps/din-nep-Deva-Latn-33904-2018.yaml +119 -0
  111. data/maps/din-pli-Deva-Latn-33904-2018.yaml +75 -0
  112. data/maps/din-pra-Deva-Latn-33904-2018.yaml +63 -0
  113. data/maps/din-san-Deva-Latn-33904-2018.yaml +338 -0
  114. data/maps/din-tam-Taml-Latn-33903-2016.yaml +213 -0
  115. data/maps/dos-nep-Deva-Latn-1997.yaml +15 -1
  116. data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +3 -3
  117. data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +2 -2
  118. data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +2 -2
  119. data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +2 -2
  120. data/maps/ggg-kat-Geor-Latn-2002.yaml +5 -1
  121. data/maps/gki-bel-Cyrl-Latn-1992.yaml +1 -1
  122. data/maps/gki-bel-Cyrl-Latn-2000.yaml +1 -1
  123. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +7 -3
  124. data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +157 -0
  125. data/maps/hk-yue-Hani-Latn-1888.yaml +1 -1
  126. data/maps/icao-bel-Cyrl-Latn-9303.yaml +1 -1
  127. data/maps/icao-bul-Cyrl-Latn-9303.yaml +1 -1
  128. data/maps/{icao-per-Arab-Latn-9303.yaml → icao-fas-Arab-Latn-9303.yaml} +1 -1
  129. data/maps/icao-heb-Hebr-Latn-9303.yaml +1 -1
  130. data/maps/icao-mkd-Cyrl-Latn-9303.yaml +1 -1
  131. data/maps/icao-rus-Cyrl-Latn-9303.yaml +1 -1
  132. data/maps/icao-srp-Cyrl-Latn-9303.yaml +1 -1
  133. data/maps/icao-ukr-Cyrl-Latn-9303.yaml +1 -1
  134. data/maps/iso-ara-Arab-Latn-233-1984.yaml +1 -1
  135. data/maps/iso-asm-Beng-Latn-15919-2001.yaml +75 -0
  136. data/maps/iso-ben-Beng-Latn-15919-2001.yaml +175 -0
  137. data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +8 -4
  138. data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +8 -4
  139. data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +220 -0
  140. data/maps/iso-hin-Deva-Latn-15919-2001.yaml +87 -0
  141. data/maps/iso-inc-Deva-Latn-15919-2001.yaml +61 -0
  142. data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +10 -6
  143. data/maps/iso-kan-Knda-Latn-15919-2001.yaml +220 -0
  144. data/maps/iso-kat-Geor-Latn-9984-1996.yaml +145 -0
  145. data/maps/iso-kor-Hang-Latn-1996-method1.yaml +240 -0
  146. data/maps/iso-kor-Hang-Latn-1996-method2.yaml +226 -0
  147. data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +281 -0
  148. data/maps/iso-mar-Deva-Latn-15919-2001.yaml +75 -0
  149. data/maps/iso-nep-Deva-Latn-15919-2001.yaml +87 -0
  150. data/maps/iso-ori-Orya-Latn-15919-2001.yaml +193 -0
  151. data/maps/iso-pan-Guru-Latn-15919-2001.yaml +222 -0
  152. data/maps/iso-pli-Beng-Latn-15919-2001.yaml +73 -0
  153. data/maps/iso-pli-Deva-Latn-15919-2001.yaml +74 -0
  154. data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +219 -0
  155. data/maps/iso-pli-Thai-Latn-15919-2001.yaml +55 -0
  156. data/maps/iso-pra-Deva-Latn-15919-2001.yaml +59 -0
  157. data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +366 -0
  158. data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +3 -3
  159. data/maps/iso-san-Deva-Latn-15919-2001.yaml +220 -0
  160. data/maps/iso-tam-Taml-Latn-15919-2001.yaml +159 -0
  161. data/maps/iso-tel-Telu-Latn-15919-2001.yaml +220 -0
  162. data/maps/iso-tha-Thai-Latn-11940-1998.yaml +1 -1
  163. data/maps/kp-kor-Hang-Latn-2002.yaml +25 -17
  164. data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +1 -1
  165. data/maps/mext-jpn-Hrkt-Latn-1954.yaml +1 -1
  166. data/maps/mns-mon-Cyrl-Latn-5217-2012.yaml +163 -0
  167. data/maps/mns-mon-Latn-Cyrl-5217-2012.yaml +200 -0
  168. data/maps/moct-kor-Hang-Latn-2000.yaml +6 -2
  169. data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +1 -1
  170. data/maps/mvd-bel-Cyrl-Latn-2008.yaml +2 -2
  171. data/maps/mvd-bel-Cyrl-Latn-2010.yaml +3 -3
  172. data/maps/mvd-rus-Cyrl-Latn-2008.yaml +2 -2
  173. data/maps/mvd-rus-Cyrl-Latn-2010.yaml +2 -2
  174. data/maps/odni-ara-Arab-Latn-2015.yaml +425 -0
  175. data/maps/odni-aze-Cyrl-Latn-2015.yaml +1 -1
  176. data/maps/odni-bel-Cyrl-Latn-2015.yaml +1 -1
  177. data/maps/odni-bul-Cyrl-Latn-2015.yaml +2 -2
  178. data/maps/odni-che-Cyrl-Latn-2015.yaml +169 -0
  179. data/maps/odni-fas-Arab-Latn-2015.yaml +406 -0
  180. data/maps/odni-hin-Deva-Latn-2015.yaml +1 -1
  181. data/maps/odni-kat-Geor-Latn-2015.yaml +1 -1
  182. data/maps/odni-kaz-Cyrl-Latn-2015.yaml +1 -1
  183. data/maps/odni-kir-Cyrl-Latn-2015.yaml +1 -1
  184. data/maps/odni-kor-Hang-Latn-2015.yaml +375 -0
  185. data/maps/odni-mkd-Cyrl-Latn-2015.yaml +1 -1
  186. data/maps/odni-per-Arab-Latn-2015.yaml +228 -0
  187. data/maps/odni-rus-Cyrl-Latn-2015.yaml +1 -1
  188. data/maps/odni-srp-Cyrl-Latn-2015.yaml +1 -1
  189. data/maps/odni-tat-Cyrl-Latn-2015.yaml +1 -1
  190. data/maps/odni-tgk-Cyrl-Latn-2015.yaml +1 -1
  191. data/maps/odni-uig-Cyrl-Latn-2015.yaml +1 -1
  192. data/maps/odni-ukr-Cyrl-Latn-2015.yaml +1 -1
  193. data/maps/odni-urd-Arab-Latn-2015.yaml +1 -1
  194. data/maps/odni-uzb-Cyrl-Latn-2015.yaml +1 -1
  195. data/maps/royin-tha-Thai-Latn-1939-generic.yaml +1 -1
  196. data/maps/royin-tha-Thai-Latn-1968.yaml +5 -1
  197. data/maps/royin-tha-Thai-Latn-1999-chained.yaml +1 -1
  198. data/maps/royin-tha-Thai-Latn-1999.yaml +5 -1
  199. data/maps/sac-zho-Hans-Latn-1979.yaml +5 -1
  200. data/maps/sasm-mon-Mong-Latn-general-1978.yaml +389 -0
  201. data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +354 -0
  202. data/maps/ses-ara-Arab-Latn-1930.yaml +5 -1
  203. data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +1 -1
  204. data/maps/ua-ukr-Cyrl-Latn-1996.yaml +6 -2
  205. data/maps/ua-ukr-Cyrl-Latn-2007.yaml +75 -0
  206. data/maps/ua-ukr-Cyrl-Latn-2010.yaml +192 -0
  207. data/maps/{ungegn-amh-Ethi-Latn-2016.yaml → un-amh-Ethi-Latn-2016.yaml} +51 -24
  208. data/maps/un-ara-Arab-Latn-1971.yaml +1 -1
  209. data/maps/un-ara-Arab-Latn-1972.yaml +1 -1
  210. data/maps/un-ara-Arab-Latn-2017.yaml +1 -1
  211. data/maps/un-bel-Cyrl-Latn-2007.yaml +1 -1
  212. data/maps/un-ben-Beng-Latn-2016.yaml +1 -1
  213. data/maps/{un-ell-Grek-Latn-phonetic-1987.yaml → un-ell-Grek-Latn-1987-phonetic.yaml} +2 -2
  214. data/maps/un-ell-Grek-Latn-1987-tl.yaml +2 -2
  215. data/maps/un-ell-Grek-Latn-1987-ts.yaml +3 -3
  216. data/maps/un-hin-Deva-Latn-2016.yaml +222 -0
  217. data/maps/un-mar-Deva-Latn-2016.yaml +91 -0
  218. data/maps/un-mon-Mong-Latn-general-2013.yaml +264 -0
  219. data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +264 -0
  220. data/maps/un-nep-Deva-Latn-1972.yaml +204 -17
  221. data/maps/un-nep-Deva-Latn-2013.yaml +74 -0
  222. data/maps/un-rus-Cyrl-Latn-1987.yaml +1 -1
  223. data/maps/un-ukr-Cyrl-Latn-1998.yaml +35 -12
  224. data/maps/un-ukr-Cyrl-Latn-2012.yaml +162 -0
  225. data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +221 -0
  226. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +1 -1
  227. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +1 -1
  228. data/maps/{nil-kor-Hang-Hang-jamo.yaml → var-kor-Hang-Hang-jamo.yaml} +1 -1
  229. data/maps/var-kor-Hang-Latn-mr-1939.yaml +2 -2
  230. data/maps/var-kor-Kore-Hang-2013.yaml +1 -1
  231. data/maps/var-kor-Kore-Latn-mr-1939.yaml +1 -1
  232. data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +43 -0
  233. data/maps/var-mon-Mong-Latn-1930.yaml +102 -0
  234. data/maps/var-mon-Mong-Latn-lessing.yaml +272 -0
  235. data/maps/var-mon-Mong-Latn-vpmc.yaml +274 -0
  236. data/maps/var-pra-Deva-Latn-iast-1912.yaml +30 -0
  237. data/maps/var-san-Deva-Latn-iast-1912.yaml +149 -0
  238. data/maps/var-tha-Thai-Thai-phonemic.yaml +1 -1
  239. data/maps/var-tha-Thai-Zsym-ipa.yaml +1 -1
  240. data/maps/{var-zho-Hani-Latn-1979.yaml → var-zho-Hani-Latn-wd-1979.yaml} +6 -2
  241. data/spec/interscript/filenames_spec.rb +384 -0
  242. data/spec/interscript_spec.rb +7 -4
  243. metadata +105 -26
  244. data/bin/interscript +0 -41
  245. data/bin/rspec +0 -29
  246. data/bin/setup +0 -8
  247. data/lib/__pycache__/g2pwrapper.cpython-38.pyc +0 -0
  248. data/lib/interscript-opal.rb +0 -2
  249. data/lib/interscript/opal_map_translate.rb +0 -12
  250. data/maps/alalc-hin-Deva-Latn-2020.yaml +0 -159
  251. data/maps/un-mon-Mong-Latn-2013.yaml +0 -99
@@ -1,10 +1,14 @@
1
1
  ---
2
2
  authority_id: bgnpcgn
3
3
  id: 1952
4
- language: bul
4
+ language: iso-639-2:bul
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
7
  name: ROMANIZATION SYSTEM FOR BULGARIAN BGN/PCGN of 1952
8
+ alias:
9
+ ogc11122:
10
+ code: bul_Cyrl2Latn_BGN_1952
11
+ description: Bulgarian US Board on Geographic Names(BGN)/Permanent Committee on Geographical Names for British Official Use(PCGN) Bulgarian 1952 System
8
12
  url: https://libraries.ucsd.edu/bib/fed/USBGN_romanization.pdf
9
13
  creation_date: 1945
10
14
  confirmation_date: 1952
@@ -1,10 +1,14 @@
1
1
  ---
2
2
  authority_id: bgnpcgn
3
3
  id: 2013
4
- language: bul
4
+ language: iso-639-2:bul
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
7
  name: BGN/PCGN 2013 Agreement
8
+ alias:
9
+ ogc11122:
10
+ code: bul_Cyrl2Latn_BGN_2013
11
+ description: Bulgarian US Board on Geographic Names(BGN)/Permanent Committee on Geographical Names(PCGN) Bulgarian 2013 System
8
12
  url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/811509/ROMANIZATION_OF_BULGARIAN.pdf
9
13
  creation_date: 2013
10
14
  confirmation_date: 2019-06
@@ -0,0 +1,184 @@
1
+ ---
2
+ authority_id: bgnpcgn
3
+ id: 2008
4
+ language: iso-639-2:che
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/835782/TABLE_OF_CORRESPONDENCES_FOR_CHECHEN.pdf
8
+ creation_date: 2008
9
+ confirmation_date: 2019-07
10
+ description: |
11
+ Chechen is an official language within Chechnya, one of the republics of the Russian Federation.
12
+ It will normally be encountered in Cyrillic script, in which case it should be romanized by means of
13
+ the Cyrillic-Roman table of correspondences given below.
14
+
15
+ notes:
16
+ - The letter ə is used to represent short a; a is used for long a.
17
+ - Ye is used word- and syllable-initially. This Cyrillic letter may be encountered as the ligature ie in Chechen-Roman sources.
18
+ - This character occurs only in loan words.
19
+ - q in the combination ккх (qq) and q̇ in the combination ккъ (q̇q̇)
20
+ - ŋ when preceding vowel is nasalized.
21
+ - This Cyrillic letter may be encountered as the ligature ꭣ [U+AB63] or the diphthong oa in Chechen Roman sources.
22
+ - Unless in the combinations гӀ, кӀ, пӀ, тӀ, хӀ, цӀ and чӀ.
23
+ - |
24
+ An inventory of letter-diacritic combinations, with their Unicode encoding, in addition to the
25
+ unmodified letters of the basic Roman script is:
26
+
27
+ All apostrophes appearing in romanization are U+2019
28
+
29
+ Ə (U+018F) ə (U+0259)
30
+ Ä (U+00C4) ä (U+00E4)
31
+ Ġ (U+0047+0307) ġ (U+0067+0307)
32
+ Z̵ (U+005A+0335) z̵ (U+007A+0335)
33
+ Q̇ (U+0051+0307) q̇ (U+0071+0307)
34
+ Ŋ (U+014A) ŋ (U+014B)
35
+ Ö (U+00D6) ö (U+00F6)
36
+ Ü (U+00DC) ü (U+00FC)
37
+ Ẋ (U+0058+0307) ẋ (U+0078+0307)
38
+ Ċ (U+0043+0307) ċ (U+0063+0307)
39
+ Ç (U+00C7) ç (U+00E7)
40
+ Ç̇ (U+00C7+0307) ç̇ (U+00E7+0307)
41
+ Ş (U+015E) ş (U+015F)
42
+
43
+ - The Roman-script columns show only lowercase forms but, when applying the table, uppercase and lowercase Roman letters as appropriate should be used
44
+
45
+ tests:
46
+ - source: кӏант
47
+ expected: khant
48
+ - source: зуда
49
+ expected: zuda
50
+ - source: пхьагал
51
+ expected: pẋagal
52
+ - source: наж
53
+ expected: naz̵
54
+ - source: мангал
55
+ expected: mangal
56
+ - source: Ӏаж
57
+ expected: Jaz̵
58
+ - source: Нохчийн Википеди
59
+ expected: Noxçiyn Vikipedi
60
+ - source: сагӏадаккхар
61
+ expected: saġadaqqar
62
+ - source: йеза
63
+ expected: yeza
64
+ - source: еара
65
+ expected: yeara
66
+ - source: елха
67
+ expected: yelxa
68
+
69
+ map:
70
+ rules:
71
+ # note[2]
72
+ - pattern: (?<!\b\u2019)\b\u0415 # Е in initial position -> Ye
73
+ result: Ye
74
+ - pattern: (?<!\b\u2019)\b\u0435 # е in initial position -> ye
75
+ result: ye
76
+ # note[4]
77
+ - pattern: \u043A\u043A\u0445
78
+ result: qq
79
+ - pattern: \u043A\u043A\u044A
80
+ result: q̇q̇
81
+ - pattern: \u041A\u041A\u0445
82
+ result: QQ
83
+ - pattern: \u041A\u041A\u042A
84
+ result: Q̇Q̇
85
+
86
+ characters:
87
+ '\u0410' : ['A', 'Ə'] # А note[1]
88
+ '\u0410\u044C' : "A\u0308" # Аь -> Ä
89
+ '\u0411' : 'B' # Б
90
+ '\u0412' : 'V' # В
91
+ '\u0413' : 'G' # Г
92
+ '\u0413\u04C0' : "G\u0307" # ГӀ -> Ġ
93
+ '\u0414' : 'D' # Д
94
+ '\u0415' : 'E' # Е note[2]
95
+ '\u0401' : 'Yo' # Ё note[3]
96
+ '\u0416' : "Z\u0335" # Ж -> Ƶ
97
+ '\u0417' : 'Z' # З
98
+ '\u0418' : 'I' # И
99
+ '\u0419' : 'Y' # Й
100
+ '\u041A' : 'K' # К note[4]
101
+ '\u041A\u0445' : 'Q' # Кх note[4]
102
+ '\u041A\u044A' : "Q\u0307" # Къ -> Q̇ note[4]
103
+ '\u041A\u04C0' : 'Kh' # КӀ note[4]
104
+ '\u041B' : 'L' # Л
105
+ '\u041C' : 'M' # М
106
+ '\u041D' : ['N', 'Ŋ'] # Н note[5]
107
+ '\u041E' : 'O' # О note[6]
108
+ '\u041E\u044C' : "O\u0308" # Оь -> Ö
109
+ '\u041F' : 'P' # П
110
+ '\u041F\u04C0' : 'Ph' # ПӀ
111
+ '\u0420' : 'R' # Р
112
+ '\u0421' : 'S' # С
113
+ '\u0422' : 'T' # Т
114
+ '\u0422\u04C0' : 'Th' # TӀ
115
+ '\u0423' : 'U' # У
116
+ '\u0423\u044C' : "U\u0308" # Уь -> Ü
117
+ '\u0424' : 'F' # Ф
118
+ '\u0425' : 'X' # Х
119
+ '\u0425\u044C' : "X\u0307" # Хь -> Ẋ
120
+ '\u0425\u04C0' : "H" # ХӀ
121
+ '\u0426' : 'C' # Ц
122
+ '\u0426\u04C0' : "C\u0307" # ЦӀ -> Ċ
123
+ '\u0427' : "C\u0327" # Ч -> Ç
124
+ '\u0427\u04C0' : "\u00C7\u0307" # ЧӀ -> Ç̇
125
+ '\u0428' : "S\u0327" # Ш -> Ş
126
+ '\u0429' : "S\u0327C\u0327" # Щ -> ŞÇ note[3]
127
+ '\u042A' : "’" # Ъ note[3]
128
+ '\u042B' : "Y" # Ы
129
+ '\u042C' : "" # Ь note[3]
130
+ '\u042D' : "E" # Э
131
+ '\u042E' : "Yu" # Ю
132
+ '\u042E\u044C' : "Yu\u0308" # Юь -> Yü
133
+ '\u042F' : "Ya" # Я
134
+ '\u042F\u044C' : "Ya\u0308" # Яь -> Yä
135
+ '\u04C0' : "J" # Ӏ note[7]
136
+
137
+ '\u0430' : ['a', 'ə'] # а note[1]
138
+ '\u0430\u044C' : "a\u0308" # аь -> ä
139
+ '\u0431' : 'b' # б
140
+ '\u0432' : 'v' # в
141
+ '\u0433' : 'g' # г
142
+ '\u0433\u04CF' : "g\u0307" # гӏ -> ġ
143
+ '\u0434' : 'd' # д
144
+ '\u0435' : 'e' # е note[2]
145
+ '\u0451' : 'yo' # ё note[3]
146
+ '\u0436' : "z\u0335" # ж -> ƶ
147
+ '\u0437' : 'z' # з
148
+ '\u0438' : 'i' # и
149
+ '\u0439' : 'y' # й
150
+ '\u043A' : 'k' # к note[4]
151
+ '\u043A\u0445' : 'q' # кх note[4]
152
+ '\u043A\u044A' : "q\u0307" # къ -> q̇ note[4]
153
+ '\u043A\u04CF' : 'kh' # кӏ note[4]
154
+ '\u043B' : 'l' # л
155
+ '\u043C' : 'm' # м
156
+ '\u043D' : ['n', 'ŋ'] # н note[5]
157
+ '\u043E' : 'o' # о note[6]
158
+ '\u043E\u044C' : "o\u0308" # оь -> ö
159
+ '\u043F' : 'p' # п
160
+ '\u0440' : 'r' # р
161
+ '\u0441' : 's' # с
162
+ '\u0442' : 't' # т
163
+ '\u0442\u04CF' : 'th' # тӏ
164
+ '\u0443' : 'u' # у
165
+ '\u0443\u044C' : "u\u0308" # уь -> ü
166
+ '\u0444' : 'f' # ф
167
+ '\u0445' : 'x' # х
168
+ '\u0445\u044C' : "x\u0307" # хь -> ẋ
169
+ '\u0445\u04CF' : "h" # хӏ
170
+ '\u0446' : 'c' # ц
171
+ '\u0446\u04CF' : "c\u0307" # цӏ -> ċ
172
+ '\u0447' : "c\u0327" # ч -> ç
173
+ '\u0447\u04CF' : "\u00E7\u0307" # чӏ -> ç̇
174
+ '\u0448' : "s\u0327" # ш -> ş
175
+ '\u0449' : "s\u0327c\u0327" # щ -> şç note[3]
176
+ '\u044A' : "’" # ъ note[3]
177
+ '\u044B' : "y" # ы
178
+ '\u044C' : '' # ь note[3]
179
+ '\u044D' : "e" # э
180
+ '\u044E' : "yu" # ю
181
+ '\u044E\u044C' : "yu\u0308" # юь -> yü
182
+ '\u044F' : "ya" # я
183
+ '\u044F\u044C' : "ya\u0308" # яь -> yä
184
+ '\u04CF' : "j" # ӏ note[7]
@@ -1,10 +1,14 @@
1
1
  ---
2
2
  authority_id: bgnpcgn
3
3
  id: 1962
4
- language: ell
4
+ language: iso-639-2:ell
5
5
  source_script: Grek
6
6
  destination_script: Latn
7
7
  name: BGN/PCGN 1962 System
8
+ alias:
9
+ ogc11122:
10
+ code: ell_Grek2Latn_BGN_1962
11
+ description: US Board on Geographic Names(BGN)/Permanent Committee on Geographical Names for British Official Use(PCGN) Greek 1962 System (out of date)
8
12
  url: https://github.com/riboseinc/interscript/files/4225556/BGN_Romanization_Guide_1962_greek.pdf
9
13
  creation_date: 1962
10
14
  description: |
@@ -1,10 +1,14 @@
1
1
  ---
2
2
  authority_id: bgnpcgn
3
3
  id: 1996
4
- language: ell
4
+ language: iso-639-2:ell
5
5
  source_script: Grek
6
6
  destination_script: Latn
7
7
  name: BGN/PCGN 1996 System
8
+ alias:
9
+ ogc11122:
10
+ code: ell_Grek2Latn_ELOT743_1996
11
+ description: Greek ELOT 743 System, US Board on Geographic Names(BGN)/Permanent Committee on Geographical Names for British Official Use(PCGN) 1996 agreement
8
12
  url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/693694/ROMANIZATION_OF_GREEK.pdf
9
13
  creation_date: 1996
10
14
  description: |
@@ -3,10 +3,14 @@
3
3
  # TODO: Add tests from PDF
4
4
  authority_id: bgnpcgn
5
5
  id: 1956
6
- language: per
6
+ language: iso-639-2:fas
7
7
  source_script: Arab
8
8
  destination_script: Latn
9
9
  name: BGN/PCGN 1956 System
10
+ alias:
11
+ ogc11122:
12
+ code: fas_Arab2Latn_BGN_1958
13
+ description: Persian (Afghan and Iranian) BGN/Permanent Committee on Geographical Names for British Official Use(PCGN) 1958 System
10
14
  url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/320079/Arabic_Romanization.pdf
11
15
  creation_date: 1947
12
16
  confirmation_date: 2019-06
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  authority_id: bgnpcgn
3
3
  id: 1930
4
- language: jpn
4
+ language: iso-639-2:jpn
5
5
  source_script: Hrkt
6
6
  destination_script: Latn
7
7
  name: Japanese Kana Modified Hepburn 1930 System
@@ -1,10 +1,14 @@
1
1
  ---
2
2
  authority_id: bgnpcgn
3
3
  id: 1981
4
- language: kat
4
+ language: iso-639-2:kat
5
5
  source_script: Geor
6
6
  destination_script: Latn
7
7
  name: ROMANIZATION OF GEORGIAN; BGN/PCGN 1981 System
8
+ alias:
9
+ ogc11122:
10
+ code: kat_Geor2Latn_BGN_1981
11
+ description: Georgian US Board on Geographic Names(BGN)/Permanent Committee on Geographical Names for British Official Use(PCGN) 1981 System
8
12
  url: https://transliteration.eki.ee/pdf/Georgian.pdf
9
13
  creation_date: 1981
10
14
  confirmation_date: 1981
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  authority_id: bgnpcgn
3
3
  id: 2009
4
- language: kat
4
+ language: iso-639-2:kat
5
5
  source_script: Geor
6
6
  destination_script: Latn
7
7
  name: ROMANIZATION OF GEORGIAN; Georgia 2011 national system; BGN/PCGN 2009 Agreement
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  authority_id: bgnpcgn
3
3
  id: kn-1945
4
- language: kor
4
+ language: iso-639-2:kor
5
5
  source_script: Hang
6
6
  destination_script: Latn
7
7
  name: BGN/PCGN 1945 Agreement
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  authority_id: bgnpcgn
3
3
  id: 2011
4
- language: kor
4
+ language: iso-639-2:kor
5
5
  source_script: Hang
6
6
  destination_script: Latn
7
7
  name: Ministry of Culture and Tourism System (2000) BGN/PCGN 2011 Agreement
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  authority_id: bgnpcgn
3
3
  id: 2011
4
- language: kor
4
+ language: iso-639-2:kor
5
5
  source_script: Kore
6
6
  destination_script: Latn
7
7
  name: Ministry of Culture and Tourism System (2000) BGN/PCGN 2011 Agreement
@@ -1,10 +1,14 @@
1
1
  ---
2
2
  authority_id: bgnpcgn
3
3
  id: 1981
4
- language: mkd
4
+ language: iso-639-2:mkd
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
7
  name: Makedonian Romanization, BGN/PCGN 1981 System
8
+ alias:
9
+ ogc11122:
10
+ code: mkd_Cyrl2Latn_BGN_1981
11
+ description: Macedonian US Board on Geographic Names(BGN)/Permanent Committee on Geographical Names for British Official Use(PCGN) 1981 System
8
12
  url: https://github.com/riboseinc/interscript/files/4247920/USBGN_romanization_Macedonian_1981.pdf
9
13
  creation_date: 1981
10
14
  description: BGN/PCGN Romanization table for Makedonian.
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  authority_id: bgnpcgn
3
3
  id: 2013
4
- language: mkd
4
+ language: iso-639-2:mkd
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
7
  name: Makedonian Romanization, BGN/PCGN 2013 System
@@ -0,0 +1,223 @@
1
+ ---
2
+ authority_id: bgnpcgn
3
+ id: 1964
4
+ language: iso-639-2:mon
5
+ source_script: Cyrl
6
+ destination_script: Latn
7
+ name: BGN/PCGN 1964 System
8
+ alias:
9
+ ogc11122:
10
+ code: mon_Cyrl2Latn_BGN_1964
11
+ description: Mongolian US Board on Geographic Names(BGN)/Permanent Committee on Geographical Names for British Official Use(PCGN) 1964 System
12
+ url: https://github.com/interscript/interscript/files/5180767/BGN_Romanization_Guide_1964_mongolian_1964.pdf
13
+ creation_date:
14
+ confirmation_date:
15
+ description: |
16
+ This system was originated by the PCGN in 1957 and adopted as a
17
+ BGN/PCGN System in 1964. It is intended for use in the romanization of
18
+ geographic names in the "Mongolian People's Republic" but not to romanize
19
+ Mongolian names in adjacent parts of China and the U.S.S.R.
20
+
21
+ notes: |
22
+ - b occurs initially and after л, м, and б.
23
+ - v occurs medially in Mongolian words and initially in foreign words.
24
+ - y occurs only as the second element of diphthongs.
25
+ - k, p, f, and shch occur in foreign words only.
26
+ - "\u2019" occurs only in Russian words.
27
+ - ï occurs only in suffixes to words containing back vowels (a, o, and u).
28
+ - In monosyllables yu or yü depending on pronunciation; in polysyllables yu when followed by a, o, or u, but yü when followed by i, e, ö, or ü.
29
+
30
+ tests:
31
+ - source: Эрдэнэт Сум
32
+ expected: Erdenet Sum
33
+ - source: Эрдэнэт
34
+ expected: Erdenet
35
+ - source: Эрдэнэ
36
+ expected: Erdene
37
+ - source: Шивээговь Сум
38
+ expected: Shiveegovĭ Sum
39
+ - source: Шивээговь
40
+ expected: Shiveegovĭ
41
+ - source: Шарынгол Сум
42
+ expected: Sharïngol Sum
43
+ - source: Шарынгол
44
+ expected: Sharïngol
45
+ - source: Цагааннуур
46
+ expected: Tsagaannuur
47
+ - source: Хонгор Сум
48
+ expected: Hongor Sum
49
+ - source: Хонгор
50
+ expected: Hongor
51
+ - source: Хайлаастай
52
+ expected: Haylaastay
53
+ - source: Түнэл Сум
54
+ expected: Tünel Sum
55
+ - source: Түнэл
56
+ expected: Tünel
57
+ - source: Сүхбаатар
58
+ expected: Sühbaatar
59
+ - source: Сүмбэр Сум
60
+ expected: Sümber Sum
61
+ - source: Сүмбэр
62
+ expected: Sümber
63
+ - source: Сайншанд Сум
64
+ expected: Saynshand Sum
65
+ - source: Сайншанд
66
+ expected: Saynshand
67
+ - source: Орхон Сум
68
+ expected: Orhon Sum
69
+ - source: Орхон
70
+ expected: Orhon
71
+ - source: Нарст
72
+ expected: Narst
73
+ - source: Мөрөн Сум
74
+ expected: Mörön Sum
75
+ - source: Мөрөн
76
+ expected: Mörön
77
+ - source: Зүүнхөвөө
78
+ expected: Dzüünhövöö
79
+ - source: Жаргалант Сум
80
+ expected: Jargalant Sum
81
+ - source: Жаргалант
82
+ expected: Jargalant
83
+ - source: Дархан Сум
84
+ expected: Darhan Sum
85
+ - source: Даланзадгад Сум
86
+ expected: Dalandzadgad Sum
87
+ - source: Даланзадгад
88
+ expected: Dalandzadgad
89
+ - source: Давст Сум
90
+ expected: Davst Sum
91
+ - source: Давст
92
+ expected: Davst
93
+ - source: Говьсүмбэр Сум
94
+ expected: Govĭsümber Sum
95
+ - source: Говь
96
+ expected: Govĭ
97
+ - source: Буга
98
+ expected: Buga
99
+ - source: Бор-Өндөр Сум
100
+ expected: Bor-Öndör Sum
101
+ - source: Бор-Өндөр
102
+ expected: Bor-Öndör
103
+ - source: Баянхонгор
104
+ expected: Bayanhongor
105
+ - source: Баянтал
106
+ expected: Bayantal
107
+ - source: Баяндэлгэр Сум
108
+ expected: Bayandelger Sum
109
+ - source: Баяндэлгэр
110
+ expected: Bayandelger
111
+ - source: Баян-Өндөр Сум
112
+ expected: Bayan-Öndör Sum
113
+ - source: Баруун-Урт Сум
114
+ expected: Baruun-Urt Sum
115
+ - source: Баруун-Урт
116
+ expected: Baruun-Urt
117
+ - source: Архуст
118
+ expected: Arhust
119
+ - source: Арвайхээр Сум
120
+ expected: Arvayheer Sum
121
+ - source: Арвайхээр
122
+ expected: Arvayheer
123
+ - source: Есөнбулаг Сум
124
+ expected: Yösönbulag Sum
125
+ - source: Ерөө Сум
126
+ expected: Yöröö Sum
127
+ - source: Есөнзүйл Сум
128
+ expected: Yösöndzüyl Sum
129
+ - source: Ноён Сум
130
+ expected: Noyon Sum
131
+ - source: Родник Балянгийн-Булак
132
+ expected: Rodnik Balyangiyn-Bulak
133
+ - source: Замын-Үүд Сум
134
+ expected: Dzamïn-Üüd Sum
135
+ - source: Адаацаг Сум
136
+ expected: Adaatsag Sum
137
+ - source: Чандмань Сум
138
+ expected: Chandmanĭ Sum
139
+ - source: Хяргас Сум
140
+ expected: Hyargas Sum
141
+
142
+ map:
143
+ rules:
144
+ - pattern: \u042e(?=[АаОоУу]) # Ю before а, о, or у
145
+ result: "Yu"
146
+ - pattern: \u044e(?=[АаОоУу]) # ю before а, о, or у
147
+ result: "yu"
148
+ - pattern: \u042e(?=[ИиЭэӨөҮү]) # Ю before и, э, ө, or ү
149
+ result: "Yü"
150
+ - pattern: \u044e(?=[ИиЭэӨөҮү]) # ю before и, э, ө, or ү
151
+ result: "yü"
152
+
153
+ characters:
154
+ "А": "A" # \u0410
155
+ "Б": "B" # \u0411
156
+ "В": "V" # \u0412
157
+ "Г": "G" # \u0413
158
+ "Д": "D" # \u0414
159
+ "Е": "Yö" # \u0415
160
+ "Ё": "Yo" # \u0401
161
+ "Ж": "J" # \u0416
162
+ "З": "Dz" # \u0417
163
+ "И": "I" # \u0418
164
+ "Й": "Y" # \u0419
165
+ "К": "K" # \u041a
166
+ "Л": "L" # \u041b
167
+ "М": "M" # \u041c
168
+ "Н": "N" # \u041d
169
+ "О": "O" # \u041e
170
+ "Ө": "Ö" # \u04e8
171
+ "П": "P" # \u041f
172
+ "Р": "R" # \u0420
173
+ "С": "S" # \u0421
174
+ "Т": "T" # \u0422
175
+ "У": "U" # \u0423
176
+ "Ү": "Ü" # \u04ae
177
+ "Ф": "F" # \u0424
178
+ "Х": "H" # \u0425
179
+ "Ц": "Ts" # \u0426
180
+ "Ч": "Ch" # \u0427
181
+ "Ш": "Sh" # \u0428
182
+ "Щ": "Shch" # \u0429
183
+ "Ъ": "\u2019" # \u042a
184
+ "Ы": "Ï" # \u042b
185
+ "Ь": "Ĭ" # \u042c
186
+ "Э": "E" # \u042d
187
+ "Ю": "Yu" # \u042e
188
+ "Я": "Ya" # \u042f
189
+ "а": "a" # \u0430
190
+ "б": "b" # \u0431
191
+ "в": "v" # \u0432
192
+ "г": "g" # \u0433
193
+ "д": "d" # \u0434
194
+ "е": "yö" # \u0435
195
+ "ё": "yo" # \u0451
196
+ "ж": "j" # \u0436
197
+ "з": "dz" # \u0437
198
+ "и": "i" # \u0438
199
+ "й": "y" # \u0439
200
+ "к": "k" # \u043a
201
+ "л": "l" # \u043b
202
+ "м": "m" # \u043c
203
+ "н": "n" # \u043d
204
+ "о": "o" # \u043e
205
+ "ө": "ö" # \u04e9
206
+ "п": "p" # \u043f
207
+ "р": "r" # \u0440
208
+ "с": "s" # \u0441
209
+ "т": "t" # \u0442
210
+ "у": "u" # \u0443
211
+ "ү": "ü" # \u04af
212
+ "ф": "f" # \u0444
213
+ "х": "h" # \u0445
214
+ "ц": "ts" # \u0446
215
+ "ч": "ch" # \u0447
216
+ "ш": "sh" # \u0448
217
+ "щ": "shch" # \u0449
218
+ "ъ": "\u2019" # \u044a
219
+ "ы": "ï" # \u044b
220
+ "ь": "ĭ" # \u044c
221
+ "э": "e" # \u044d
222
+ "ю": "yu" # \u044e
223
+ "я": "ya" # \u044f