interscript 0.1.9 → 2.0.5
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/.gitignore +11 -0
- data/.rspec +3 -0
- data/Gemfile +29 -0
- data/LICENSE.adoc +31 -0
- data/README.md +3 -0
- data/Rakefile +53 -0
- data/bin/console +14 -0
- data/bin/interscript +5 -0
- data/bin/maps_analyze_staging +168 -0
- data/bin/maps_debug_compilers +58 -0
- data/bin/maps_debug_ordering +88 -0
- data/bin/maps_debug_ruby_compile +24 -0
- data/bin/maps_debug_step_by_step +44 -0
- data/bin/maps_optimize_order +112 -0
- data/bin/maps_v1_analyze_regexps +45 -0
- data/bin/maps_v1_to_v2 +426 -0
- data/bin/setup +8 -0
- data/exe/interscript +6 -0
- data/interscript.gemspec +31 -0
- data/lib/interscript.rb +80 -135
- data/lib/interscript/command.rb +5 -5
- data/lib/interscript/compiler.rb +22 -0
- data/lib/interscript/compiler/javascript.rb +292 -0
- data/lib/interscript/compiler/ruby.rb +262 -0
- data/lib/interscript/dsl.rb +67 -0
- data/lib/interscript/dsl/aliases.rb +23 -0
- data/lib/interscript/dsl/document.rb +46 -0
- data/lib/interscript/dsl/group.rb +45 -0
- data/lib/interscript/dsl/group/parallel.rb +6 -0
- data/lib/interscript/dsl/items.rb +89 -0
- data/lib/interscript/dsl/metadata.rb +26 -0
- data/lib/interscript/dsl/stage.rb +6 -0
- data/lib/interscript/dsl/symbol_mm.rb +11 -0
- data/lib/interscript/dsl/tests.rb +12 -0
- data/lib/interscript/interpreter.rb +251 -0
- data/lib/interscript/node.rb +25 -0
- data/lib/interscript/node/alias_def.rb +15 -0
- data/lib/interscript/node/dependency.rb +13 -0
- data/lib/interscript/node/document.rb +45 -0
- data/lib/interscript/node/group.rb +34 -0
- data/lib/interscript/node/group/parallel.rb +9 -0
- data/lib/interscript/node/group/sequential.rb +2 -0
- data/lib/interscript/node/item.rb +52 -0
- data/lib/interscript/node/item/alias.rb +42 -0
- data/lib/interscript/node/item/any.rb +61 -0
- data/lib/interscript/node/item/capture.rb +50 -0
- data/lib/interscript/node/item/group.rb +51 -0
- data/lib/interscript/node/item/repeat.rb +40 -0
- data/lib/interscript/node/item/stage.rb +23 -0
- data/lib/interscript/node/item/string.rb +51 -0
- data/lib/interscript/node/metadata.rb +18 -0
- data/lib/interscript/node/rule.rb +6 -0
- data/lib/interscript/node/rule/funcall.rb +18 -0
- data/lib/interscript/node/rule/run.rb +15 -0
- data/lib/interscript/node/rule/sub.rb +65 -0
- data/lib/interscript/node/stage.rb +19 -0
- data/lib/interscript/node/tests.rb +15 -0
- data/lib/interscript/stdlib.rb +211 -0
- data/lib/interscript/utils/regexp_converter.rb +283 -0
- data/lib/interscript/version.rb +1 -1
- data/requirements.txt +1 -0
- metadata +73 -458
- data/README.adoc +0 -296
- data/aliases.json +0 -1
- data/lib/g2pwrapper.py +0 -34
- data/lib/interscript/fs.rb +0 -96
- data/lib/interscript/mapping.rb +0 -144
- data/lib/interscript/opal.rb +0 -196
- data/lib/interscript/opal/entrypoint.rb +0 -20
- data/lib/interscript/opal/exports.rb +0 -11
- data/lib/interscript/opal/maps.js.erb +0 -8
- data/lib/model-7 +0 -0
- data/lib/tha-pt-b-7 +0 -0
- data/maps/acadsin-zho-Hani-Latn-2002.yaml +0 -38916
- data/maps/alalc-amh-Ethi-Latn-1997.yaml +0 -513
- data/maps/alalc-amh-Ethi-Latn-2011.yaml +0 -138
- data/maps/alalc-ara-Arab-Latn-1997.yaml +0 -1287
- data/maps/alalc-asm-Deva-Latn-1997.yaml +0 -259
- data/maps/alalc-asm-Deva-Latn-2012.yaml +0 -55
- data/maps/alalc-aze-Arab-Latn-1997.yaml +0 -376
- data/maps/alalc-aze-Cyrl-Latn-1997.yaml +0 -145
- data/maps/alalc-bel-Cyrl-Latn-1997.yaml +0 -129
- data/maps/alalc-ben-Beng-Latn-1997.yaml +0 -291
- data/maps/alalc-ben-Beng-Latn-2017.yaml +0 -130
- data/maps/alalc-bul-Cyrl-Latn-1997.yaml +0 -98
- data/maps/alalc-div-Thaa-Latn-1997.yaml +0 -211
- data/maps/alalc-ell-Grek-Latn-1997.yaml +0 -628
- data/maps/alalc-ell-Grek-Latn-2010.yaml +0 -626
- data/maps/alalc-guj-Gujr-Latn-1997.yaml +0 -266
- data/maps/alalc-guj-Gujr-Latn-2011.yaml +0 -64
- data/maps/alalc-hin-Deva-Latn-1997.yaml +0 -303
- data/maps/alalc-hin-Deva-Latn-2011.yaml +0 -65
- data/maps/alalc-kan-Kana-Latn-1997.yaml +0 -274
- data/maps/alalc-kan-Kana-Latn-2011.yaml +0 -63
- data/maps/alalc-kat-Geok-Latn-1997.yaml +0 -111
- data/maps/alalc-kat-Geor-Latn-1997.yaml +0 -150
- data/maps/alalc-kor-Hang-Latn-1997.yaml +0 -98
- data/maps/alalc-mal-Mlym-Latn-1997.yaml +0 -303
- data/maps/alalc-mal-Mlym-Latn-2012.yaml +0 -73
- data/maps/alalc-mar-Deva-Latn-1997.yaml +0 -189
- data/maps/alalc-mar-Deva-Latn-2011.yaml +0 -45
- data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +0 -114
- data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +0 -103
- data/maps/alalc-mon-Cyrl-Latn-1997.yaml +0 -220
- data/maps/alalc-ori-Orya-Latn-1997.yaml +0 -284
- data/maps/alalc-ori-Orya-Latn-2011.yaml +0 -67
- data/maps/alalc-pan-Guru-Latn-1997.yaml +0 -256
- data/maps/alalc-pan-Guru-Latn-2011.yaml +0 -78
- data/maps/alalc-per-Arab-Latn-1997.yaml +0 -375
- data/maps/alalc-pli-Deva-Latn-2012.yaml +0 -144
- data/maps/alalc-pra-Deva-Latn-2012.yaml +0 -47
- data/maps/alalc-rus-Cyrl-Latn-1997.yaml +0 -225
- data/maps/alalc-rus-Cyrl-Latn-2012.yaml +0 -162
- data/maps/alalc-san-Deva-Latn-2012.yaml +0 -241
- data/maps/alalc-sin-Sinh-Latn-1997.yaml +0 -292
- data/maps/alalc-sin-Sinh-Latn-2011.yaml +0 -71
- data/maps/alalc-srp-Cyrl-Latn-1997.yaml +0 -118
- data/maps/alalc-srp-Cyrl-Latn-2013.yaml +0 -135
- data/maps/alalc-tam-Taml-Latn-1997.yaml +0 -62
- data/maps/alalc-tam-Taml-Latn-2011.yaml +0 -58
- data/maps/alalc-tel-Telu-Latn-1997.yaml +0 -284
- data/maps/alalc-tel-Telu-Latn-2011.yaml +0 -64
- data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +0 -145
- data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +0 -16
- data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +0 -283
- data/maps/az-aze-Cyrl-Latn-1939.yaml +0 -105
- data/maps/az-aze-Cyrl-Latn-1958.yaml +0 -45
- data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +0 -174
- data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +0 -169
- data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +0 -292
- data/maps/bgn-kor-Hang-Latn-1943.yaml +0 -35
- data/maps/bgn-kor-Kore-Latn-1943.yaml +0 -31
- data/maps/bgna-bul-Cyrl-Latn-2006.yaml +0 -208
- data/maps/bgna-bul-Cyrl-Latn-2009.yaml +0 -208
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +0 -532
- data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +0 -598
- data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +0 -108
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +0 -111
- data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +0 -188
- data/maps/bgnpcgn-bal-Arab-Latn-2008.yaml +0 -329
- data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +0 -289
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +0 -119
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +0 -42
- data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +0 -184
- data/maps/bgnpcgn-div-Thaa-Latn-1988.yaml +0 -75
- data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +0 -705
- data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +0 -23
- data/maps/bgnpcgn-far-Latn-Latn-1964.yaml +0 -28
- data/maps/bgnpcgn-fas-Arab-Latn-1956.yaml +0 -96
- data/maps/bgnpcgn-isl-Latn-Latn-1964.yaml +0 -37
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +0 -257
- data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +0 -131
- data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +0 -42
- data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.yaml +0 -247
- data/maps/bgnpcgn-kir-Cyrl-Latn-1979.yaml +0 -218
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +0 -253
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +0 -48
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +0 -48
- data/maps/bgnpcgn-kur-Arab-Latn-2007.yaml +0 -249
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +0 -163
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +0 -190
- data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +0 -223
- data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +0 -230
- data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +0 -338
- data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +0 -673
- data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +0 -459
- data/maps/bgnpcgn-pus-Arab-Latn-1968.yaml +0 -377
- data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +0 -168
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +0 -318
- data/maps/bgnpcgn-srp-Cyrl-Latn-1962.yaml +0 -73
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +0 -170
- data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +0 -220
- data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +0 -240
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +0 -166
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +0 -119
- data/maps/bgnpcgn-urd-Arab-Latn-2007.yaml +0 -459
- data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +0 -127
- data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +0 -82
- data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +0 -7456
- data/maps/bis-asm-Beng-Latn-13194-1991.yaml +0 -159
- data/maps/bis-ben-Beng-Latn-13194-1991.yaml +0 -156
- data/maps/bis-dev-Deva-Latn-13194-1991.yaml +0 -184
- data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +0 -181
- data/maps/bis-kan-Kana-Latn-13194-1991.yaml +0 -173
- data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +0 -176
- data/maps/bis-ori-Orya-Latn-13194-1991.yaml +0 -175
- data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +0 -175
- data/maps/bis-tel-Telu-Latn-13194-1991.yaml +0 -170
- data/maps/bis-tml-Taml-Latn-13194-1991.yaml +0 -155
- data/maps/by-bel-Cyrl-Latn-1998.yaml +0 -172
- data/maps/by-bel-Cyrl-Latn-2007.yaml +0 -115
- data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +0 -899
- data/maps/din-hin-Deva-Latn-33904-2018.yaml +0 -100
- data/maps/din-kat-Geor-Latn-32707-2010.yaml +0 -145
- data/maps/din-mar-Deva-Latn-33904-2018.yaml +0 -84
- data/maps/din-nep-Deva-Latn-33904-2018.yaml +0 -119
- data/maps/din-pli-Deva-Latn-33904-2018.yaml +0 -75
- data/maps/din-pra-Deva-Latn-33904-2018.yaml +0 -63
- data/maps/din-san-Deva-Latn-33904-2018.yaml +0 -338
- data/maps/din-tam-Taml-Latn-33903-2016.yaml +0 -213
- data/maps/dos-nep-Deva-Latn-1997.yaml +0 -47
- data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +0 -684
- data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +0 -680
- data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +0 -19
- data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +0 -31
- data/maps/ggg-kat-Geor-Latn-2002.yaml +0 -92
- data/maps/gki-bel-Cyrl-Latn-1992.yaml +0 -33
- data/maps/gki-bel-Cyrl-Latn-2000.yaml +0 -201
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +0 -190
- data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +0 -157
- data/maps/hk-yue-Hani-Latn-1888.yaml +0 -38497
- data/maps/icao-bel-Cyrl-Latn-9303.yaml +0 -136
- data/maps/icao-bul-Cyrl-Latn-9303.yaml +0 -118
- data/maps/icao-fas-Arab-Latn-9303.yaml +0 -103
- data/maps/icao-heb-Hebr-Latn-9303.yaml +0 -151
- data/maps/icao-mkd-Cyrl-Latn-9303.yaml +0 -117
- data/maps/icao-rus-Cyrl-Latn-9303.yaml +0 -117
- data/maps/icao-srp-Cyrl-Latn-9303.yaml +0 -117
- data/maps/icao-ukr-Cyrl-Latn-9303.yaml +0 -119
- data/maps/iso-ara-Arab-Latn-233-1984.yaml +0 -323
- data/maps/iso-asm-Beng-Latn-15919-2001.yaml +0 -75
- data/maps/iso-ben-Beng-Latn-15919-2001.yaml +0 -175
- data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +0 -613
- data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +0 -44
- data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +0 -220
- data/maps/iso-hin-Deva-Latn-15919-2001.yaml +0 -87
- data/maps/iso-inc-Deva-Latn-15919-2001.yaml +0 -61
- data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +0 -66
- data/maps/iso-kan-Kana-Latn-15919-2001.yaml +0 -220
- data/maps/iso-kat-Geor-Latn-9984-1996.yaml +0 -145
- data/maps/iso-kor-Hang-Latn-1996-method1.yaml +0 -240
- data/maps/iso-kor-Hang-Latn-1996-method2.yaml +0 -226
- data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +0 -281
- data/maps/iso-mar-Deva-Latn-15919-2001.yaml +0 -75
- data/maps/iso-nep-Deva-Latn-15919-2001.yaml +0 -87
- data/maps/iso-ori-Orya-Latn-15919-2001.yaml +0 -193
- data/maps/iso-pan-Guru-Latn-15919-2001.yaml +0 -222
- data/maps/iso-pli-Beng-Latn-15919-2001.yaml +0 -73
- data/maps/iso-pli-Deva-Latn-15919-2001.yaml +0 -74
- data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +0 -219
- data/maps/iso-pli-Thai-Latn-15919-2001.yaml +0 -55
- data/maps/iso-pra-Deva-Latn-15919-2001.yaml +0 -59
- data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +0 -366
- data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +0 -271
- data/maps/iso-san-Deva-Latn-15919-2001.yaml +0 -220
- data/maps/iso-tam-Taml-Latn-15919-2001.yaml +0 -159
- data/maps/iso-tel-Telu-Latn-15919-2001.yaml +0 -220
- data/maps/iso-tha-Thai-Latn-11940-1998.yaml +0 -109
- data/maps/kp-kor-Hang-Latn-2002.yaml +0 -909
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +0 -44820
- data/maps/masm-mon-Cyrl-Latn-5217-2012.yaml +0 -163
- data/maps/masm-mon-Latn-Cyrl-5217-2012.yaml +0 -200
- data/maps/mext-jpn-Hrkt-Latn-1954.yaml +0 -411
- data/maps/moct-kor-Hang-Latn-2000.yaml +0 -807
- data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +0 -541
- data/maps/mv-div-Thaa-Latn-1987.yaml +0 -200
- data/maps/mvd-bel-Cyrl-Latn-2008.yaml +0 -225
- data/maps/mvd-bel-Cyrl-Latn-2010.yaml +0 -63
- data/maps/mvd-rus-Cyrl-Latn-2008.yaml +0 -109
- data/maps/mvd-rus-Cyrl-Latn-2010.yaml +0 -37
- data/maps/odni-ara-Arab-Latn-2004.yaml +0 -137
- data/maps/odni-ara-Arab-Latn-2015.yaml +0 -315
- data/maps/odni-aze-Cyrl-Latn-2015.yaml +0 -144
- data/maps/odni-bel-Cyrl-Latn-2015.yaml +0 -148
- data/maps/odni-bul-Cyrl-Latn-2005.yaml +0 -90
- data/maps/odni-bul-Cyrl-Latn-2015.yaml +0 -96
- data/maps/odni-che-Cyrl-Latn-2015.yaml +0 -169
- data/maps/odni-fas-Arab-Latn-2004.yaml +0 -276
- data/maps/odni-fas-Arab-Latn-2015.yaml +0 -406
- data/maps/odni-hin-Deva-Latn-2004.yaml +0 -182
- data/maps/odni-hin-Deva-Latn-2015.yaml +0 -258
- data/maps/odni-kat-Geor-Latn-2015.yaml +0 -87
- data/maps/odni-kaz-Cyrl-Latn-2015.yaml +0 -148
- data/maps/odni-kir-Cyrl-Latn-2015.yaml +0 -136
- data/maps/odni-kor-Hang-Latn-2015.yaml +0 -375
- data/maps/odni-mkd-Cyrl-Latn-2005.yaml +0 -21
- data/maps/odni-mkd-Cyrl-Latn-2015.yaml +0 -122
- data/maps/odni-prs-Arab-Latn-2004.yaml +0 -123
- data/maps/odni-prs-Arab-Latn-2015.yaml +0 -228
- data/maps/odni-rus-Cyrl-Latn-2015.yaml +0 -77
- data/maps/odni-srp-Cyrl-Latn-2005.yaml +0 -36
- data/maps/odni-srp-Cyrl-Latn-2015.yaml +0 -129
- data/maps/odni-tat-Cyrl-Latn-2015.yaml +0 -142
- data/maps/odni-tgk-Cyrl-Latn-2015.yaml +0 -148
- data/maps/odni-tuk-Cyrl-Latn-2015.yaml +0 -170
- data/maps/odni-uig-Cyrl-Latn-2015.yaml +0 -138
- data/maps/odni-ukr-Cyrl-Latn-2015.yaml +0 -161
- data/maps/odni-urd-Arab-Latn-2015.yaml +0 -221
- data/maps/odni-uzb-Cyrl-Latn-2015.yaml +0 -166
- data/maps/royin-tha-Thai-Latn-1939-generic.yaml +0 -90
- data/maps/royin-tha-Thai-Latn-1968.yaml +0 -183
- data/maps/royin-tha-Thai-Latn-1999-chained.yaml +0 -180
- data/maps/royin-tha-Thai-Latn-1999.yaml +0 -80
- data/maps/sac-zho-Hans-Latn-1979.yaml +0 -24763
- data/maps/sasm-mon-Mong-Latn-general-1978.yaml +0 -389
- data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +0 -354
- data/maps/ses-ara-Arab-Latn-1930.yaml +0 -283
- data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +0 -222
- data/maps/ua-ukr-Cyrl-Latn-1996.yaml +0 -197
- data/maps/ua-ukr-Cyrl-Latn-2007.yaml +0 -75
- data/maps/ua-ukr-Cyrl-Latn-2010.yaml +0 -192
- data/maps/un-amh-Ethi-Latn-2016.yaml +0 -602
- data/maps/un-ara-Arab-Latn-1971.yaml +0 -139
- data/maps/un-ara-Arab-Latn-1972.yaml +0 -159
- data/maps/un-ara-Arab-Latn-2017.yaml +0 -420
- data/maps/un-asm-Beng-Latn-1972.yaml +0 -223
- data/maps/un-bel-Cyrl-Latn-2007.yaml +0 -114
- data/maps/un-ben-Beng-Latn-2016.yaml +0 -534
- data/maps/un-ell-Grek-Latn-1987-phonetic.yaml +0 -780
- data/maps/un-ell-Grek-Latn-1987-tl.yaml +0 -31
- data/maps/un-ell-Grek-Latn-1987-ts.yaml +0 -19
- data/maps/un-guj-Gujr-Latn-1972.yaml +0 -229
- data/maps/un-hin-Deva-Latn-2016.yaml +0 -316
- data/maps/un-kan-Kana-Latn-2016.yaml +0 -254
- data/maps/un-mal-Mlym-Latn-1972.yaml +0 -251
- data/maps/un-mar-Deva-Latn-2016.yaml +0 -102
- data/maps/un-mon-Mong-Latn-general-2013.yaml +0 -264
- data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +0 -264
- data/maps/un-nep-Deva-Latn-1972.yaml +0 -269
- data/maps/un-nep-Deva-Latn-2013.yaml +0 -74
- data/maps/un-ori-Orya-Latn-1972.yaml +0 -247
- data/maps/un-pan-Guru-Latn-1972.yaml +0 -402
- data/maps/un-prs-Arab-Latn-1967.yaml +0 -236
- data/maps/un-rus-Cyrl-Latn-1987.yaml +0 -166
- data/maps/un-tam-Taml-Latn-1972.yaml +0 -194
- data/maps/un-tel-Telu-Latn-1972.yaml +0 -270
- data/maps/un-ukr-Cyrl-Latn-1998.yaml +0 -53
- data/maps/un-ukr-Cyrl-Latn-2012.yaml +0 -162
- data/maps/un-urd-Arab-Latn-1972.yaml +0 -405
- data/maps/var-amh-Ethi-Latn-eae-2003.yaml +0 -466
- data/maps/var-gez-Ethi-Latn-eae-2003.yaml +0 -76
- data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +0 -221
- data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +0 -406
- data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +0 -386
- data/maps/var-kor-Hang-Hang-jamo.yaml +0 -11193
- data/maps/var-kor-Hang-Latn-mr-1939.yaml +0 -1054
- data/maps/var-kor-Kore-Hang-2013.yaml +0 -59754
- data/maps/var-kor-Kore-Latn-mr-1939.yaml +0 -36
- data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +0 -43
- data/maps/var-mon-Mong-Latn-1930.yaml +0 -102
- data/maps/var-mon-Mong-Latn-lessing.yaml +0 -272
- data/maps/var-mon-Mong-Latn-vpmc.yaml +0 -274
- data/maps/var-pra-Deva-Latn-iast-1912.yaml +0 -30
- data/maps/var-san-Deva-Latn-iast-1912.yaml +0 -149
- data/maps/var-tha-Thai-Thai-phonemic.yaml +0 -59
- data/maps/var-tha-Thai-Zsym-ipa.yaml +0 -301
- data/maps/var-zho-Hani-Latn-wd-1979.yaml +0 -38912
- data/spec/interscript/filenames_spec.rb +0 -21
- data/spec/interscript/mapping_spec.rb +0 -42
- data/spec/interscript_spec.rb +0 -37
- data/spec/spec_helper.rb +0 -3
@@ -1,163 +0,0 @@
|
|
1
|
-
---
|
2
|
-
authority_id: bgnpcgn
|
3
|
-
id: 1981
|
4
|
-
language: iso-639-2:mkd
|
5
|
-
source_script: Cyrl
|
6
|
-
destination_script: Latn
|
7
|
-
name: Macedonian Romanization, BGN/PCGN 1981 System
|
8
|
-
alias:
|
9
|
-
ogc11122:
|
10
|
-
code: mkd_Cyrl2Latn_BGN_1981
|
11
|
-
description: Macedonian US Board on Geographic Names(BGN)/Permanent Committee on Geographical Names for British Official Use(PCGN) 1981 System
|
12
|
-
url: https://github.com/riboseinc/interscript/files/4247920/USBGN_romanization_Macedonian_1981.pdf
|
13
|
-
creation_date: 1981
|
14
|
-
description: BGN/PCGN Romanization table for Macedonian.
|
15
|
-
|
16
|
-
tests:
|
17
|
-
- source: Ѓол
|
18
|
-
expected: Đol
|
19
|
-
- source: Јусек Тепеси
|
20
|
-
expected: Jusek Tepesi
|
21
|
-
- source: Љуги Ќарит
|
22
|
-
expected: Ljugi Ćarit
|
23
|
-
- source: Ќафа Сан
|
24
|
-
expected: Ćafa San
|
25
|
-
- source: Агроплод Ресен
|
26
|
-
expected: Agroplod Resen
|
27
|
-
- source: Алта Чука
|
28
|
-
expected: Alta Čuka
|
29
|
-
- source: Баш Тепе
|
30
|
-
expected: Baš Tepe
|
31
|
-
- source: Браќам
|
32
|
-
expected: Braćam
|
33
|
-
- source: Винарска Визба Агропин
|
34
|
-
expected: Vinarska Vizba Agropin
|
35
|
-
- source: Галичица
|
36
|
-
expected: Galičica
|
37
|
-
- source: Дрењево
|
38
|
-
expected: Drenjevo
|
39
|
-
- source: Енешево
|
40
|
-
expected: Eneševo
|
41
|
-
- source: Иберлија
|
42
|
-
expected: Iberlija
|
43
|
-
- source: Крмзи Су
|
44
|
-
expected: Krmzi Su
|
45
|
-
- source: Лесноски Рид
|
46
|
-
expected: Lesnoski Rid
|
47
|
-
- source: Мала Корабска Врата
|
48
|
-
expected: Mala Korabska Vrata
|
49
|
-
- source: Низок Врв
|
50
|
-
expected: Nizok Vrv
|
51
|
-
- source: Охридско Езеро
|
52
|
-
expected: Ohridsko Ezero
|
53
|
-
- source: Прлиќ
|
54
|
-
expected: Prlić
|
55
|
-
- source: Равна Гора
|
56
|
-
expected: Ravna Gora
|
57
|
-
- source: Сеѓавечкиот Рид
|
58
|
-
expected: Seđavečkiot Rid
|
59
|
-
- source: Трновите Њиве
|
60
|
-
expected: Trnovite Njive
|
61
|
-
- source: Фасов Рид
|
62
|
-
expected: Fasov Rid
|
63
|
-
- source: Црни Камен
|
64
|
-
expected: Crni Kamen
|
65
|
-
- source: Чатал Чешми
|
66
|
-
expected: Čatal Češmi
|
67
|
-
- source: Шехово
|
68
|
-
expected: Šehovo
|
69
|
-
|
70
|
-
notes:
|
71
|
-
- The character ѓ should be romanized g when it occurs before е and и. In other
|
72
|
-
instances, it should be romanized ǵ (Ǵ).
|
73
|
-
- The character ќ should be romanized k when it occurs before е and и. In other
|
74
|
-
instances, it should be romanized ć.
|
75
|
-
|
76
|
-
map:
|
77
|
-
rules:
|
78
|
-
- pattern: "Ѓ(?=[еЕиИ])"
|
79
|
-
result: "G"
|
80
|
-
- pattern: "ѓ(?=[еЕиИ])"
|
81
|
-
result: "g"
|
82
|
-
- pattern: "Ќ(?=[еЕиИ])"
|
83
|
-
result: "K"
|
84
|
-
- pattern: "ќ(?=[еЕиИ])"
|
85
|
-
result: "k"
|
86
|
-
|
87
|
-
postrules:
|
88
|
-
# DZ
|
89
|
-
- pattern: "((?<=[[:upper:]])Dz(?=[[:upper:]])?|(?<=[[:upper:]])?Dz(?=[[:upper:]]))"
|
90
|
-
result: "DZ"
|
91
|
-
#LJ
|
92
|
-
- pattern: "((?<=[[:upper:]])Lj(?=[[:upper:]])?|(?<=[[:upper:]])?Lj(?=[[:upper:]]))"
|
93
|
-
result: "LJ"
|
94
|
-
#NJ
|
95
|
-
- pattern: "((?<=[[:upper:]])Nj(?=[[:upper:]])?|(?<=[[:upper:]])?Nj(?=[[:upper:]]))"
|
96
|
-
result: "NJ"
|
97
|
-
#DŽ
|
98
|
-
- pattern: "((?<=[[:upper:]])Dž(?=[[:upper:]])?|(?<=[[:upper:]])?Dž(?=[[:upper:]]))"
|
99
|
-
result: "DŽ"
|
100
|
-
|
101
|
-
characters:
|
102
|
-
"\u0410": "A"
|
103
|
-
"\u0411": "B"
|
104
|
-
"\u0412": "V"
|
105
|
-
"\u0413": "G"
|
106
|
-
"\u0414": "D"
|
107
|
-
"\u0403": "\u0110" # Đ
|
108
|
-
"\u0415": "E"
|
109
|
-
"\u0416": "\u005a\u030c" # Ž
|
110
|
-
"\u0417": "Z"
|
111
|
-
"\u0405": "Dz"
|
112
|
-
"\u0418": "I"
|
113
|
-
"\u0408": "J"
|
114
|
-
"\u041A": "K"
|
115
|
-
"\u041B": "L"
|
116
|
-
"\u0409": "Lj"
|
117
|
-
"\u041C": "M"
|
118
|
-
"\u041D": "N"
|
119
|
-
"\u040A": "Nj"
|
120
|
-
"\u041E": "O"
|
121
|
-
"\u041F": "P"
|
122
|
-
"\u0420": "R"
|
123
|
-
"\u0421": "S"
|
124
|
-
"\u0422": "T"
|
125
|
-
"\u040c": "\u0106" # Ć
|
126
|
-
"\u0423": "U"
|
127
|
-
"\u0424": "F"
|
128
|
-
"\u0425": "H"
|
129
|
-
"\u0426": "C"
|
130
|
-
"\u0427": "\u0043\u030c" # Č
|
131
|
-
"\u040F": "D\u007a\u030c" # Dž
|
132
|
-
"\u0428": "\u0053\u030c" # Š
|
133
|
-
"\u0430": "a"
|
134
|
-
"\u0431": "b"
|
135
|
-
"\u0432": "v"
|
136
|
-
"\u0433": "g"
|
137
|
-
"\u0434": "d"
|
138
|
-
"\u0453": "\u0111" # đ
|
139
|
-
"\u0435": "e"
|
140
|
-
"\u0436": "\u007a\u030c" # ž
|
141
|
-
"\u0437": "z"
|
142
|
-
"\u0455": "dz"
|
143
|
-
"\u0438": "i"
|
144
|
-
"\u0458": "j"
|
145
|
-
"\u043A": "k"
|
146
|
-
"\u043B": "l"
|
147
|
-
"\u0459": "lj"
|
148
|
-
"\u043C": "m"
|
149
|
-
"\u043D": "n"
|
150
|
-
"\u045A": "nj"
|
151
|
-
"\u043E": "o"
|
152
|
-
"\u043F": "p"
|
153
|
-
"\u0440": "r"
|
154
|
-
"\u0441": "s"
|
155
|
-
"\u0442": "t"
|
156
|
-
"\u045c": "\u0107" # ć
|
157
|
-
"\u0443": "u"
|
158
|
-
"\u0444": "f"
|
159
|
-
"\u0445": "h"
|
160
|
-
"\u0446": "c"
|
161
|
-
"\u0447": "\u0063\u030c" # č
|
162
|
-
"\u045F": "d\u007a\u030c" # dž
|
163
|
-
"\u0448": "\u0073\u030c" # š
|
@@ -1,190 +0,0 @@
|
|
1
|
-
---
|
2
|
-
authority_id: bgnpcgn
|
3
|
-
id: 2013
|
4
|
-
language: iso-639-2:mkd
|
5
|
-
source_script: Cyrl
|
6
|
-
destination_script: Latn
|
7
|
-
name: Macedonian Romanization, BGN/PCGN 2013 System
|
8
|
-
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/811514/ROMANIZATION_OF_MACEDONIAN.pdf
|
9
|
-
creation_date: 2013
|
10
|
-
description: |
|
11
|
-
Macedonian was officially established as a written language in Yugoslavia during
|
12
|
-
World War II and is now the official language of North Macedonia.
|
13
|
-
This romanization system replaces the BGN/PCGN 1981 agreement and adheres
|
14
|
-
to the most widely-accepted standardization of Macedonian orthography.
|
15
|
-
|
16
|
-
notes:
|
17
|
-
- The Macedonian Cyrillic lowercase italic Д may sometimes be seen as g.
|
18
|
-
There is no specific Unicode encoding for this variant form so a comparable character
|
19
|
-
has been used here for illustrative purposes.
|
20
|
-
- The Macedonian Cyrillic lowercase italic Ѓ may sometimes be seen as ī.
|
21
|
-
There is no specific Unicode encoding for this variant form so a comparable character
|
22
|
-
has been used here for illustrative purposes.
|
23
|
-
- The Macedonian Cyrillic lowercase italic П may sometimes be seen as ū.
|
24
|
-
There is no specific Unicode encoding for this variant form so a comparable character
|
25
|
-
has been used here for illustrative purposes.
|
26
|
-
- The Macedonian Cyrillic lowercase italic Т may sometimes be seen as w̄.
|
27
|
-
There is no specific Unicode encoding for this variant form so a comparable character
|
28
|
-
has been used here for illustrative purposes.
|
29
|
-
- |
|
30
|
-
An inventory of letter-diacritic combinations, with their Unicode encoding,
|
31
|
-
in addition to the unmodified letters of the basic Roman script is:
|
32
|
-
| Ǵ (U+01F4) | ǵ (U+01F5) |
|
33
|
-
| Ž (U+017D) | ž (U+017E) |
|
34
|
-
| Dz (U+01F2)* | dz (U+01F3)* |
|
35
|
-
| Lj (U+01C8)* | lj (U+01C9)* |
|
36
|
-
| Nj (U+01CB)* | nj (U+01CC)* |
|
37
|
-
| Ḱ (U+1E30) | ḱ (U+1E31) |
|
38
|
-
| Č (U+010C) | č (U+010D) |
|
39
|
-
| Dž (U+01C5)* | dž (U+01C6)* |
|
40
|
-
| Š (U+0160) | š (U+0161) |
|
41
|
-
* Note that these characters can also be reproduced with individual letters (e.g. l+j).
|
42
|
-
- The Romanization column shows only lowercase forms but, when romanizing,
|
43
|
-
uppercase and lowercase Roman letters as appropriate should be used.
|
44
|
-
|
45
|
-
tests:
|
46
|
-
- source: Ѓенови Ливаѓе
|
47
|
-
expected: Ǵenovi Livaǵe
|
48
|
-
- source: ЛУЃЕ луѓе
|
49
|
-
expected: LUǴE luǵe
|
50
|
-
- source: ЅВЕЗДА ѕвезда Ѕвезда
|
51
|
-
expected: DZVEZDA dzvezda Dzvezda
|
52
|
-
- source: Јабежица
|
53
|
-
expected: Jabežica
|
54
|
-
- source: Љиќен и Бард
|
55
|
-
expected: Ljiḱen i Bard
|
56
|
-
- source: Ќамилов Чукар
|
57
|
-
expected: Ḱamilov Čukar
|
58
|
-
- source: Џавидин Кајнак
|
59
|
-
expected: Džavidin Kajnak
|
60
|
-
- source: Џамалџи
|
61
|
-
expected: Džamaldži
|
62
|
-
- source: Џибра Гури и Зи
|
63
|
-
expected: Džibra Guri i Zi
|
64
|
-
- source: Абазова Куќарица
|
65
|
-
expected: Abazova Kuḱarica
|
66
|
-
- source: Баба Анѓина Маала
|
67
|
-
expected: Baba Anǵina Maala
|
68
|
-
- source: Ваљановец
|
69
|
-
expected: Valjanovec
|
70
|
-
- source: Галал Једи Дереш
|
71
|
-
expected: Galal Jedi Dereš
|
72
|
-
- source: Дванаесет Клајнци
|
73
|
-
expected: Dvanaeset Klajnci
|
74
|
-
- source: Електродистрибуција Струга
|
75
|
-
expected: Elektrodistribucija Struga
|
76
|
-
- source: Железничка Станица Рајко Жинзифов
|
77
|
-
expected: Železnička Stanica Rajko Žinzifov
|
78
|
-
- source: Заедничко Речиште
|
79
|
-
expected: Zaedničko Rečište
|
80
|
-
- source: Испраена Плоча
|
81
|
-
expected: Ispraena Ploča
|
82
|
-
- source: Казнено-Поправна Установа Идризово
|
83
|
-
expected: Kazneno-Popravna Ustanova Idrizovo
|
84
|
-
- source: Лази и Зејнелит
|
85
|
-
expected: Lazi i Zejnelit
|
86
|
-
- source: Мавровско Езеро
|
87
|
-
expected: Mavrovsko Ezero
|
88
|
-
- source: Национален Парк Галичица
|
89
|
-
expected: Nacionalen Park Galičica
|
90
|
-
- source: Одморалиште Свети Стефан
|
91
|
-
expected: Odmoralište Sveti Stefan
|
92
|
-
- source: Планинарски Дом Караџица
|
93
|
-
expected: Planinarski Dom Karadžica
|
94
|
-
- source: Раса е Лисењит
|
95
|
-
expected: Rasa e Lisenjit
|
96
|
-
- source: Скочивирска Клисура
|
97
|
-
expected: Skočivirska Klisura
|
98
|
-
- source: Термо-електроцентрала Неготино
|
99
|
-
expected: Termo-elektrocentrala Negotino
|
100
|
-
- source: Узуновско Бресје
|
101
|
-
expected: Uzunovsko Bresje
|
102
|
-
- source: Фабрика Југохром
|
103
|
-
expected: Fabrika Jugohrom
|
104
|
-
- source: Хидроелектрана Сапунџица
|
105
|
-
expected: Hidroelektrana Sapundžica
|
106
|
-
- source: Цветковско Рамниште
|
107
|
-
expected: Cvetkovsko Ramnište
|
108
|
-
- source: Чалтанова Пештера
|
109
|
-
expected: Čaltanova Peštera
|
110
|
-
- source: Шкемби Вишнејц
|
111
|
-
expected: Škembi Višnejc
|
112
|
-
|
113
|
-
map:
|
114
|
-
postrules:
|
115
|
-
# DZ
|
116
|
-
- pattern: "((?<=[[:upper:]])Dz(?=[[:upper:]])?|(?<=[[:upper:]])?Dz(?=[[:upper:]]))"
|
117
|
-
result: "DZ"
|
118
|
-
#LJ
|
119
|
-
- pattern: "((?<=[[:upper:]])Lj(?=[[:upper:]])?|(?<=[[:upper:]])?Lj(?=[[:upper:]]))"
|
120
|
-
result: "LJ"
|
121
|
-
#NJ
|
122
|
-
- pattern: "((?<=[[:upper:]])Nj(?=[[:upper:]])?|(?<=[[:upper:]])?Nj(?=[[:upper:]]))"
|
123
|
-
result: "NJ"
|
124
|
-
#DŽ
|
125
|
-
- pattern: "((?<=[[:upper:]])Dž(?=[[:upper:]])?|(?<=[[:upper:]])?Dž(?=[[:upper:]]))"
|
126
|
-
result: "DŽ"
|
127
|
-
|
128
|
-
characters:
|
129
|
-
"\u0410": "A"
|
130
|
-
"\u0411": "B"
|
131
|
-
"\u0412": "V"
|
132
|
-
"\u0413": "G"
|
133
|
-
"\u0414": "D"
|
134
|
-
"\u0403": "\u01F4" # Ǵ
|
135
|
-
"\u0415": "E"
|
136
|
-
"\u0416": "\u005a\u030c" # Ž
|
137
|
-
"\u0417": "Z"
|
138
|
-
"\u0405": "Dz"
|
139
|
-
"\u0418": "I"
|
140
|
-
"\u0408": "J"
|
141
|
-
"\u041A": "K"
|
142
|
-
"\u041B": "L"
|
143
|
-
"\u0409": "Lj"
|
144
|
-
"\u041C": "M"
|
145
|
-
"\u041D": "N"
|
146
|
-
"\u040A": "Nj"
|
147
|
-
"\u041E": "O"
|
148
|
-
"\u041F": "P"
|
149
|
-
"\u0420": "R"
|
150
|
-
"\u0421": "S"
|
151
|
-
"\u0422": "T"
|
152
|
-
"\u040C": "\u004b\u0301" # Ḱ
|
153
|
-
"\u0423": "U"
|
154
|
-
"\u0424": "F"
|
155
|
-
"\u0425": "H"
|
156
|
-
"\u0426": "C"
|
157
|
-
"\u0427": "\u0043\u030c" # Č
|
158
|
-
"\u040F": "D\u007a\u030c" # Dž
|
159
|
-
"\u0428": "\u0053\u030c" # Š
|
160
|
-
"\u0430": "a"
|
161
|
-
"\u0431": "b"
|
162
|
-
"\u0432": "v"
|
163
|
-
"\u0433": "g"
|
164
|
-
"\u0434": "d"
|
165
|
-
"\u0453": "\u01F5" # ǵ
|
166
|
-
"\u0435": "e"
|
167
|
-
"\u0436": "\u007a\u030c" # ž
|
168
|
-
"\u0437": "z"
|
169
|
-
"\u0455": "dz"
|
170
|
-
"\u0438": "i"
|
171
|
-
"\u0458": "j"
|
172
|
-
"\u043A": "k"
|
173
|
-
"\u043B": "l"
|
174
|
-
"\u0459": "lj"
|
175
|
-
"\u043C": "m"
|
176
|
-
"\u043D": "n"
|
177
|
-
"\u045A": "nj"
|
178
|
-
"\u043E": "o"
|
179
|
-
"\u043F": "p"
|
180
|
-
"\u0440": "r"
|
181
|
-
"\u0441": "s"
|
182
|
-
"\u0442": "t"
|
183
|
-
"\u045C": "\u1E31" # ḱ
|
184
|
-
"\u0443": "u"
|
185
|
-
"\u0444": "f"
|
186
|
-
"\u0445": "h"
|
187
|
-
"\u0446": "c"
|
188
|
-
"\u0447": "\u0063\u030c" # č
|
189
|
-
"\u045F": "d\u007a\u030c" # dž
|
190
|
-
"\u0448": "\u0073\u030c" # š
|
@@ -1,223 +0,0 @@
|
|
1
|
-
---
|
2
|
-
authority_id: bgnpcgn
|
3
|
-
id: 1964
|
4
|
-
language: iso-639-2:mon
|
5
|
-
source_script: Cyrl
|
6
|
-
destination_script: Latn
|
7
|
-
name: BGN/PCGN 1964 System
|
8
|
-
alias:
|
9
|
-
ogc11122:
|
10
|
-
code: mon_Cyrl2Latn_BGN_1964
|
11
|
-
description: Mongolian US Board on Geographic Names(BGN)/Permanent Committee on Geographical Names for British Official Use(PCGN) 1964 System
|
12
|
-
url: https://github.com/interscript/interscript/files/5180767/BGN_Romanization_Guide_1964_mongolian_1964.pdf
|
13
|
-
creation_date:
|
14
|
-
confirmation_date:
|
15
|
-
description: |
|
16
|
-
This system was originated by the PCGN in 1957 and adopted as a
|
17
|
-
BGN/PCGN System in 1964. It is intended for use in the romanization of
|
18
|
-
geographic names in the "Mongolian People's Republic" but not to romanize
|
19
|
-
Mongolian names in adjacent parts of China and the U.S.S.R.
|
20
|
-
|
21
|
-
notes: |
|
22
|
-
- b occurs initially and after л, м, and б.
|
23
|
-
- v occurs medially in Mongolian words and initially in foreign words.
|
24
|
-
- y occurs only as the second element of diphthongs.
|
25
|
-
- k, p, f, and shch occur in foreign words only.
|
26
|
-
- "\u2019" occurs only in Russian words.
|
27
|
-
- ï occurs only in suffixes to words containing back vowels (a, o, and u).
|
28
|
-
- In monosyllables yu or yü depending on pronunciation; in polysyllables yu when followed by a, o, or u, but yü when followed by i, e, ö, or ü.
|
29
|
-
|
30
|
-
tests:
|
31
|
-
- source: Эрдэнэт Сум
|
32
|
-
expected: Erdenet Sum
|
33
|
-
- source: Эрдэнэт
|
34
|
-
expected: Erdenet
|
35
|
-
- source: Эрдэнэ
|
36
|
-
expected: Erdene
|
37
|
-
- source: Шивээговь Сум
|
38
|
-
expected: Shiveegovĭ Sum
|
39
|
-
- source: Шивээговь
|
40
|
-
expected: Shiveegovĭ
|
41
|
-
- source: Шарынгол Сум
|
42
|
-
expected: Sharïngol Sum
|
43
|
-
- source: Шарынгол
|
44
|
-
expected: Sharïngol
|
45
|
-
- source: Цагааннуур
|
46
|
-
expected: Tsagaannuur
|
47
|
-
- source: Хонгор Сум
|
48
|
-
expected: Hongor Sum
|
49
|
-
- source: Хонгор
|
50
|
-
expected: Hongor
|
51
|
-
- source: Хайлаастай
|
52
|
-
expected: Haylaastay
|
53
|
-
- source: Түнэл Сум
|
54
|
-
expected: Tünel Sum
|
55
|
-
- source: Түнэл
|
56
|
-
expected: Tünel
|
57
|
-
- source: Сүхбаатар
|
58
|
-
expected: Sühbaatar
|
59
|
-
- source: Сүмбэр Сум
|
60
|
-
expected: Sümber Sum
|
61
|
-
- source: Сүмбэр
|
62
|
-
expected: Sümber
|
63
|
-
- source: Сайншанд Сум
|
64
|
-
expected: Saynshand Sum
|
65
|
-
- source: Сайншанд
|
66
|
-
expected: Saynshand
|
67
|
-
- source: Орхон Сум
|
68
|
-
expected: Orhon Sum
|
69
|
-
- source: Орхон
|
70
|
-
expected: Orhon
|
71
|
-
- source: Нарст
|
72
|
-
expected: Narst
|
73
|
-
- source: Мөрөн Сум
|
74
|
-
expected: Mörön Sum
|
75
|
-
- source: Мөрөн
|
76
|
-
expected: Mörön
|
77
|
-
- source: Зүүнхөвөө
|
78
|
-
expected: Dzüünhövöö
|
79
|
-
- source: Жаргалант Сум
|
80
|
-
expected: Jargalant Sum
|
81
|
-
- source: Жаргалант
|
82
|
-
expected: Jargalant
|
83
|
-
- source: Дархан Сум
|
84
|
-
expected: Darhan Sum
|
85
|
-
- source: Даланзадгад Сум
|
86
|
-
expected: Dalandzadgad Sum
|
87
|
-
- source: Даланзадгад
|
88
|
-
expected: Dalandzadgad
|
89
|
-
- source: Давст Сум
|
90
|
-
expected: Davst Sum
|
91
|
-
- source: Давст
|
92
|
-
expected: Davst
|
93
|
-
- source: Говьсүмбэр Сум
|
94
|
-
expected: Govĭsümber Sum
|
95
|
-
- source: Говь
|
96
|
-
expected: Govĭ
|
97
|
-
- source: Буга
|
98
|
-
expected: Buga
|
99
|
-
- source: Бор-Өндөр Сум
|
100
|
-
expected: Bor-Öndör Sum
|
101
|
-
- source: Бор-Өндөр
|
102
|
-
expected: Bor-Öndör
|
103
|
-
- source: Баянхонгор
|
104
|
-
expected: Bayanhongor
|
105
|
-
- source: Баянтал
|
106
|
-
expected: Bayantal
|
107
|
-
- source: Баяндэлгэр Сум
|
108
|
-
expected: Bayandelger Sum
|
109
|
-
- source: Баяндэлгэр
|
110
|
-
expected: Bayandelger
|
111
|
-
- source: Баян-Өндөр Сум
|
112
|
-
expected: Bayan-Öndör Sum
|
113
|
-
- source: Баруун-Урт Сум
|
114
|
-
expected: Baruun-Urt Sum
|
115
|
-
- source: Баруун-Урт
|
116
|
-
expected: Baruun-Urt
|
117
|
-
- source: Архуст
|
118
|
-
expected: Arhust
|
119
|
-
- source: Арвайхээр Сум
|
120
|
-
expected: Arvayheer Sum
|
121
|
-
- source: Арвайхээр
|
122
|
-
expected: Arvayheer
|
123
|
-
- source: Есөнбулаг Сум
|
124
|
-
expected: Yösönbulag Sum
|
125
|
-
- source: Ерөө Сум
|
126
|
-
expected: Yöröö Sum
|
127
|
-
- source: Есөнзүйл Сум
|
128
|
-
expected: Yösöndzüyl Sum
|
129
|
-
- source: Ноён Сум
|
130
|
-
expected: Noyon Sum
|
131
|
-
- source: Родник Балянгийн-Булак
|
132
|
-
expected: Rodnik Balyangiyn-Bulak
|
133
|
-
- source: Замын-Үүд Сум
|
134
|
-
expected: Dzamïn-Üüd Sum
|
135
|
-
- source: Адаацаг Сум
|
136
|
-
expected: Adaatsag Sum
|
137
|
-
- source: Чандмань Сум
|
138
|
-
expected: Chandmanĭ Sum
|
139
|
-
- source: Хяргас Сум
|
140
|
-
expected: Hyargas Sum
|
141
|
-
|
142
|
-
map:
|
143
|
-
rules:
|
144
|
-
- pattern: \u042e(?=[АаОоУу]) # Ю before а, о, or у
|
145
|
-
result: "Yu"
|
146
|
-
- pattern: \u044e(?=[АаОоУу]) # ю before а, о, or у
|
147
|
-
result: "yu"
|
148
|
-
- pattern: \u042e(?=[ИиЭэӨөҮү]) # Ю before и, э, ө, or ү
|
149
|
-
result: "Yü"
|
150
|
-
- pattern: \u044e(?=[ИиЭэӨөҮү]) # ю before и, э, ө, or ү
|
151
|
-
result: "yü"
|
152
|
-
|
153
|
-
characters:
|
154
|
-
"А": "A" # \u0410
|
155
|
-
"Б": "B" # \u0411
|
156
|
-
"В": "V" # \u0412
|
157
|
-
"Г": "G" # \u0413
|
158
|
-
"Д": "D" # \u0414
|
159
|
-
"Е": "Yö" # \u0415
|
160
|
-
"Ё": "Yo" # \u0401
|
161
|
-
"Ж": "J" # \u0416
|
162
|
-
"З": "Dz" # \u0417
|
163
|
-
"И": "I" # \u0418
|
164
|
-
"Й": "Y" # \u0419
|
165
|
-
"К": "K" # \u041a
|
166
|
-
"Л": "L" # \u041b
|
167
|
-
"М": "M" # \u041c
|
168
|
-
"Н": "N" # \u041d
|
169
|
-
"О": "O" # \u041e
|
170
|
-
"Ө": "Ö" # \u04e8
|
171
|
-
"П": "P" # \u041f
|
172
|
-
"Р": "R" # \u0420
|
173
|
-
"С": "S" # \u0421
|
174
|
-
"Т": "T" # \u0422
|
175
|
-
"У": "U" # \u0423
|
176
|
-
"Ү": "Ü" # \u04ae
|
177
|
-
"Ф": "F" # \u0424
|
178
|
-
"Х": "H" # \u0425
|
179
|
-
"Ц": "Ts" # \u0426
|
180
|
-
"Ч": "Ch" # \u0427
|
181
|
-
"Ш": "Sh" # \u0428
|
182
|
-
"Щ": "Shch" # \u0429
|
183
|
-
"Ъ": "\u2019" # \u042a
|
184
|
-
"Ы": "Ï" # \u042b
|
185
|
-
"Ь": "Ĭ" # \u042c
|
186
|
-
"Э": "E" # \u042d
|
187
|
-
"Ю": "Yu" # \u042e
|
188
|
-
"Я": "Ya" # \u042f
|
189
|
-
"а": "a" # \u0430
|
190
|
-
"б": "b" # \u0431
|
191
|
-
"в": "v" # \u0432
|
192
|
-
"г": "g" # \u0433
|
193
|
-
"д": "d" # \u0434
|
194
|
-
"е": "yö" # \u0435
|
195
|
-
"ё": "yo" # \u0451
|
196
|
-
"ж": "j" # \u0436
|
197
|
-
"з": "dz" # \u0437
|
198
|
-
"и": "i" # \u0438
|
199
|
-
"й": "y" # \u0439
|
200
|
-
"к": "k" # \u043a
|
201
|
-
"л": "l" # \u043b
|
202
|
-
"м": "m" # \u043c
|
203
|
-
"н": "n" # \u043d
|
204
|
-
"о": "o" # \u043e
|
205
|
-
"ө": "ö" # \u04e9
|
206
|
-
"п": "p" # \u043f
|
207
|
-
"р": "r" # \u0440
|
208
|
-
"с": "s" # \u0441
|
209
|
-
"т": "t" # \u0442
|
210
|
-
"у": "u" # \u0443
|
211
|
-
"ү": "ü" # \u04af
|
212
|
-
"ф": "f" # \u0444
|
213
|
-
"х": "h" # \u0445
|
214
|
-
"ц": "ts" # \u0446
|
215
|
-
"ч": "ch" # \u0447
|
216
|
-
"ш": "sh" # \u0448
|
217
|
-
"щ": "shch" # \u0449
|
218
|
-
"ъ": "\u2019" # \u044a
|
219
|
-
"ы": "ï" # \u044b
|
220
|
-
"ь": "ĭ" # \u044c
|
221
|
-
"э": "e" # \u044d
|
222
|
-
"ю": "yu" # \u044e
|
223
|
-
"я": "ya" # \u044f
|