interscript 0.1.7 → 2.1.0b1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/.gitignore +11 -0
- data/.rspec +3 -0
- data/Gemfile +29 -0
- data/LICENSE.adoc +31 -0
- data/README.md +3 -0
- data/Rakefile +116 -0
- data/bin/console +14 -0
- data/bin/interscript +5 -0
- data/bin/maps_analyze_staging +168 -0
- data/bin/maps_debug_compilers +58 -0
- data/bin/maps_debug_ordering +88 -0
- data/bin/maps_debug_ruby_compile +24 -0
- data/bin/maps_debug_step_by_step +44 -0
- data/bin/maps_optimize_order +112 -0
- data/bin/maps_v1_analyze_regexps +45 -0
- data/bin/maps_v1_to_v2 +426 -0
- data/bin/setup +8 -0
- data/exe/interscript +6 -0
- data/interscript.gemspec +31 -0
- data/lib/interscript.rb +83 -133
- data/lib/interscript/command.rb +5 -5
- data/lib/interscript/compiler.rb +22 -0
- data/lib/interscript/compiler/javascript.rb +292 -0
- data/lib/interscript/compiler/ruby.rb +262 -0
- data/lib/interscript/dsl.rb +68 -0
- data/lib/interscript/dsl/aliases.rb +23 -0
- data/lib/interscript/dsl/document.rb +46 -0
- data/lib/interscript/dsl/group.rb +45 -0
- data/lib/interscript/dsl/group/parallel.rb +6 -0
- data/lib/interscript/dsl/items.rb +89 -0
- data/lib/interscript/dsl/metadata.rb +68 -0
- data/lib/interscript/dsl/stage.rb +6 -0
- data/lib/interscript/dsl/symbol_mm.rb +11 -0
- data/lib/interscript/dsl/tests.rb +12 -0
- data/lib/interscript/interpreter.rb +251 -0
- data/lib/interscript/node.rb +25 -0
- data/lib/interscript/node/alias_def.rb +15 -0
- data/lib/interscript/node/dependency.rb +13 -0
- data/lib/interscript/node/document.rb +45 -0
- data/lib/interscript/node/group.rb +34 -0
- data/lib/interscript/node/group/parallel.rb +9 -0
- data/lib/interscript/node/group/sequential.rb +2 -0
- data/lib/interscript/node/item.rb +52 -0
- data/lib/interscript/node/item/alias.rb +42 -0
- data/lib/interscript/node/item/any.rb +76 -0
- data/lib/interscript/node/item/capture.rb +50 -0
- data/lib/interscript/node/item/group.rb +51 -0
- data/lib/interscript/node/item/repeat.rb +40 -0
- data/lib/interscript/node/item/stage.rb +23 -0
- data/lib/interscript/node/item/string.rb +51 -0
- data/lib/interscript/node/metadata.rb +18 -0
- data/lib/interscript/node/rule.rb +6 -0
- data/lib/interscript/node/rule/funcall.rb +18 -0
- data/lib/interscript/node/rule/run.rb +15 -0
- data/lib/interscript/node/rule/sub.rb +68 -0
- data/lib/interscript/node/stage.rb +19 -0
- data/lib/interscript/node/tests.rb +15 -0
- data/lib/interscript/stdlib.rb +211 -0
- data/lib/interscript/utils/regexp_converter.rb +283 -0
- data/lib/interscript/version.rb +1 -1
- data/lib/interscript/visualize.rb +61 -0
- data/lib/interscript/visualize/group.html.erb +59 -0
- data/lib/interscript/visualize/json.rb +57 -0
- data/lib/interscript/visualize/map.html.erb +46 -0
- data/lib/interscript/visualize/nodes.rb +89 -0
- data/requirements.txt +1 -0
- metadata +78 -416
- data/README.adoc +0 -298
- data/lib/g2pwrapper.py +0 -34
- data/lib/interscript/fs.rb +0 -69
- data/lib/interscript/mapping.rb +0 -142
- data/lib/interscript/opal.rb +0 -57
- data/lib/interscript/opal/entrypoint.rb +0 -12
- data/lib/interscript/opal/map_translate.rb +0 -7
- data/lib/interscript/opal/maps.js.erb +0 -10
- data/lib/model-7 +0 -0
- data/lib/tha-pt-b-7 +0 -0
- data/maps/acadsin-zho-Hani-Latn-2002.yaml +0 -38916
- data/maps/alalc-amh-Ethi-Latn-1997.yaml +0 -513
- data/maps/alalc-amh-Ethi-Latn-2011.yaml +0 -138
- data/maps/alalc-ara-Arab-Latn-1997.yaml +0 -1287
- data/maps/alalc-asm-Deva-Latn-1997.yaml +0 -165
- data/maps/alalc-asm-Deva-Latn-2012.yaml +0 -40
- data/maps/alalc-aze-Cyrl-Latn-1997.yaml +0 -145
- data/maps/alalc-bel-Cyrl-Latn-1997.yaml +0 -129
- data/maps/alalc-ben-Beng-Latn-2017.yaml +0 -130
- data/maps/alalc-bul-Cyrl-Latn-1997.yaml +0 -98
- data/maps/alalc-ell-Grek-Latn-1997.yaml +0 -628
- data/maps/alalc-ell-Grek-Latn-2010.yaml +0 -626
- data/maps/alalc-guj-Gujr-Latn-1997.yaml +0 -266
- data/maps/alalc-guj-Gujr-Latn-2011.yaml +0 -64
- data/maps/alalc-hin-Deva-Latn-1997.yaml +0 -211
- data/maps/alalc-hin-Deva-Latn-2011.yaml +0 -47
- data/maps/alalc-kat-Geok-Latn-1997.yaml +0 -111
- data/maps/alalc-kat-Geor-Latn-1997.yaml +0 -150
- data/maps/alalc-kor-Hang-Latn-1997.yaml +0 -98
- data/maps/alalc-mal-Mlym-Latn-1997.yaml +0 -303
- data/maps/alalc-mal-Mlym-Latn-2012.yaml +0 -73
- data/maps/alalc-mar-Deva-Latn-1997.yaml +0 -189
- data/maps/alalc-mar-Deva-Latn-2011.yaml +0 -45
- data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +0 -114
- data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +0 -103
- data/maps/alalc-mon-Cyrl-Latn-1997.yaml +0 -220
- data/maps/alalc-pan-Guru-Latn-1997.yaml +0 -256
- data/maps/alalc-pan-Guru-Latn-2011.yaml +0 -78
- data/maps/alalc-per-Arab-Latn-1997.yaml +0 -375
- data/maps/alalc-pli-Deva-Latn-2012.yaml +0 -144
- data/maps/alalc-pra-Deva-Latn-2012.yaml +0 -47
- data/maps/alalc-rus-Cyrl-Latn-1997.yaml +0 -225
- data/maps/alalc-rus-Cyrl-Latn-2012.yaml +0 -162
- data/maps/alalc-san-Deva-Latn-2012.yaml +0 -172
- data/maps/alalc-sin-Sinh-Latn-1997.yaml +0 -292
- data/maps/alalc-sin-Sinh-Latn-2011.yaml +0 -71
- data/maps/alalc-srp-Cyrl-Latn-1997.yaml +0 -118
- data/maps/alalc-srp-Cyrl-Latn-2013.yaml +0 -135
- data/maps/alalc-tam-Taml-Latn-1997.yaml +0 -62
- data/maps/alalc-tam-Taml-Latn-2011.yaml +0 -58
- data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +0 -145
- data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +0 -16
- data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +0 -283
- data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +0 -174
- data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +0 -169
- data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +0 -292
- data/maps/bgn-kor-Hang-Latn-1943.yaml +0 -35
- data/maps/bgn-kor-Kore-Latn-1943.yaml +0 -31
- data/maps/bgna-bul-Cyrl-Latn-2006.yaml +0 -208
- data/maps/bgna-bul-Cyrl-Latn-2009.yaml +0 -208
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +0 -532
- data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +0 -596
- data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +0 -108
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +0 -104
- data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +0 -188
- data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +0 -289
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +0 -119
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +0 -42
- data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +0 -184
- data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +0 -705
- data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +0 -23
- data/maps/bgnpcgn-fas-Arab-Latn-1956.yaml +0 -96
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +0 -257
- data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +0 -131
- data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +0 -42
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +0 -253
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +0 -48
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +0 -48
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +0 -163
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +0 -190
- data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +0 -223
- data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +0 -230
- data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +0 -336
- data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +0 -639
- data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +0 -459
- data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +0 -168
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +0 -318
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +0 -170
- data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +0 -220
- data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +0 -240
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +0 -166
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +0 -119
- data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +0 -127
- data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +0 -82
- data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +0 -7456
- data/maps/bis-asm-Beng-Latn-13194-1991.yaml +0 -159
- data/maps/bis-ben-Beng-Latn-13194-1991.yaml +0 -156
- data/maps/bis-dev-Deva-Latn-13194-1991.yaml +0 -184
- data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +0 -181
- data/maps/bis-knd-Knda-Latn-13194-1991.yaml +0 -173
- data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +0 -176
- data/maps/bis-ori-Orya-Latn-13194-1991.yaml +0 -160
- data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +0 -175
- data/maps/bis-tel-Telu-Latn-13194-1991.yaml +0 -170
- data/maps/bis-tml-Taml-Latn-13194-1991.yaml +0 -155
- data/maps/by-bel-Cyrl-Latn-1998.yaml +0 -172
- data/maps/by-bel-Cyrl-Latn-2007.yaml +0 -115
- data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +0 -899
- data/maps/din-hin-Deva-Latn-33904-2018.yaml +0 -100
- data/maps/din-kat-Geor-Latn-32707-2010.yaml +0 -145
- data/maps/din-mar-Deva-Latn-33904-2018.yaml +0 -84
- data/maps/din-nep-Deva-Latn-33904-2018.yaml +0 -119
- data/maps/din-pli-Deva-Latn-33904-2018.yaml +0 -75
- data/maps/din-pra-Deva-Latn-33904-2018.yaml +0 -63
- data/maps/din-san-Deva-Latn-33904-2018.yaml +0 -338
- data/maps/din-tam-Taml-Latn-33903-2016.yaml +0 -213
- data/maps/dos-nep-Deva-Latn-1997.yaml +0 -47
- data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +0 -684
- data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +0 -680
- data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +0 -19
- data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +0 -31
- data/maps/ggg-kat-Geor-Latn-2002.yaml +0 -92
- data/maps/gki-bel-Cyrl-Latn-1992.yaml +0 -33
- data/maps/gki-bel-Cyrl-Latn-2000.yaml +0 -201
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +0 -190
- data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +0 -157
- data/maps/hk-yue-Hani-Latn-1888.yaml +0 -38497
- data/maps/icao-bel-Cyrl-Latn-9303.yaml +0 -136
- data/maps/icao-bul-Cyrl-Latn-9303.yaml +0 -118
- data/maps/icao-fas-Arab-Latn-9303.yaml +0 -103
- data/maps/icao-heb-Hebr-Latn-9303.yaml +0 -151
- data/maps/icao-mkd-Cyrl-Latn-9303.yaml +0 -117
- data/maps/icao-rus-Cyrl-Latn-9303.yaml +0 -117
- data/maps/icao-srp-Cyrl-Latn-9303.yaml +0 -117
- data/maps/icao-ukr-Cyrl-Latn-9303.yaml +0 -119
- data/maps/iso-ara-Arab-Latn-233-1984.yaml +0 -323
- data/maps/iso-asm-Beng-Latn-15919-2001.yaml +0 -75
- data/maps/iso-ben-Beng-Latn-15919-2001.yaml +0 -175
- data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +0 -613
- data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +0 -44
- data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +0 -220
- data/maps/iso-hin-Deva-Latn-15919-2001.yaml +0 -87
- data/maps/iso-inc-Deva-Latn-15919-2001.yaml +0 -61
- data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +0 -66
- data/maps/iso-kan-Knda-Latn-15919-2001.yaml +0 -220
- data/maps/iso-kat-Geor-Latn-9984-1996.yaml +0 -145
- data/maps/iso-kor-Hang-Latn-1996-method1.yaml +0 -240
- data/maps/iso-kor-Hang-Latn-1996-method2.yaml +0 -226
- data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +0 -281
- data/maps/iso-mar-Deva-Latn-15919-2001.yaml +0 -75
- data/maps/iso-nep-Deva-Latn-15919-2001.yaml +0 -87
- data/maps/iso-ori-Orya-Latn-15919-2001.yaml +0 -193
- data/maps/iso-pan-Guru-Latn-15919-2001.yaml +0 -222
- data/maps/iso-pli-Beng-Latn-15919-2001.yaml +0 -73
- data/maps/iso-pli-Deva-Latn-15919-2001.yaml +0 -74
- data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +0 -219
- data/maps/iso-pli-Thai-Latn-15919-2001.yaml +0 -55
- data/maps/iso-pra-Deva-Latn-15919-2001.yaml +0 -59
- data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +0 -366
- data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +0 -271
- data/maps/iso-san-Deva-Latn-15919-2001.yaml +0 -220
- data/maps/iso-tam-Taml-Latn-15919-2001.yaml +0 -159
- data/maps/iso-tel-Telu-Latn-15919-2001.yaml +0 -220
- data/maps/iso-tha-Thai-Latn-11940-1998.yaml +0 -109
- data/maps/kp-kor-Hang-Latn-2002.yaml +0 -909
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +0 -44820
- data/maps/mext-jpn-Hrkt-Latn-1954.yaml +0 -411
- data/maps/mns-mon-Cyrl-Latn-5217-2012.yaml +0 -163
- data/maps/mns-mon-Latn-Cyrl-5217-2012.yaml +0 -200
- data/maps/moct-kor-Hang-Latn-2000.yaml +0 -807
- data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +0 -541
- data/maps/mvd-bel-Cyrl-Latn-2008.yaml +0 -225
- data/maps/mvd-bel-Cyrl-Latn-2010.yaml +0 -63
- data/maps/mvd-rus-Cyrl-Latn-2008.yaml +0 -109
- data/maps/mvd-rus-Cyrl-Latn-2010.yaml +0 -37
- data/maps/odni-ara-Arab-Latn-2015.yaml +0 -425
- data/maps/odni-aze-Cyrl-Latn-2015.yaml +0 -144
- data/maps/odni-bel-Cyrl-Latn-2015.yaml +0 -148
- data/maps/odni-bul-Cyrl-Latn-2015.yaml +0 -96
- data/maps/odni-che-Cyrl-Latn-2015.yaml +0 -169
- data/maps/odni-fas-Arab-Latn-2015.yaml +0 -406
- data/maps/odni-hin-Deva-Latn-2015.yaml +0 -258
- data/maps/odni-kat-Geor-Latn-2015.yaml +0 -87
- data/maps/odni-kaz-Cyrl-Latn-2015.yaml +0 -148
- data/maps/odni-kir-Cyrl-Latn-2015.yaml +0 -136
- data/maps/odni-kor-Hang-Latn-2015.yaml +0 -375
- data/maps/odni-mkd-Cyrl-Latn-2015.yaml +0 -122
- data/maps/odni-per-Arab-Latn-2015.yaml +0 -228
- data/maps/odni-rus-Cyrl-Latn-2015.yaml +0 -77
- data/maps/odni-srp-Cyrl-Latn-2015.yaml +0 -129
- data/maps/odni-tat-Cyrl-Latn-2015.yaml +0 -142
- data/maps/odni-tgk-Cyrl-Latn-2015.yaml +0 -148
- data/maps/odni-uig-Cyrl-Latn-2015.yaml +0 -138
- data/maps/odni-ukr-Cyrl-Latn-2015.yaml +0 -157
- data/maps/odni-urd-Arab-Latn-2015.yaml +0 -221
- data/maps/odni-uzb-Cyrl-Latn-2015.yaml +0 -166
- data/maps/royin-tha-Thai-Latn-1939-generic.yaml +0 -90
- data/maps/royin-tha-Thai-Latn-1968.yaml +0 -183
- data/maps/royin-tha-Thai-Latn-1999-chained.yaml +0 -180
- data/maps/royin-tha-Thai-Latn-1999.yaml +0 -80
- data/maps/sac-zho-Hans-Latn-1979.yaml +0 -24763
- data/maps/sasm-mon-Mong-Latn-general-1978.yaml +0 -389
- data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +0 -354
- data/maps/ses-ara-Arab-Latn-1930.yaml +0 -283
- data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +0 -222
- data/maps/ua-ukr-Cyrl-Latn-1996.yaml +0 -197
- data/maps/ua-ukr-Cyrl-Latn-2007.yaml +0 -75
- data/maps/ua-ukr-Cyrl-Latn-2010.yaml +0 -192
- data/maps/un-amh-Ethi-Latn-2016.yaml +0 -602
- data/maps/un-ara-Arab-Latn-1971.yaml +0 -139
- data/maps/un-ara-Arab-Latn-1972.yaml +0 -159
- data/maps/un-ara-Arab-Latn-2017.yaml +0 -420
- data/maps/un-bel-Cyrl-Latn-2007.yaml +0 -114
- data/maps/un-ben-Beng-Latn-2016.yaml +0 -534
- data/maps/un-ell-Grek-Latn-1987-phonetic.yaml +0 -780
- data/maps/un-ell-Grek-Latn-1987-tl.yaml +0 -31
- data/maps/un-ell-Grek-Latn-1987-ts.yaml +0 -19
- data/maps/un-hin-Deva-Latn-2016.yaml +0 -222
- data/maps/un-mar-Deva-Latn-2016.yaml +0 -91
- data/maps/un-mon-Mong-Latn-general-2013.yaml +0 -264
- data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +0 -264
- data/maps/un-nep-Deva-Latn-1972.yaml +0 -350
- data/maps/un-nep-Deva-Latn-2013.yaml +0 -74
- data/maps/un-rus-Cyrl-Latn-1987.yaml +0 -166
- data/maps/un-ukr-Cyrl-Latn-1998.yaml +0 -53
- data/maps/un-ukr-Cyrl-Latn-2012.yaml +0 -162
- data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +0 -221
- data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +0 -406
- data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +0 -386
- data/maps/var-kor-Hang-Hang-jamo.yaml +0 -11193
- data/maps/var-kor-Hang-Latn-mr-1939.yaml +0 -1054
- data/maps/var-kor-Kore-Hang-2013.yaml +0 -59754
- data/maps/var-kor-Kore-Latn-mr-1939.yaml +0 -36
- data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +0 -43
- data/maps/var-mon-Mong-Latn-1930.yaml +0 -102
- data/maps/var-mon-Mong-Latn-lessing.yaml +0 -272
- data/maps/var-mon-Mong-Latn-vpmc.yaml +0 -274
- data/maps/var-pra-Deva-Latn-iast-1912.yaml +0 -30
- data/maps/var-san-Deva-Latn-iast-1912.yaml +0 -149
- data/maps/var-tha-Thai-Thai-phonemic.yaml +0 -59
- data/maps/var-tha-Thai-Zsym-ipa.yaml +0 -301
- data/maps/var-zho-Hani-Latn-wd-1979.yaml +0 -38912
- data/spec/interscript/filenames_spec.rb +0 -384
- data/spec/interscript/mapping_spec.rb +0 -42
- data/spec/interscript_spec.rb +0 -29
- data/spec/spec_helper.rb +0 -3
|
@@ -1,145 +0,0 @@
|
|
|
1
|
-
---
|
|
2
|
-
authority_id: alalc
|
|
3
|
-
id: 1997
|
|
4
|
-
language: iso-639-2:ukr
|
|
5
|
-
source_script: Cyrl
|
|
6
|
-
destination_script: Latn
|
|
7
|
-
name: ALA-LC Romanization System 1997
|
|
8
|
-
alias:
|
|
9
|
-
ogc11122:
|
|
10
|
-
code: ukr_Cyrl2Latn_ALA_1997
|
|
11
|
-
description: Ukrainian ALA-Library of Congress 1997 System
|
|
12
|
-
url: http://catdir.loc.gov/catdir/cpso/romanization/ukrainia.pdf
|
|
13
|
-
creation_date: 1997
|
|
14
|
-
description: |
|
|
15
|
-
The ALA-LC Romanization Tables, published by the American Library Association (1885)
|
|
16
|
-
and Library of Congress (1905). Used to represent bibliographic information by US and
|
|
17
|
-
Canadian libraries, by the British Library since 1975,[3] and in North American publications.
|
|
18
|
-
The latest 1997 revision is very similar to the 1905 version.
|
|
19
|
-
|
|
20
|
-
notes:
|
|
21
|
-
- The z͡h ligature is necessary to distinguish ж from the combination зг.
|
|
22
|
-
- The t͡s ligature is necessary to distinguish ц from the combination тс.
|
|
23
|
-
|
|
24
|
-
tests:
|
|
25
|
-
- source: Автономна Республіка Крим
|
|
26
|
-
expected: Avtonomna Respublika Krym
|
|
27
|
-
- source: Висунь
|
|
28
|
-
expected: Vysunʹ
|
|
29
|
-
- source: Долинське
|
|
30
|
-
expected: Dolynsʹke
|
|
31
|
-
- source: Дубище
|
|
32
|
-
expected: Dubyshche
|
|
33
|
-
- source: Єнакієве
|
|
34
|
-
expected: I͡enakii͡eve
|
|
35
|
-
- source: Зупиночний Пункт Мокіївці
|
|
36
|
-
expected: Zupynochnyĭ Punkt Mokiïvt͡si
|
|
37
|
-
- source: Іванівщина
|
|
38
|
-
expected: Ivanivshchyna
|
|
39
|
-
- source: Киликиїв
|
|
40
|
-
expected: Kylykyïv
|
|
41
|
-
- source: Кожанка
|
|
42
|
-
expected: Koz͡hanka
|
|
43
|
-
- source: Краснянка
|
|
44
|
-
expected: Krasni͡anka
|
|
45
|
-
- source: Краснівка
|
|
46
|
-
expected: Krasnivka
|
|
47
|
-
- source: Мале Микільське
|
|
48
|
-
expected: Male Mykilʹsʹke
|
|
49
|
-
- source: Маломиколаївка
|
|
50
|
-
expected: Malomykolaïvka
|
|
51
|
-
- source: Нове Село
|
|
52
|
-
expected: Nove Selo
|
|
53
|
-
- source: Новопавлівка
|
|
54
|
-
expected: Novopavlivka
|
|
55
|
-
- source: Новошичі
|
|
56
|
-
expected: Novoshychi
|
|
57
|
-
- source: Новоєфремівка
|
|
58
|
-
expected: Novoi͡efremivka
|
|
59
|
-
- source: Одеська Область
|
|
60
|
-
expected: Odesʹka Oblastʹ
|
|
61
|
-
- source: Орлівське
|
|
62
|
-
expected: Orlivsʹke
|
|
63
|
-
- source: Раневичі
|
|
64
|
-
expected: Ranevychi
|
|
65
|
-
- source: Рокувата
|
|
66
|
-
expected: Rokuvata
|
|
67
|
-
- source: Рудаєве
|
|
68
|
-
expected: Rudai͡eve
|
|
69
|
-
- source: Сахнівці
|
|
70
|
-
expected: Sakhnivt͡si
|
|
71
|
-
- source: Тернівка
|
|
72
|
-
expected: Ternivka
|
|
73
|
-
- source: Турбівка
|
|
74
|
-
expected: Turbivka
|
|
75
|
-
- source: Херсонська Область
|
|
76
|
-
expected: Khersonsʹka Oblastʹ
|
|
77
|
-
|
|
78
|
-
map:
|
|
79
|
-
characters:
|
|
80
|
-
"\u0410": "A" # А
|
|
81
|
-
"\u0411": "B" # Б
|
|
82
|
-
"\u0412": "V" # В
|
|
83
|
-
"\u0413": "H" # Г
|
|
84
|
-
"\u0490": "G" # Ґ
|
|
85
|
-
"\u0414": "D" # Д
|
|
86
|
-
"\u0415": "E" # Е
|
|
87
|
-
"\u0404": "I\u0361e" # Є -> I͡e
|
|
88
|
-
"\u0416": "Z\u0361h" # Ж -> Z͡h
|
|
89
|
-
"\u0417": "Z" # З
|
|
90
|
-
"\u0418": "Y" # И
|
|
91
|
-
"\u0406": "I" # І
|
|
92
|
-
"\u0407": "I\u0308" # Ї -> Ï
|
|
93
|
-
"\u0419": "I\u0306" # Й -> Ĭ
|
|
94
|
-
"\u041a": "K" # К
|
|
95
|
-
"\u041b": "L" # Л
|
|
96
|
-
"\u041c": "M" # М
|
|
97
|
-
"\u041d": "N" # Н
|
|
98
|
-
"\u041e": "O" # О
|
|
99
|
-
"\u041f": "P" # П
|
|
100
|
-
"\u0420": "R" # Р
|
|
101
|
-
"\u0421": "S" # С
|
|
102
|
-
"\u0422": "T" # Т
|
|
103
|
-
"\u0423": "U" # У
|
|
104
|
-
"\u0424": "F" # Ф
|
|
105
|
-
"\u0425": "Kh" # Х
|
|
106
|
-
"\u0426": "T\u0361s" # Ц -> T͡s
|
|
107
|
-
"\u0427": "Ch" # Ч
|
|
108
|
-
"\u0428": "Sh" # Ш
|
|
109
|
-
"\u0429": "Shch" # Щ
|
|
110
|
-
"\u042e": "I\u0361u" # Ю -> I͡u
|
|
111
|
-
"\u042f": "I\u0361a" # Я -> I͡a
|
|
112
|
-
"\u042c": "\u02B9" # Ь -> ʹ
|
|
113
|
-
"\u0430": "a" # а
|
|
114
|
-
"\u0431": "b" # б
|
|
115
|
-
"\u0432": "v" # в
|
|
116
|
-
"\u0433": "h" # г
|
|
117
|
-
"\u0491": "g" # ґ
|
|
118
|
-
"\u0434": "d" # д
|
|
119
|
-
"\u0435": "e" # е
|
|
120
|
-
"\u0454": "i\u0361e" # є -> i͡e
|
|
121
|
-
"\u0436": "z\u0361h" # ж -> z͡h
|
|
122
|
-
"\u0437": "z" # з
|
|
123
|
-
"\u0438": "y" # и
|
|
124
|
-
"\u0456": "i" # і
|
|
125
|
-
"\u0457": "i\u0308" # ї -> ï
|
|
126
|
-
"\u0439": "i\u0306" # й -> ĭ
|
|
127
|
-
"\u043a": "k" # к
|
|
128
|
-
"\u043b": "l" # л
|
|
129
|
-
"\u043c": "m" # м
|
|
130
|
-
"\u043d": "n" # н
|
|
131
|
-
"\u043e": "o" # о
|
|
132
|
-
"\u043f": "p" # п
|
|
133
|
-
"\u0440": "r" # р
|
|
134
|
-
"\u0441": "s" # с
|
|
135
|
-
"\u0442": "t" # т
|
|
136
|
-
"\u0443": "u" # у
|
|
137
|
-
"\u0444": "f" # ф
|
|
138
|
-
"\u0445": "kh" # х
|
|
139
|
-
"\u0446": "t\u0361s" # ц -> t͡s
|
|
140
|
-
"\u0447": "ch" # ч
|
|
141
|
-
"\u0448": "sh" # ш
|
|
142
|
-
"\u0449": "shch" # щ
|
|
143
|
-
"\u044e": "i\u0361u" # ю -> i͡u
|
|
144
|
-
"\u044f": "i\u0361a" # я -> i͡a
|
|
145
|
-
"\u044c": "\u02B9" # Ь -> ʹ
|
|
@@ -1,16 +0,0 @@
|
|
|
1
|
-
---
|
|
2
|
-
authority_id: alalc
|
|
3
|
-
id: 2011
|
|
4
|
-
language: iso-639-2:ukr
|
|
5
|
-
source_script: Cyrl
|
|
6
|
-
destination_script: Latn
|
|
7
|
-
name: ALA-LC Romanization System 1997
|
|
8
|
-
url: https://www.loc.gov/catdir/cpso/romanization/ukrainia.pdf
|
|
9
|
-
creation_date: 2011
|
|
10
|
-
|
|
11
|
-
notes:
|
|
12
|
-
- The z͡h ligature is necessary to distinguish ж from the combination зг.
|
|
13
|
-
- The t͡s ligature is necessary to distinguish ц from the combination тс.
|
|
14
|
-
|
|
15
|
-
map:
|
|
16
|
-
inherit: alalc-ukr-Cyrl-Latn-1997
|
|
@@ -1,283 +0,0 @@
|
|
|
1
|
-
---
|
|
2
|
-
authority_id: apcbg
|
|
3
|
-
id: 1995
|
|
4
|
-
language: iso-639-2:bul
|
|
5
|
-
source_script: Cyrl
|
|
6
|
-
destination_script: Latn
|
|
7
|
-
name: Toponymic Guidelines for Antarctica, Lyubomir Ivanov. Antarctic Place-names Commission of Bulgaria, Sofia, 1995.
|
|
8
|
-
url: http://www.apcbg.org/Toponymic-Guidelines.htm
|
|
9
|
-
creation_date: 1995
|
|
10
|
-
description: |
|
|
11
|
-
In Antarctica geographical names are important elements of identification, orientation, localization and navigation,
|
|
12
|
-
providing an essential reference system for logistic operations, including search and rescue measures, and for
|
|
13
|
-
international scientific research. They facilitate information exchange in the field, in scientific publications and in
|
|
14
|
-
administrative measures under the Antarctic Treaty System. Geographical names also reflect the history of Antarctic
|
|
15
|
-
exploration.
|
|
16
|
-
|
|
17
|
-
tests:
|
|
18
|
-
- source: нунатак Абрит
|
|
19
|
-
expected: nunatak Abrit
|
|
20
|
-
- source: връх Академия
|
|
21
|
-
expected: vrah Akademiya
|
|
22
|
-
- source: връх Ами Буе
|
|
23
|
-
expected: vrah Ami Bue
|
|
24
|
-
- source: нос Айтос
|
|
25
|
-
expected: nos Aytos
|
|
26
|
-
- source: залив Баба Тонка
|
|
27
|
-
expected: zaliv Baba Tonka
|
|
28
|
-
- source: Балабански камък
|
|
29
|
-
expected: Balabanski kamak
|
|
30
|
-
- source: Бедечки поток
|
|
31
|
-
expected: Bedechki potok
|
|
32
|
-
- source: нос Бяга
|
|
33
|
-
expected: nos Byaga
|
|
34
|
-
- source: остров Качо
|
|
35
|
-
expected: ostrov Kacho # wiki ostrov Cacho
|
|
36
|
-
- source: Чакъров остров
|
|
37
|
-
expected: Chakarov ostrov
|
|
38
|
-
- source: връх Дъбник
|
|
39
|
-
expected: vrah Dabnik
|
|
40
|
-
- source: залив Десислава
|
|
41
|
-
expected: zaliv Desislava
|
|
42
|
-
- source: ледник Джераси
|
|
43
|
-
expected: lednik Dzherasi
|
|
44
|
-
- source: Джегова скала
|
|
45
|
-
expected: Dzhegova skala
|
|
46
|
-
- source: Нунатак Едуард
|
|
47
|
-
expected: Nunatak Eduard
|
|
48
|
-
- source: Елховска седловина
|
|
49
|
-
expected: Elhovska sedlovina
|
|
50
|
-
- source: ледник Етър
|
|
51
|
-
expected: lednik Etar
|
|
52
|
-
- source: нунатак Филип Тотю
|
|
53
|
-
expected: nunatak Filip Totyu
|
|
54
|
-
- source: ледник Габаре
|
|
55
|
-
expected: lednik Gabare
|
|
56
|
-
- source: риф Гергини
|
|
57
|
-
expected: rif Gergini
|
|
58
|
-
- source: Гяуров връх
|
|
59
|
-
expected: Gyaurov vrah
|
|
60
|
-
- source: Гуцалски рид
|
|
61
|
-
expected: Gutsalski rid # not found
|
|
62
|
-
- source: Хараламбиев остров
|
|
63
|
-
expected: Haralambiev ostrov
|
|
64
|
-
- source: връх Ичера
|
|
65
|
-
expected: vrah Ichera
|
|
66
|
-
- source: полуостров Йоан Павел II
|
|
67
|
-
expected: poluostrov Yoan Pavel II
|
|
68
|
-
- source: нос Иван Александър
|
|
69
|
-
expected: nos Ivan Aleksandar
|
|
70
|
-
- source: нос Иречек
|
|
71
|
-
expected: nos Irechek
|
|
72
|
-
- source: нос Кърджали
|
|
73
|
-
expected: nos Kardzhali
|
|
74
|
-
- source: седловина Кърнаре
|
|
75
|
-
expected: sedlovina Karnare
|
|
76
|
-
- source: нунатак Керсеблепт
|
|
77
|
-
expected: nunatak Kerseblept
|
|
78
|
-
- source: Кондофрейски възвишения
|
|
79
|
-
expected: Kondofreyski vazvisheniya
|
|
80
|
-
- source: Костинбродски проход
|
|
81
|
-
expected: Kostinbrodski prohod
|
|
82
|
-
- source: връх Кожух
|
|
83
|
-
expected: vrah Kozhuh
|
|
84
|
-
- source: Кукерски нунатаци
|
|
85
|
-
expected: Kukerski nunatatsi
|
|
86
|
-
- source: залив Лазурен бряг
|
|
87
|
-
expected: zaliv Lazuren bryag
|
|
88
|
-
- source: връх Лудогорие
|
|
89
|
-
expected: vrah Ludogorie
|
|
90
|
-
- source: Лютибродски скали
|
|
91
|
-
expected: Lyutibrodski skali
|
|
92
|
-
- source: Масларов нунатак
|
|
93
|
-
expected: Maslarov nunatak
|
|
94
|
-
- source: Михневски връх
|
|
95
|
-
expected: Mihnevski vrah
|
|
96
|
-
- source: рид Митино
|
|
97
|
-
expected: rid Mitino
|
|
98
|
-
- source: езеро Наяда
|
|
99
|
-
expected: ezero Nayada
|
|
100
|
-
- source: нос Никюп
|
|
101
|
-
expected: nos Nikyup
|
|
102
|
-
- source: рид Оборище
|
|
103
|
-
expected: rid Oborishte
|
|
104
|
-
- source: залив Олуша
|
|
105
|
-
expected: zaliv Olusha
|
|
106
|
-
- source: Оряховски възвишения
|
|
107
|
-
expected: Oryahovski vazvisheniya
|
|
108
|
-
- source: нунатак Памидово
|
|
109
|
-
expected: nunatak Pamidovo
|
|
110
|
-
- source: връх Парангалица
|
|
111
|
-
expected: vrah Parangalitsa
|
|
112
|
-
- source: Първомайски провлак
|
|
113
|
-
expected: Parvomayski provlak
|
|
114
|
-
- source: ледник Патлейна
|
|
115
|
-
expected: lednik Patleyna
|
|
116
|
-
- source: полуостров Перник
|
|
117
|
-
expected: poluostrov Pernik
|
|
118
|
-
- source: връх Петко Войвода
|
|
119
|
-
expected: vrah Petko Voyvoda
|
|
120
|
-
- source: остров Фанагория
|
|
121
|
-
expected: ostrov Fanagoriya
|
|
122
|
-
- source: нос Плас
|
|
123
|
-
expected: nos Plas
|
|
124
|
-
- source: Пресиянов рид
|
|
125
|
-
expected: Presiyanov rid
|
|
126
|
-
- source: връх Принсипе де Астуриас
|
|
127
|
-
expected: vrah Prinsipe de Asturias # wiki: vrah Príncipe de Asturias
|
|
128
|
-
- source: нунатак Ръченица
|
|
129
|
-
expected: nunatak Rachenitsa
|
|
130
|
-
- source: връх Райна Княгиня
|
|
131
|
-
expected: vrah Rayna Knyaginya
|
|
132
|
-
- source: Рид Ръжана
|
|
133
|
-
expected: Rid Razhana
|
|
134
|
-
- source: връх Ригс
|
|
135
|
-
expected: vrah Rigs
|
|
136
|
-
- source: остров Рогулят
|
|
137
|
-
expected: ostrov Rogulyat
|
|
138
|
-
- source: ледник Сабазий
|
|
139
|
-
expected: lednik Sabaziy
|
|
140
|
-
- source: ледник Съединение
|
|
141
|
-
expected: lednik Saedinenie
|
|
142
|
-
- source: нунатак Сенокос
|
|
143
|
-
expected: nunatak Senokos
|
|
144
|
-
- source: Сейдолски камък
|
|
145
|
-
expected: Seydolski kamak
|
|
146
|
-
- source: ледник Щерна
|
|
147
|
-
expected: lednik Shterna
|
|
148
|
-
- source: връх Шишман
|
|
149
|
-
expected: vrah Shishman
|
|
150
|
-
- source: ледник Сигмен
|
|
151
|
-
expected: lednik Sigmen
|
|
152
|
-
- source: Седловина Синитово
|
|
153
|
-
expected: Sedlovina Sinitovo
|
|
154
|
-
- source: Ледник Скаплизо
|
|
155
|
-
expected: Lednik Skaplizo
|
|
156
|
-
- source: залив Слънчев бряг
|
|
157
|
-
expected: zaliv Slanchev bryag
|
|
158
|
-
- source: остров Соатрис
|
|
159
|
-
expected: ostrov Soatris
|
|
160
|
-
- source: планина Софийски Университет
|
|
161
|
-
expected: planina Sofiyski Universitet
|
|
162
|
-
- source: ледник Сребърна
|
|
163
|
-
expected: lednik Srebarna
|
|
164
|
-
- source: Средногорски възвишения
|
|
165
|
-
expected: Srednogorski vazvisheniya
|
|
166
|
-
- source: Св. Евтимиев камък
|
|
167
|
-
expected: Sv. Evtimiev kamak
|
|
168
|
-
- source: база Св. Климент Охридски
|
|
169
|
-
expected: baza Sv. Kliment Ohridski
|
|
170
|
-
- source: връх Стъргел
|
|
171
|
-
expected: vrah Stargel
|
|
172
|
-
- source: нунатак Сторгозия
|
|
173
|
-
expected: nunatak Storgoziya # nunatak Storgozia according to wiki
|
|
174
|
-
- source: нунатак Сурвакари
|
|
175
|
-
expected: nunatak Survakari
|
|
176
|
-
- source: ледник Световрачене
|
|
177
|
-
expected: lednik Svetovrachene
|
|
178
|
-
- source: остров Теменуга
|
|
179
|
-
expected: ostrov Temenuga
|
|
180
|
-
- source: Тракийски възвишения
|
|
181
|
-
expected: Trakiyski vazvisheniya
|
|
182
|
-
- source: хълм Цамблак
|
|
183
|
-
expected: halm Tsamblak
|
|
184
|
-
- source: ледник Урдовиза
|
|
185
|
-
expected: lednik Urdoviza
|
|
186
|
-
- source: остров Вълчедръм
|
|
187
|
-
expected: ostrov Valchedram
|
|
188
|
-
- source: острови Вардим
|
|
189
|
-
expected: ostrovi Vardim
|
|
190
|
-
- source: Владигеров проток
|
|
191
|
-
expected: Vladigerov protok
|
|
192
|
-
- source: ледник Ябланица
|
|
193
|
-
expected: lednik Yablanitsa
|
|
194
|
-
- source: залив Ямфорина
|
|
195
|
-
expected: zaliv Yamforina
|
|
196
|
-
- source: Йовков нос
|
|
197
|
-
expected: Yovkov nos
|
|
198
|
-
- source: рид Заберново
|
|
199
|
-
expected: rid Zabernovo
|
|
200
|
-
- source: ледник Збелсурд
|
|
201
|
-
expected: lednik Zbelsurd
|
|
202
|
-
- source: Жефарович камък
|
|
203
|
-
expected: Zhefarovich kamak
|
|
204
|
-
- source: връх Зиези
|
|
205
|
-
expected: vrah Ziezi
|
|
206
|
-
- source: залив Златни пясъци
|
|
207
|
-
expected: zaliv Zlatni pyasatsi
|
|
208
|
-
- source: ледник Злокучене
|
|
209
|
-
expected: lednik Zlokuchene
|
|
210
|
-
- source: проток Злогош
|
|
211
|
-
expected: protok Zlogosh
|
|
212
|
-
|
|
213
|
-
map:
|
|
214
|
-
characters:
|
|
215
|
-
'\u0410': 'A'
|
|
216
|
-
'\u0411': 'B'
|
|
217
|
-
'\u0412': 'V'
|
|
218
|
-
'\u0413': 'G'
|
|
219
|
-
'\u0414': 'D'
|
|
220
|
-
'\u0415': 'E'
|
|
221
|
-
'\u0416': 'Zh'
|
|
222
|
-
'\u0417': 'Z'
|
|
223
|
-
'\u0418': 'I'
|
|
224
|
-
'\u0419': 'Y'
|
|
225
|
-
'\u041a': 'K'
|
|
226
|
-
'\u041b': 'L'
|
|
227
|
-
'\u041c': 'M'
|
|
228
|
-
'\u041d': 'N'
|
|
229
|
-
'\u041e': 'O'
|
|
230
|
-
'\u041f': 'P'
|
|
231
|
-
'\u0420': 'R'
|
|
232
|
-
'\u0421': 'S'
|
|
233
|
-
'\u0422': 'T'
|
|
234
|
-
'\u0423': 'U'
|
|
235
|
-
'\u0424': 'F'
|
|
236
|
-
'\u0425': 'H'
|
|
237
|
-
'\u0426': 'Ts'
|
|
238
|
-
'\u0427': 'Ch'
|
|
239
|
-
'\u0428': 'Sh'
|
|
240
|
-
'\u0429': 'Sht'
|
|
241
|
-
'\u042a': 'A'
|
|
242
|
-
'\u042c': 'Y'
|
|
243
|
-
'\u042e': 'Yu'
|
|
244
|
-
'\u042f': 'Ya'
|
|
245
|
-
|
|
246
|
-
'\u0430': 'a'
|
|
247
|
-
'\u0431': 'b'
|
|
248
|
-
'\u0432': 'v'
|
|
249
|
-
'\u0433': 'g'
|
|
250
|
-
'\u0434': 'd'
|
|
251
|
-
'\u0435': 'e'
|
|
252
|
-
'\u0436': 'zh'
|
|
253
|
-
'\u0437': 'z'
|
|
254
|
-
'\u0438': 'i'
|
|
255
|
-
'\u0439': 'y'
|
|
256
|
-
'\u043a': 'k'
|
|
257
|
-
'\u043b': 'l'
|
|
258
|
-
'\u043c': 'm'
|
|
259
|
-
'\u043d': 'n'
|
|
260
|
-
'\u043e': 'o'
|
|
261
|
-
'\u043f': 'p'
|
|
262
|
-
'\u0440': 'r'
|
|
263
|
-
'\u0441': 's'
|
|
264
|
-
'\u0442': 't'
|
|
265
|
-
'\u0443': 'u'
|
|
266
|
-
'\u0444': 'f'
|
|
267
|
-
'\u0445': 'h'
|
|
268
|
-
'\u0446': 'ts'
|
|
269
|
-
'\u0447': 'ch'
|
|
270
|
-
'\u0448': 'sh'
|
|
271
|
-
'\u0449': 'sht'
|
|
272
|
-
'\u044a': 'a'
|
|
273
|
-
'\u044c': 'y'
|
|
274
|
-
'\u044e': 'yu'
|
|
275
|
-
'\u044f': 'ya'
|
|
276
|
-
|
|
277
|
-
# note 2
|
|
278
|
-
'\u046A': "U\u0306" # Ѫ
|
|
279
|
-
'\u046B': "u\u0306" # ѫ
|
|
280
|
-
|
|
281
|
-
# note[3]
|
|
282
|
-
'\u0462': "YE" # Ѣ
|
|
283
|
-
'\u0463': "ye" # ѣ
|
|
@@ -1,174 +0,0 @@
|
|
|
1
|
-
---
|
|
2
|
-
authority_id: bas
|
|
3
|
-
id: 2017-bss
|
|
4
|
-
language: iso-639-2:rus
|
|
5
|
-
source_script: Cyrl
|
|
6
|
-
destination_script: Latn
|
|
7
|
-
name: Streamlined Romanization of Russian Cyrillic -- Basic Streamlined System
|
|
8
|
-
url: https://www.researchgate.net/publication/318402098
|
|
9
|
-
creation_date: 2017-07
|
|
10
|
-
description: |
|
|
11
|
-
The streamlined approach to transliteration was initiated by the
|
|
12
|
-
author with the development of the Streamlined System for the
|
|
13
|
-
Romanization of Bulgarian, which was eventually codified by the
|
|
14
|
-
Transliteration Act of 2009 (ДВ 2009) of the Bulgarian Parliament.
|
|
15
|
-
|
|
16
|
-
The four purposes of the system below are in order of priority:
|
|
17
|
-
1. ensure a plausible phonetic approximation of Russian words by English speaking users, including those having no knowledge of the Russian language and no available additional explanations;
|
|
18
|
-
2. the system should allow for the retrieval of the original Cyrillic spellings as much as feasible;
|
|
19
|
-
3. transliterated Russian words should fit an English language environment i.e. not be perceived as too ‘un-English’; and
|
|
20
|
-
4. transliterated word forms should be streamlined and simple. (Ivanov 2003, Ivanov et al. 2010)
|
|
21
|
-
|
|
22
|
-
notes:
|
|
23
|
-
- Typical for the streamlined approach is its non-use of diacritics,
|
|
24
|
-
its use of Latin y for rendering only Cyrillic й rather than both й and
|
|
25
|
-
ы, its non-use of Latin j, as well as its use of Latin h rather than kh
|
|
26
|
-
for Cyrillic х.
|
|
27
|
-
|
|
28
|
-
tests:
|
|
29
|
-
- source: |
|
|
30
|
-
Эх, тройка! птица тройка, кто тебя выдумал? знать, у бойкого народа
|
|
31
|
-
ты могла только родиться, в той земле, что не любит шутить, а
|
|
32
|
-
ровнем-гладнем разметнулась на полсвета, да и ступай считать версты, пока
|
|
33
|
-
не зарябит тебе в очи. И не хитрый, кажись, дорожный снаряд, не
|
|
34
|
-
железным схвачен винтом, а наскоро живьём с одним топором да долотом
|
|
35
|
-
снарядил и собрал тебя ярославский расторопный мужик. Не в немецких
|
|
36
|
-
ботфортах ямщик: борода да рукавицы, и сидит чёрт знает на чём; а
|
|
37
|
-
привстал, да замахнулся, да затянул песню — кони вихрем, спицы в
|
|
38
|
-
колесах смешались в один гладкий круг, только дрогнула дорога, да вскрикнул
|
|
39
|
-
в испуге остановившийся пешеход — и вон она понеслась, понеслась,
|
|
40
|
-
понеслась!
|
|
41
|
-
|
|
42
|
-
Н.В. Гоголь
|
|
43
|
-
expected: |
|
|
44
|
-
Eh, troyka! ptitsa troyka, kto tebya vidumal? znat, u boykogo naroda
|
|
45
|
-
ti mogla tolko roditsya, v toy zemle, chto ne lyubit shutit, a
|
|
46
|
-
rovnem-gladnem razmetnulas na polsveta, da i stupay schitat versti, poka
|
|
47
|
-
ne zaryabit tebe v ochi. I ne hitriy, kazhis, dorozhniy snaryad, ne
|
|
48
|
-
zheleznim shvachen vintom, a naskoro zhivyem s odnim toporom da dolotom
|
|
49
|
-
snaryadil i sobral tebya yaroslavskiy rastoropniy muzhik. Ne v nemetskih
|
|
50
|
-
botfortah yamshchik: boroda da rukavitsi, i sidit chert znaet na chem; a
|
|
51
|
-
privstal, da zamahnulsya, da zatyanul pesnyu — koni vihrem, spitsi v
|
|
52
|
-
kolesah smeshalis v odin gladkiy krug, tolko drognula doroga, da vskriknul
|
|
53
|
-
v ispuge ostanovivshiysya peshehod — i von ona poneslas, poneslas,
|
|
54
|
-
poneslas!
|
|
55
|
-
|
|
56
|
-
N.V. Gogol
|
|
57
|
-
|
|
58
|
-
- source: ЁЖ Ёж ёж
|
|
59
|
-
expected: EZH Ezh ezh
|
|
60
|
-
- source: Цветущий сад
|
|
61
|
-
expected: Tsvetushchiy sad
|
|
62
|
-
- source: Чувство юмора
|
|
63
|
-
expected: Chuvstvo yumora
|
|
64
|
-
- source: Широкий выбор
|
|
65
|
-
expected: Shirokiy vibor
|
|
66
|
-
- source: Все подъезды заблокированны
|
|
67
|
-
expected: Vse podezdi zablokirovanni
|
|
68
|
-
- source: Ожерелье
|
|
69
|
-
expected: Ozherelye
|
|
70
|
-
- source: Ручьи
|
|
71
|
-
expected: Ruchyi
|
|
72
|
-
- source: Каньон
|
|
73
|
-
expected: Kanyon
|
|
74
|
-
- source: Бельэтаж
|
|
75
|
-
expected: Belyetazh
|
|
76
|
-
|
|
77
|
-
map:
|
|
78
|
-
rules:
|
|
79
|
-
- pattern: \u042c(?=[ЕеЁёИиОоЭэ]) # Ь (before Е, Ё, И, O, Э)
|
|
80
|
-
result: Y
|
|
81
|
-
- pattern: \u044c(?=[ЕеЁёИиОоЭэ]) # ь (before Е, Ё, И, O, Э)
|
|
82
|
-
result: y
|
|
83
|
-
|
|
84
|
-
characters:
|
|
85
|
-
# "\u0027": "" # '
|
|
86
|
-
"\u0410": "A" # А
|
|
87
|
-
"\u0411": "B" # Б
|
|
88
|
-
"\u0412": "V" # В
|
|
89
|
-
"\u0413": "G" # Г
|
|
90
|
-
"\u0414": "D" # Д
|
|
91
|
-
"\u0401": "E" # Ё
|
|
92
|
-
"\u0415": "E" # Е
|
|
93
|
-
"\u0416": "Zh" # Ж
|
|
94
|
-
"\u0417": "Z" # З
|
|
95
|
-
"\u042D": "E" # Э
|
|
96
|
-
"\u0418": "I" # И
|
|
97
|
-
"\u0419": "Y" # Й
|
|
98
|
-
"\u041A": "K" # К
|
|
99
|
-
"\u041B": "L" # Л
|
|
100
|
-
"\u041C": "M" # М
|
|
101
|
-
"\u041D": "N" # Н
|
|
102
|
-
"\u041E": "O" # О
|
|
103
|
-
"\u041F": "P" # П
|
|
104
|
-
"\u0420": "R" # Р
|
|
105
|
-
"\u0421": "S" # С
|
|
106
|
-
"\u0422": "T" # Т
|
|
107
|
-
"\u0423": "U" # У
|
|
108
|
-
"\u0424": "F" # Ф
|
|
109
|
-
"\u0425": "H" # Х
|
|
110
|
-
"\u0426": "Ts" # Ц
|
|
111
|
-
"\u0427": "Ch" # Ч
|
|
112
|
-
"\u0428": "Sh" # Ш
|
|
113
|
-
"\u0429": "Shch" # Щ
|
|
114
|
-
"\u042B": "I" # Ы
|
|
115
|
-
"\u042F": "Ya" # Я
|
|
116
|
-
"\u042E": "Yu" # Ю
|
|
117
|
-
|
|
118
|
-
# Ь (before Е, Ё, И, O, Э)
|
|
119
|
-
# "\u042c\u0401": "YE" # Ё
|
|
120
|
-
# "\u042c\u0415": "YE" # Е
|
|
121
|
-
# "\u042c\u0418": "YI" # И
|
|
122
|
-
# "\u042c\u041E": "YO" # O
|
|
123
|
-
# "\u042c\u0417": "YE" # Э
|
|
124
|
-
|
|
125
|
-
# Ь (otherwise) -> (none)
|
|
126
|
-
"\u042c": ""
|
|
127
|
-
|
|
128
|
-
# Ъ -> (none)
|
|
129
|
-
"\u042a": ""
|
|
130
|
-
|
|
131
|
-
"\u0430": "a" # а
|
|
132
|
-
"\u0431": "b" # б
|
|
133
|
-
"\u0432": "v" # в
|
|
134
|
-
"\u0433": "g" # г
|
|
135
|
-
"\u0434": "d" # д
|
|
136
|
-
"\u0451": "e" # ё
|
|
137
|
-
"\u0435": "e" # e
|
|
138
|
-
"\u0436": "zh" # ж
|
|
139
|
-
"\u0437": "z" # з
|
|
140
|
-
"\u044D": "e" # э
|
|
141
|
-
"\u0438": "i" # и
|
|
142
|
-
"\u0439": "y" # й
|
|
143
|
-
"\u043A": "k" # к
|
|
144
|
-
"\u043B": "l" # л
|
|
145
|
-
"\u043C": "m" # м
|
|
146
|
-
"\u043D": "n" # н
|
|
147
|
-
"\u043E": "o" # о
|
|
148
|
-
"\u043F": "p" # п
|
|
149
|
-
"\u0440": "r" # р
|
|
150
|
-
"\u0441": "s" # с
|
|
151
|
-
"\u0442": "t" # т
|
|
152
|
-
"\u0443": "u" # у
|
|
153
|
-
"\u0444": "f" # ф
|
|
154
|
-
"\u0445": "h" # х
|
|
155
|
-
"\u0446": "ts" # ц
|
|
156
|
-
"\u0447": "ch" # ч
|
|
157
|
-
"\u0448": "sh" # ш
|
|
158
|
-
"\u0449": "shch" # щ
|
|
159
|
-
"\u044B": "i" # ы
|
|
160
|
-
"\u044F": "ya" # я
|
|
161
|
-
"\u044E": "yu" # ю
|
|
162
|
-
|
|
163
|
-
# ь (before е, ё, и, o, э)
|
|
164
|
-
# "\u044c\u0435": "ye" # ё
|
|
165
|
-
# "\u044c\u0451": "ye" # е
|
|
166
|
-
# "\u044c\u0438": "yi" # и
|
|
167
|
-
# "\u044c\u006f": "yo" # o
|
|
168
|
-
# "\u044c\u044d": "ye" # э
|
|
169
|
-
|
|
170
|
-
# ь (otherwise) -> (none)
|
|
171
|
-
"\u044c": ""
|
|
172
|
-
|
|
173
|
-
# ъ -> (none)
|
|
174
|
-
"\u044a": ""
|