interscript 0.1.9 → 2.0.5
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/.gitignore +11 -0
- data/.rspec +3 -0
- data/Gemfile +29 -0
- data/LICENSE.adoc +31 -0
- data/README.md +3 -0
- data/Rakefile +53 -0
- data/bin/console +14 -0
- data/bin/interscript +5 -0
- data/bin/maps_analyze_staging +168 -0
- data/bin/maps_debug_compilers +58 -0
- data/bin/maps_debug_ordering +88 -0
- data/bin/maps_debug_ruby_compile +24 -0
- data/bin/maps_debug_step_by_step +44 -0
- data/bin/maps_optimize_order +112 -0
- data/bin/maps_v1_analyze_regexps +45 -0
- data/bin/maps_v1_to_v2 +426 -0
- data/bin/setup +8 -0
- data/exe/interscript +6 -0
- data/interscript.gemspec +31 -0
- data/lib/interscript.rb +80 -135
- data/lib/interscript/command.rb +5 -5
- data/lib/interscript/compiler.rb +22 -0
- data/lib/interscript/compiler/javascript.rb +292 -0
- data/lib/interscript/compiler/ruby.rb +262 -0
- data/lib/interscript/dsl.rb +67 -0
- data/lib/interscript/dsl/aliases.rb +23 -0
- data/lib/interscript/dsl/document.rb +46 -0
- data/lib/interscript/dsl/group.rb +45 -0
- data/lib/interscript/dsl/group/parallel.rb +6 -0
- data/lib/interscript/dsl/items.rb +89 -0
- data/lib/interscript/dsl/metadata.rb +26 -0
- data/lib/interscript/dsl/stage.rb +6 -0
- data/lib/interscript/dsl/symbol_mm.rb +11 -0
- data/lib/interscript/dsl/tests.rb +12 -0
- data/lib/interscript/interpreter.rb +251 -0
- data/lib/interscript/node.rb +25 -0
- data/lib/interscript/node/alias_def.rb +15 -0
- data/lib/interscript/node/dependency.rb +13 -0
- data/lib/interscript/node/document.rb +45 -0
- data/lib/interscript/node/group.rb +34 -0
- data/lib/interscript/node/group/parallel.rb +9 -0
- data/lib/interscript/node/group/sequential.rb +2 -0
- data/lib/interscript/node/item.rb +52 -0
- data/lib/interscript/node/item/alias.rb +42 -0
- data/lib/interscript/node/item/any.rb +61 -0
- data/lib/interscript/node/item/capture.rb +50 -0
- data/lib/interscript/node/item/group.rb +51 -0
- data/lib/interscript/node/item/repeat.rb +40 -0
- data/lib/interscript/node/item/stage.rb +23 -0
- data/lib/interscript/node/item/string.rb +51 -0
- data/lib/interscript/node/metadata.rb +18 -0
- data/lib/interscript/node/rule.rb +6 -0
- data/lib/interscript/node/rule/funcall.rb +18 -0
- data/lib/interscript/node/rule/run.rb +15 -0
- data/lib/interscript/node/rule/sub.rb +65 -0
- data/lib/interscript/node/stage.rb +19 -0
- data/lib/interscript/node/tests.rb +15 -0
- data/lib/interscript/stdlib.rb +211 -0
- data/lib/interscript/utils/regexp_converter.rb +283 -0
- data/lib/interscript/version.rb +1 -1
- data/requirements.txt +1 -0
- metadata +73 -458
- data/README.adoc +0 -296
- data/aliases.json +0 -1
- data/lib/g2pwrapper.py +0 -34
- data/lib/interscript/fs.rb +0 -96
- data/lib/interscript/mapping.rb +0 -144
- data/lib/interscript/opal.rb +0 -196
- data/lib/interscript/opal/entrypoint.rb +0 -20
- data/lib/interscript/opal/exports.rb +0 -11
- data/lib/interscript/opal/maps.js.erb +0 -8
- data/lib/model-7 +0 -0
- data/lib/tha-pt-b-7 +0 -0
- data/maps/acadsin-zho-Hani-Latn-2002.yaml +0 -38916
- data/maps/alalc-amh-Ethi-Latn-1997.yaml +0 -513
- data/maps/alalc-amh-Ethi-Latn-2011.yaml +0 -138
- data/maps/alalc-ara-Arab-Latn-1997.yaml +0 -1287
- data/maps/alalc-asm-Deva-Latn-1997.yaml +0 -259
- data/maps/alalc-asm-Deva-Latn-2012.yaml +0 -55
- data/maps/alalc-aze-Arab-Latn-1997.yaml +0 -376
- data/maps/alalc-aze-Cyrl-Latn-1997.yaml +0 -145
- data/maps/alalc-bel-Cyrl-Latn-1997.yaml +0 -129
- data/maps/alalc-ben-Beng-Latn-1997.yaml +0 -291
- data/maps/alalc-ben-Beng-Latn-2017.yaml +0 -130
- data/maps/alalc-bul-Cyrl-Latn-1997.yaml +0 -98
- data/maps/alalc-div-Thaa-Latn-1997.yaml +0 -211
- data/maps/alalc-ell-Grek-Latn-1997.yaml +0 -628
- data/maps/alalc-ell-Grek-Latn-2010.yaml +0 -626
- data/maps/alalc-guj-Gujr-Latn-1997.yaml +0 -266
- data/maps/alalc-guj-Gujr-Latn-2011.yaml +0 -64
- data/maps/alalc-hin-Deva-Latn-1997.yaml +0 -303
- data/maps/alalc-hin-Deva-Latn-2011.yaml +0 -65
- data/maps/alalc-kan-Kana-Latn-1997.yaml +0 -274
- data/maps/alalc-kan-Kana-Latn-2011.yaml +0 -63
- data/maps/alalc-kat-Geok-Latn-1997.yaml +0 -111
- data/maps/alalc-kat-Geor-Latn-1997.yaml +0 -150
- data/maps/alalc-kor-Hang-Latn-1997.yaml +0 -98
- data/maps/alalc-mal-Mlym-Latn-1997.yaml +0 -303
- data/maps/alalc-mal-Mlym-Latn-2012.yaml +0 -73
- data/maps/alalc-mar-Deva-Latn-1997.yaml +0 -189
- data/maps/alalc-mar-Deva-Latn-2011.yaml +0 -45
- data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +0 -114
- data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +0 -103
- data/maps/alalc-mon-Cyrl-Latn-1997.yaml +0 -220
- data/maps/alalc-ori-Orya-Latn-1997.yaml +0 -284
- data/maps/alalc-ori-Orya-Latn-2011.yaml +0 -67
- data/maps/alalc-pan-Guru-Latn-1997.yaml +0 -256
- data/maps/alalc-pan-Guru-Latn-2011.yaml +0 -78
- data/maps/alalc-per-Arab-Latn-1997.yaml +0 -375
- data/maps/alalc-pli-Deva-Latn-2012.yaml +0 -144
- data/maps/alalc-pra-Deva-Latn-2012.yaml +0 -47
- data/maps/alalc-rus-Cyrl-Latn-1997.yaml +0 -225
- data/maps/alalc-rus-Cyrl-Latn-2012.yaml +0 -162
- data/maps/alalc-san-Deva-Latn-2012.yaml +0 -241
- data/maps/alalc-sin-Sinh-Latn-1997.yaml +0 -292
- data/maps/alalc-sin-Sinh-Latn-2011.yaml +0 -71
- data/maps/alalc-srp-Cyrl-Latn-1997.yaml +0 -118
- data/maps/alalc-srp-Cyrl-Latn-2013.yaml +0 -135
- data/maps/alalc-tam-Taml-Latn-1997.yaml +0 -62
- data/maps/alalc-tam-Taml-Latn-2011.yaml +0 -58
- data/maps/alalc-tel-Telu-Latn-1997.yaml +0 -284
- data/maps/alalc-tel-Telu-Latn-2011.yaml +0 -64
- data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +0 -145
- data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +0 -16
- data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +0 -283
- data/maps/az-aze-Cyrl-Latn-1939.yaml +0 -105
- data/maps/az-aze-Cyrl-Latn-1958.yaml +0 -45
- data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +0 -174
- data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +0 -169
- data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +0 -292
- data/maps/bgn-kor-Hang-Latn-1943.yaml +0 -35
- data/maps/bgn-kor-Kore-Latn-1943.yaml +0 -31
- data/maps/bgna-bul-Cyrl-Latn-2006.yaml +0 -208
- data/maps/bgna-bul-Cyrl-Latn-2009.yaml +0 -208
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +0 -532
- data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +0 -598
- data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +0 -108
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +0 -111
- data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +0 -188
- data/maps/bgnpcgn-bal-Arab-Latn-2008.yaml +0 -329
- data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +0 -289
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +0 -119
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +0 -42
- data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +0 -184
- data/maps/bgnpcgn-div-Thaa-Latn-1988.yaml +0 -75
- data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +0 -705
- data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +0 -23
- data/maps/bgnpcgn-far-Latn-Latn-1964.yaml +0 -28
- data/maps/bgnpcgn-fas-Arab-Latn-1956.yaml +0 -96
- data/maps/bgnpcgn-isl-Latn-Latn-1964.yaml +0 -37
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +0 -257
- data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +0 -131
- data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +0 -42
- data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.yaml +0 -247
- data/maps/bgnpcgn-kir-Cyrl-Latn-1979.yaml +0 -218
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +0 -253
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +0 -48
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +0 -48
- data/maps/bgnpcgn-kur-Arab-Latn-2007.yaml +0 -249
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +0 -163
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +0 -190
- data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +0 -223
- data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +0 -230
- data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +0 -338
- data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +0 -673
- data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +0 -459
- data/maps/bgnpcgn-pus-Arab-Latn-1968.yaml +0 -377
- data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +0 -168
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +0 -318
- data/maps/bgnpcgn-srp-Cyrl-Latn-1962.yaml +0 -73
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +0 -170
- data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +0 -220
- data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +0 -240
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +0 -166
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +0 -119
- data/maps/bgnpcgn-urd-Arab-Latn-2007.yaml +0 -459
- data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +0 -127
- data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +0 -82
- data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +0 -7456
- data/maps/bis-asm-Beng-Latn-13194-1991.yaml +0 -159
- data/maps/bis-ben-Beng-Latn-13194-1991.yaml +0 -156
- data/maps/bis-dev-Deva-Latn-13194-1991.yaml +0 -184
- data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +0 -181
- data/maps/bis-kan-Kana-Latn-13194-1991.yaml +0 -173
- data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +0 -176
- data/maps/bis-ori-Orya-Latn-13194-1991.yaml +0 -175
- data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +0 -175
- data/maps/bis-tel-Telu-Latn-13194-1991.yaml +0 -170
- data/maps/bis-tml-Taml-Latn-13194-1991.yaml +0 -155
- data/maps/by-bel-Cyrl-Latn-1998.yaml +0 -172
- data/maps/by-bel-Cyrl-Latn-2007.yaml +0 -115
- data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +0 -899
- data/maps/din-hin-Deva-Latn-33904-2018.yaml +0 -100
- data/maps/din-kat-Geor-Latn-32707-2010.yaml +0 -145
- data/maps/din-mar-Deva-Latn-33904-2018.yaml +0 -84
- data/maps/din-nep-Deva-Latn-33904-2018.yaml +0 -119
- data/maps/din-pli-Deva-Latn-33904-2018.yaml +0 -75
- data/maps/din-pra-Deva-Latn-33904-2018.yaml +0 -63
- data/maps/din-san-Deva-Latn-33904-2018.yaml +0 -338
- data/maps/din-tam-Taml-Latn-33903-2016.yaml +0 -213
- data/maps/dos-nep-Deva-Latn-1997.yaml +0 -47
- data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +0 -684
- data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +0 -680
- data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +0 -19
- data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +0 -31
- data/maps/ggg-kat-Geor-Latn-2002.yaml +0 -92
- data/maps/gki-bel-Cyrl-Latn-1992.yaml +0 -33
- data/maps/gki-bel-Cyrl-Latn-2000.yaml +0 -201
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +0 -190
- data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +0 -157
- data/maps/hk-yue-Hani-Latn-1888.yaml +0 -38497
- data/maps/icao-bel-Cyrl-Latn-9303.yaml +0 -136
- data/maps/icao-bul-Cyrl-Latn-9303.yaml +0 -118
- data/maps/icao-fas-Arab-Latn-9303.yaml +0 -103
- data/maps/icao-heb-Hebr-Latn-9303.yaml +0 -151
- data/maps/icao-mkd-Cyrl-Latn-9303.yaml +0 -117
- data/maps/icao-rus-Cyrl-Latn-9303.yaml +0 -117
- data/maps/icao-srp-Cyrl-Latn-9303.yaml +0 -117
- data/maps/icao-ukr-Cyrl-Latn-9303.yaml +0 -119
- data/maps/iso-ara-Arab-Latn-233-1984.yaml +0 -323
- data/maps/iso-asm-Beng-Latn-15919-2001.yaml +0 -75
- data/maps/iso-ben-Beng-Latn-15919-2001.yaml +0 -175
- data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +0 -613
- data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +0 -44
- data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +0 -220
- data/maps/iso-hin-Deva-Latn-15919-2001.yaml +0 -87
- data/maps/iso-inc-Deva-Latn-15919-2001.yaml +0 -61
- data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +0 -66
- data/maps/iso-kan-Kana-Latn-15919-2001.yaml +0 -220
- data/maps/iso-kat-Geor-Latn-9984-1996.yaml +0 -145
- data/maps/iso-kor-Hang-Latn-1996-method1.yaml +0 -240
- data/maps/iso-kor-Hang-Latn-1996-method2.yaml +0 -226
- data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +0 -281
- data/maps/iso-mar-Deva-Latn-15919-2001.yaml +0 -75
- data/maps/iso-nep-Deva-Latn-15919-2001.yaml +0 -87
- data/maps/iso-ori-Orya-Latn-15919-2001.yaml +0 -193
- data/maps/iso-pan-Guru-Latn-15919-2001.yaml +0 -222
- data/maps/iso-pli-Beng-Latn-15919-2001.yaml +0 -73
- data/maps/iso-pli-Deva-Latn-15919-2001.yaml +0 -74
- data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +0 -219
- data/maps/iso-pli-Thai-Latn-15919-2001.yaml +0 -55
- data/maps/iso-pra-Deva-Latn-15919-2001.yaml +0 -59
- data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +0 -366
- data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +0 -271
- data/maps/iso-san-Deva-Latn-15919-2001.yaml +0 -220
- data/maps/iso-tam-Taml-Latn-15919-2001.yaml +0 -159
- data/maps/iso-tel-Telu-Latn-15919-2001.yaml +0 -220
- data/maps/iso-tha-Thai-Latn-11940-1998.yaml +0 -109
- data/maps/kp-kor-Hang-Latn-2002.yaml +0 -909
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +0 -44820
- data/maps/masm-mon-Cyrl-Latn-5217-2012.yaml +0 -163
- data/maps/masm-mon-Latn-Cyrl-5217-2012.yaml +0 -200
- data/maps/mext-jpn-Hrkt-Latn-1954.yaml +0 -411
- data/maps/moct-kor-Hang-Latn-2000.yaml +0 -807
- data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +0 -541
- data/maps/mv-div-Thaa-Latn-1987.yaml +0 -200
- data/maps/mvd-bel-Cyrl-Latn-2008.yaml +0 -225
- data/maps/mvd-bel-Cyrl-Latn-2010.yaml +0 -63
- data/maps/mvd-rus-Cyrl-Latn-2008.yaml +0 -109
- data/maps/mvd-rus-Cyrl-Latn-2010.yaml +0 -37
- data/maps/odni-ara-Arab-Latn-2004.yaml +0 -137
- data/maps/odni-ara-Arab-Latn-2015.yaml +0 -315
- data/maps/odni-aze-Cyrl-Latn-2015.yaml +0 -144
- data/maps/odni-bel-Cyrl-Latn-2015.yaml +0 -148
- data/maps/odni-bul-Cyrl-Latn-2005.yaml +0 -90
- data/maps/odni-bul-Cyrl-Latn-2015.yaml +0 -96
- data/maps/odni-che-Cyrl-Latn-2015.yaml +0 -169
- data/maps/odni-fas-Arab-Latn-2004.yaml +0 -276
- data/maps/odni-fas-Arab-Latn-2015.yaml +0 -406
- data/maps/odni-hin-Deva-Latn-2004.yaml +0 -182
- data/maps/odni-hin-Deva-Latn-2015.yaml +0 -258
- data/maps/odni-kat-Geor-Latn-2015.yaml +0 -87
- data/maps/odni-kaz-Cyrl-Latn-2015.yaml +0 -148
- data/maps/odni-kir-Cyrl-Latn-2015.yaml +0 -136
- data/maps/odni-kor-Hang-Latn-2015.yaml +0 -375
- data/maps/odni-mkd-Cyrl-Latn-2005.yaml +0 -21
- data/maps/odni-mkd-Cyrl-Latn-2015.yaml +0 -122
- data/maps/odni-prs-Arab-Latn-2004.yaml +0 -123
- data/maps/odni-prs-Arab-Latn-2015.yaml +0 -228
- data/maps/odni-rus-Cyrl-Latn-2015.yaml +0 -77
- data/maps/odni-srp-Cyrl-Latn-2005.yaml +0 -36
- data/maps/odni-srp-Cyrl-Latn-2015.yaml +0 -129
- data/maps/odni-tat-Cyrl-Latn-2015.yaml +0 -142
- data/maps/odni-tgk-Cyrl-Latn-2015.yaml +0 -148
- data/maps/odni-tuk-Cyrl-Latn-2015.yaml +0 -170
- data/maps/odni-uig-Cyrl-Latn-2015.yaml +0 -138
- data/maps/odni-ukr-Cyrl-Latn-2015.yaml +0 -161
- data/maps/odni-urd-Arab-Latn-2015.yaml +0 -221
- data/maps/odni-uzb-Cyrl-Latn-2015.yaml +0 -166
- data/maps/royin-tha-Thai-Latn-1939-generic.yaml +0 -90
- data/maps/royin-tha-Thai-Latn-1968.yaml +0 -183
- data/maps/royin-tha-Thai-Latn-1999-chained.yaml +0 -180
- data/maps/royin-tha-Thai-Latn-1999.yaml +0 -80
- data/maps/sac-zho-Hans-Latn-1979.yaml +0 -24763
- data/maps/sasm-mon-Mong-Latn-general-1978.yaml +0 -389
- data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +0 -354
- data/maps/ses-ara-Arab-Latn-1930.yaml +0 -283
- data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +0 -222
- data/maps/ua-ukr-Cyrl-Latn-1996.yaml +0 -197
- data/maps/ua-ukr-Cyrl-Latn-2007.yaml +0 -75
- data/maps/ua-ukr-Cyrl-Latn-2010.yaml +0 -192
- data/maps/un-amh-Ethi-Latn-2016.yaml +0 -602
- data/maps/un-ara-Arab-Latn-1971.yaml +0 -139
- data/maps/un-ara-Arab-Latn-1972.yaml +0 -159
- data/maps/un-ara-Arab-Latn-2017.yaml +0 -420
- data/maps/un-asm-Beng-Latn-1972.yaml +0 -223
- data/maps/un-bel-Cyrl-Latn-2007.yaml +0 -114
- data/maps/un-ben-Beng-Latn-2016.yaml +0 -534
- data/maps/un-ell-Grek-Latn-1987-phonetic.yaml +0 -780
- data/maps/un-ell-Grek-Latn-1987-tl.yaml +0 -31
- data/maps/un-ell-Grek-Latn-1987-ts.yaml +0 -19
- data/maps/un-guj-Gujr-Latn-1972.yaml +0 -229
- data/maps/un-hin-Deva-Latn-2016.yaml +0 -316
- data/maps/un-kan-Kana-Latn-2016.yaml +0 -254
- data/maps/un-mal-Mlym-Latn-1972.yaml +0 -251
- data/maps/un-mar-Deva-Latn-2016.yaml +0 -102
- data/maps/un-mon-Mong-Latn-general-2013.yaml +0 -264
- data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +0 -264
- data/maps/un-nep-Deva-Latn-1972.yaml +0 -269
- data/maps/un-nep-Deva-Latn-2013.yaml +0 -74
- data/maps/un-ori-Orya-Latn-1972.yaml +0 -247
- data/maps/un-pan-Guru-Latn-1972.yaml +0 -402
- data/maps/un-prs-Arab-Latn-1967.yaml +0 -236
- data/maps/un-rus-Cyrl-Latn-1987.yaml +0 -166
- data/maps/un-tam-Taml-Latn-1972.yaml +0 -194
- data/maps/un-tel-Telu-Latn-1972.yaml +0 -270
- data/maps/un-ukr-Cyrl-Latn-1998.yaml +0 -53
- data/maps/un-ukr-Cyrl-Latn-2012.yaml +0 -162
- data/maps/un-urd-Arab-Latn-1972.yaml +0 -405
- data/maps/var-amh-Ethi-Latn-eae-2003.yaml +0 -466
- data/maps/var-gez-Ethi-Latn-eae-2003.yaml +0 -76
- data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +0 -221
- data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +0 -406
- data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +0 -386
- data/maps/var-kor-Hang-Hang-jamo.yaml +0 -11193
- data/maps/var-kor-Hang-Latn-mr-1939.yaml +0 -1054
- data/maps/var-kor-Kore-Hang-2013.yaml +0 -59754
- data/maps/var-kor-Kore-Latn-mr-1939.yaml +0 -36
- data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +0 -43
- data/maps/var-mon-Mong-Latn-1930.yaml +0 -102
- data/maps/var-mon-Mong-Latn-lessing.yaml +0 -272
- data/maps/var-mon-Mong-Latn-vpmc.yaml +0 -274
- data/maps/var-pra-Deva-Latn-iast-1912.yaml +0 -30
- data/maps/var-san-Deva-Latn-iast-1912.yaml +0 -149
- data/maps/var-tha-Thai-Thai-phonemic.yaml +0 -59
- data/maps/var-tha-Thai-Zsym-ipa.yaml +0 -301
- data/maps/var-zho-Hani-Latn-wd-1979.yaml +0 -38912
- data/spec/interscript/filenames_spec.rb +0 -21
- data/spec/interscript/mapping_spec.rb +0 -42
- data/spec/interscript_spec.rb +0 -37
- data/spec/spec_helper.rb +0 -3
@@ -1,73 +0,0 @@
|
|
1
|
-
---
|
2
|
-
authority_id: alalc
|
3
|
-
id: 2012
|
4
|
-
language: iso-639-2:mal
|
5
|
-
source_script: Mlym
|
6
|
-
destination_script: Latn
|
7
|
-
name: Malayalam Romanization, 2012
|
8
|
-
alias:
|
9
|
-
ogc11122:
|
10
|
-
code: mal_Mlym2Latn_ALA_2012
|
11
|
-
description: Malayalam ALA-Library of Congress 2012 System
|
12
|
-
url: https://www.loc.gov/catdir/cpso/romanization/malayalam.pdf
|
13
|
-
creation_date: 2012
|
14
|
-
description: |
|
15
|
-
ALA-LC Romanization table for Malayalam
|
16
|
-
|
17
|
-
|
18
|
-
notes:
|
19
|
-
|
20
|
-
- Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
|
21
|
-
vowels following a consonant can be found in grammars; no distinction between the two is
|
22
|
-
made in transliteration.
|
23
|
-
|
24
|
-
- When ് is used in combination with the vowel u (ഉ്), the combination is also transliterated ȧ.
|
25
|
-
|
26
|
-
- |
|
27
|
-
The vowel a is implicit after all consonants and consonant clusters and is supplied in transliteration, with the following exceptions:
|
28
|
-
a) when another vowel is indicated by its appropriate sign
|
29
|
-
b) when the absence of any vowel is indicated by the superscript sign ് (also used for the vowel ȧ); and
|
30
|
-
c) when the following modified consonantal forms are used:
|
31
|
-
ൿ k
|
32
|
-
ൻ n
|
33
|
-
ൾ ḷ
|
34
|
-
ൺ ṇ
|
35
|
-
ൽ l
|
36
|
-
ർ r
|
37
|
-
- When റ റ appears as a subscript in a cluster (റ്റ), it is transliterated ta.
|
38
|
-
|
39
|
-
- |
|
40
|
-
Exception: Anusvāra is transliterated by:
|
41
|
-
|
42
|
-
a) ṅ before gutturals,
|
43
|
-
b) ñ before palatals,
|
44
|
-
c) ṇ before cerebrals,
|
45
|
-
d) n before dentals, and
|
46
|
-
e) m before labials.
|
47
|
-
|
48
|
-
tests:
|
49
|
-
- source: "ബാർ കോഴ ആവിയായി; മകൻ മാണിയെ വ്യക്തിഹത്യ നടത്തിയവരുടെ കൂടാരത്തിൽ"
|
50
|
-
expected: "bār kōḻa āviyāyi; makan māṇiye vŭyakŭtihatŭya naṭatŭtiyavaruṭe kūṭāratŭtil"
|
51
|
-
- source: "മിഷൻ ശക്തി, ഓപറേഷൻ ശക്തി'; മുഖം മിനുക്കാൻ സ്ത്രീസുരക്ഷാ പദ്ധതികളുമായി"
|
52
|
-
expected: "miṣan śakŭti, ōpaṟēṣan śakŭti'; mukhaṃ minukŭkān sŭtŭrīsurakŭṣā padŭdhatikaḷumāyi"
|
53
|
-
- source: "സംസ്ഥാനത്ത് ബുധനാഴ്ച 6,244 പേര്ക്ക് കോവിഡ്; ൫൭൪൫ പേര്ക്ക് രോഗം സമ"
|
54
|
-
expected: "saṃsŭthānatŭtŭ budhanāḻŭca 6,244 pērŭkŭkŭ kōvid̂ŭ; 5745 pērŭkŭkŭ rēāgaṃ sama"
|
55
|
-
- source: "ശബരിമല തീര്ഥാടനം: സ്പെഷല് കമ്മീഷ്ണറുടെ റിപ്പോര്ട്ട് ഹൈകോടതിയില്"
|
56
|
-
expected: "śabarimala tīrŭthāṭanaṃ: sŭpeṣalŭ kamŭmīṣŭṇaṟuṭe ṟipŭpōrŭṭŭṭŭ haikōṭatiyilŭ"
|
57
|
-
- source: "സജ്ന ഷാജിക്ക് ഐക്യദാര്ഢ്യവുമായി സന്തോഷ് കീഴാറ്റൂര് ബിരിയാണി വില്ക്കും"
|
58
|
-
expected: "sajŭna ṣājikŭkŭ aikŭyadārŭḍhŭyavumāyi sanŭtōṣŭ kīḻāṟŭṟūrŭ biriyāṇi vilŭkŭkuṃ"
|
59
|
-
- source: "ആനപ്പുറത്തിരുന്ന് യോഗാഭ്യാസത്തിനിടെ ബാബ രാംദേവ് നിലത്തുവീണു"
|
60
|
-
expected: "ānapŭpuṟatŭtirunŭnŭ yēāgābhŭyāsatŭtiniṭe bāba rāṃdēvŭ nilatŭtuvīṇu"
|
61
|
-
- source: "സാധാരണക്കാരെൻറ ദീപാവലി നിങ്ങളുടെ കൈയിൽ; മൊറട്ടോറിയം കേസിൽ കേന്ദ്രത്തോട് സുപ്രീംകോടതി"
|
62
|
-
expected: "sādhāraṇakŭkārenṟa dīpāvali niṅŭṅaḷuṭe kaiyil; meāṟaṭŭṭēāṟiyaṃ kēsil kēnŭdŭratŭtēāṭŭ supŭrīṃkēāṭati"
|
63
|
-
- source: "മാണി ഉണ്ടായിരുന്നെങ്കിൽ ഇത്തരമൊരു തീരുമാനം എടുക്കില്ല, ഈ രാഷ്ട്രീയ വഞ്ചന അദ്ദേഹത്തിന്റെ ആത്മാവ് പൊറുക്കില്ല"
|
64
|
-
expected: "māṇi uṇŭṭāyirunŭneṅŭkil itŭtaramoru tīrumānaṃ eṭukŭkilŭla, ī rāṣŭṭŭrīya vañŭcana adŭdēhatŭtinŭṟe ātŭmāvŭ poṟukŭkilŭla"
|
65
|
-
- source: "ധാർമികത വിളമ്പണ്ട, എം.പി, എം.എൽ.എ സ്ഥാനങ്ങൾ രാജിവെക്കൂ എന്ന് ജോസ് കെ. മാണിയോട് ഷാഫി"
|
66
|
-
expected: "dhārmikata viḷamŭpaṇŭṭa, eṃ.pi, eṃ.el.e sŭthānaṅŭṅaḷ rājivekŭkū enŭnŭ jōsŭ ke. māṇiyōṭŭ ṣāphi"
|
67
|
-
- source: "ഞങ്ങൾ ബോക്സിൽ നിന്നും ഒന്നും ഒഴിവാക്കില്ല; ആപ്പിളിനെ ട്രോളി ഷവോമി"
|
68
|
-
expected: "ñaṅŭṅaḷ bēākŭsil ninŭnuṃ onŭnuṃ oḻivākŭkilŭla; āpŭpiḷine ṭŭrēāḷi ṣavēāmi"
|
69
|
-
|
70
|
-
|
71
|
-
map:
|
72
|
-
|
73
|
-
inherit: 'alalc-mal-Mlym-Latn-1997'
|
@@ -1,189 +0,0 @@
|
|
1
|
-
---
|
2
|
-
authority_id: alalc
|
3
|
-
id: 1997
|
4
|
-
language: iso-639-2:mar
|
5
|
-
source_script: Deva
|
6
|
-
destination_script: Latn
|
7
|
-
name: Marathi Romanization, 1997
|
8
|
-
alias:
|
9
|
-
ogc11122:
|
10
|
-
code: mar_Deva2Latn_ALA_1997
|
11
|
-
description: Marathi ALA-Library of Congress 1997 System
|
12
|
-
url: http://catdir.loc.gov/catdir/cpso/romanization/marathi.pdf
|
13
|
-
creation_date: 1997
|
14
|
-
description: |
|
15
|
-
ALA-LC Romanization table for Marathi
|
16
|
-
|
17
|
-
notes:
|
18
|
-
|
19
|
-
- Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
|
20
|
-
vowels following a consonant can be found in grammars; no distinction between the two is
|
21
|
-
made in transliteration.
|
22
|
-
|
23
|
-
- |
|
24
|
-
The vowel a is implicit after all consonants and consonant clusters and is supplied in
|
25
|
-
transliteration, with the following exceptions:
|
26
|
-
|
27
|
-
a) when another vowel is indicated by its appropriate sign; and
|
28
|
-
b) when the absence of any vowel is indicated by the subscript sign ( ् ) called halanta or
|
29
|
-
virāma.
|
30
|
-
|
31
|
-
- |
|
32
|
-
Exception: Anusvāra is transliterated by:
|
33
|
-
|
34
|
-
a) ṅ before gutturals,
|
35
|
-
b) ñ before palatals,
|
36
|
-
c) ṇ before cerebrals,
|
37
|
-
d) n before dentals, and
|
38
|
-
e) m before labials.
|
39
|
-
In other circumstances it is transliterated by a tilde (~) over the vowel.
|
40
|
-
|
41
|
-
- When doubled, avagraha is transliterated by two apostrophes ( ’’ ).
|
42
|
-
|
43
|
-
tests:
|
44
|
-
- source: "ठाणे - जिल्ह्यात बुधवारी एक हजार रुग्णांची वाढ, तर जणांच्या मृत्यूची नोंद"
|
45
|
-
expected: "ṭhaāṇae - jailahayaāta baudhavaāraī eka hajaāra raugaṇaāñcaī vaāḍha, tara jaṇaāñcayaā maṛitayaūcaī naonda"
|
46
|
-
- source: "एकता कपूर पुन्हा अडकली वादात, वेबसीरिजमधल्या 'त्या' सीनमुळे जमावाची घरावर दगडफेक"
|
47
|
-
expected: "ekataā kapaūra paunahaā aḍakalaī vaādaāta, vaebasaīraijamadhalayaā 'tayaā' saīnamaulae jamaāvaācaī gharaāvara dagaḍaphaeka"
|
48
|
-
- source: "जाणून घ्या, बीएमसीच्या अधिकाऱ्यांनी कंगना राणौतच्या ऑफिसमधले नक्की काय- काय तोडलं"
|
49
|
-
expected: "jaāṇaūna ghayaā, baīemasaīcayaā adhaikaāऱyaānnaī kaṅganaā raāṇaautacayaā ôphaisamadhalae nakakaī kaāya- kaāya taoḍalam"
|
50
|
-
- source: "कंगना मुंबईत दाखल होण्यापूर्वी 'मातोश्री'वरून फर्मान सुटले; प्रवक्त्यांना सक्त आदेश"
|
51
|
-
expected: "kaṅganaā maumbaīta daākhala haoṇayaāpaūravaī 'maātaośaraī'varaūna pharamaāna sauṭalae; paravakatayaānnaā sakata ādaeśa"
|
52
|
-
- source: "मराठा आरक्षणास तात्पुरती स्थगिती; सर्वोच्च न्यायालयाचा निर्णय"
|
53
|
-
expected: "maraāṭhaā ārakashaṇaāsa taātapaurataī sathagaitaī; saravaocaca nayaāyaālayaācaā nairaṇaya"
|
54
|
-
- source: "भारताच्या तिन्ही लशींचा पहिला टप्पा यशस्वी, वाचा कधी येणार बाजारात"
|
55
|
-
expected: "bhaārataācayaā tainahaī laśaīñcaā pahailaā ṭapapaā yaśasavaī, vaācaā kadhaī yaeṇaāra baājaāraāta"
|
56
|
-
- source: "रुग्णवाढीमुळे खाटांची चणचण"
|
57
|
-
expected: "raugaṇavaāḍhaīmaulae khaāṭaāñcaī caṇacaṇa"
|
58
|
-
- source: "पीएम स्वनिधी कर्ज योजनेला मुंबईतून अल्प प्रतिसाद"
|
59
|
-
expected: "paīema savanaidhaī karaja yaojanaelaā maumbaītaūna alapa parataisaāda"
|
60
|
-
- source: "सांताक्रूझ-चेंबूर लिंक रोडवरील उन्नत मार्गाला स्थगिती"
|
61
|
-
expected: "saāntaākaraūjha-caembaūra laiṅka raoḍavaraīla unanata maāragaālaā sathagaitaī"
|
62
|
-
- source: "संपादक अर्णब गोस्वामी यांच्याविरूद्ध खडक पोलिस ठाण्यात तक्रार"
|
63
|
-
expected: "sampaādaka araṇaba gaosavaāmaī yaāñcayaāvairaūdadha khaḍaka paolaisa ṭhaāṇayaāta takaraāra"
|
64
|
-
- source: "२५६८७५४४६४४६१६११"
|
65
|
-
expected: "2568754464461611"
|
66
|
-
|
67
|
-
map:
|
68
|
-
|
69
|
-
rules:
|
70
|
-
# note[3]
|
71
|
-
- pattern: \u0902(?=[कखगघङ])
|
72
|
-
result: ṅ
|
73
|
-
- pattern: \u0902(?=[चछजझञ])
|
74
|
-
result: ñ
|
75
|
-
- pattern: \u0902(?=[टठडढण])
|
76
|
-
result: ṇ
|
77
|
-
- pattern: \u0902(?=[तथदधन])
|
78
|
-
result: n
|
79
|
-
|
80
|
-
characters:
|
81
|
-
|
82
|
-
# I. Vowels and Diphthongs (see Note 1)
|
83
|
-
|
84
|
-
'अ': 'a'
|
85
|
-
'आ': 'ā'
|
86
|
-
'इ': 'i'
|
87
|
-
'ई': 'ī'
|
88
|
-
'उ': 'u'
|
89
|
-
'ऊ': 'ū'
|
90
|
-
'ऋ': 'ṛ'
|
91
|
-
'ॠ': 'ṝ'
|
92
|
-
'ऌ': 'ḹ'
|
93
|
-
#'ॳ': 'ĕ'
|
94
|
-
'ए': 'e'
|
95
|
-
'ॲ': 'ê'
|
96
|
-
#'अै': 'ai'
|
97
|
-
'ऐ': 'ai'
|
98
|
-
#'ऒ': 'ŏ'
|
99
|
-
'ओ': 'o'
|
100
|
-
'ऑ': 'ô'
|
101
|
-
'औ': 'ău'
|
102
|
-
|
103
|
-
# II. Consonants
|
104
|
-
# Gutturals
|
105
|
-
'क': 'ka'
|
106
|
-
'ख': 'kha'
|
107
|
-
'ग': 'ga'
|
108
|
-
'घ': 'gha'
|
109
|
-
'ङ': 'ṅa'
|
110
|
-
|
111
|
-
# Palatals
|
112
|
-
'च': 'ca'
|
113
|
-
'छ': 'cha'
|
114
|
-
'ज': 'ja'
|
115
|
-
'झ': 'jha'
|
116
|
-
'ञ': 'ña'
|
117
|
-
|
118
|
-
# Cerebrals
|
119
|
-
'ट': 'ṭa'
|
120
|
-
'ठ': 'ṭha'
|
121
|
-
'ड': 'ḍa'
|
122
|
-
#'ड़': 'ṛa'
|
123
|
-
'ढ': 'ḍha'
|
124
|
-
#'ढ़': 'ṛha'
|
125
|
-
'ण': 'ṇa'
|
126
|
-
|
127
|
-
# Dentals
|
128
|
-
'त': 'ta'
|
129
|
-
'थ': 'tha'
|
130
|
-
'द': 'da'
|
131
|
-
'ध': 'dha'
|
132
|
-
'न': 'na'
|
133
|
-
|
134
|
-
# Labials
|
135
|
-
'प': 'pa'
|
136
|
-
'फ': 'pha'
|
137
|
-
'ब': 'ba'
|
138
|
-
'भ': 'bha'
|
139
|
-
'म': 'ma'
|
140
|
-
|
141
|
-
# Semivowels
|
142
|
-
'य': 'ya'
|
143
|
-
'र': 'ra'
|
144
|
-
'ल': 'la'
|
145
|
-
'ळ': 'la'
|
146
|
-
'व': 'va'
|
147
|
-
|
148
|
-
# Sibilants
|
149
|
-
'श': 'śa'
|
150
|
-
'ष': 'sha'
|
151
|
-
'स': 'sa'
|
152
|
-
|
153
|
-
# Aspirate
|
154
|
-
'ह': 'ha'
|
155
|
-
|
156
|
-
# Anusvāra
|
157
|
-
'ं': 'm'
|
158
|
-
|
159
|
-
# Visarga
|
160
|
-
'ः ': 'ḥ'
|
161
|
-
|
162
|
-
# Avagraha
|
163
|
-
'ऽ': '’' # (apostrophe)
|
164
|
-
|
165
|
-
# Medials # Needed for connecting consonants
|
166
|
-
'ा': "ā"
|
167
|
-
'ि': "i"
|
168
|
-
'ी': "ī"
|
169
|
-
'ु': "u"
|
170
|
-
'ू': "ū"
|
171
|
-
'ृ': "ṛi"
|
172
|
-
'ॄ': "rī"
|
173
|
-
'े': "e"
|
174
|
-
'ो': "o"
|
175
|
-
'ौ': "au"
|
176
|
-
'्': ''
|
177
|
-
|
178
|
-
# digits
|
179
|
-
|
180
|
-
'०': '0'
|
181
|
-
'१': '1'
|
182
|
-
'२': '2'
|
183
|
-
'३': '3'
|
184
|
-
'४': '4'
|
185
|
-
'५': '5'
|
186
|
-
'६': '6'
|
187
|
-
'७': '7'
|
188
|
-
'८': '8'
|
189
|
-
'९': '9'
|
@@ -1,45 +0,0 @@
|
|
1
|
-
---
|
2
|
-
authority_id: alalc
|
3
|
-
id: 2011
|
4
|
-
language: iso-639-2:mar
|
5
|
-
source_script: Deva
|
6
|
-
destination_script: Latn
|
7
|
-
name: Marathi Romanization, 2011
|
8
|
-
url: https://loc.gov/catdir/cpso/romanization/marathi.pdf
|
9
|
-
creation_date: 1997
|
10
|
-
description: |
|
11
|
-
ALA-LC Romanization table for Marathi
|
12
|
-
|
13
|
-
notes:
|
14
|
-
|
15
|
-
- Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
|
16
|
-
vowels following a consonant can be found in grammars; no distinction between the two is
|
17
|
-
made in transliteration.
|
18
|
-
|
19
|
-
- |
|
20
|
-
The vowel a is implicit after all consonants and consonant clusters and is supplied in
|
21
|
-
transliteration, with the following exceptions:
|
22
|
-
|
23
|
-
a) when another vowel is indicated by its appropriate sign; and
|
24
|
-
b) when the absence of any vowel is indicated by the subscript sign ( ् ) called halanta or
|
25
|
-
virāma.
|
26
|
-
|
27
|
-
- |
|
28
|
-
Exception: Anusvāra is transliterated by:
|
29
|
-
|
30
|
-
a) ṅ before gutturals,
|
31
|
-
b) ñ before palatals,
|
32
|
-
c) ṇ before cerebrals,
|
33
|
-
d) n before dentals, and
|
34
|
-
e) m before labials.
|
35
|
-
In other circumstances it is transliterated by a tilde (~) over the vowel.
|
36
|
-
|
37
|
-
- When doubled, avagraha is transliterated by two apostrophes ( ’’ ).
|
38
|
-
|
39
|
-
tests:
|
40
|
-
- source: "कोरोनाच्या लढाईत पोलीस थकलेत, पण हिंमत हरलेले नाहीत; गृहमंत्र्यांकडून कौतुक"
|
41
|
-
expected: "kaoraonaācayaā laḍhaāīta paolaīsa thakalaeta, paṇa haimmata haralaelae naāhaīta; gaṛihamantarayaāṅkaḍaūna kaautauka"
|
42
|
-
|
43
|
-
map:
|
44
|
-
|
45
|
-
inherit: "alalc-mar-Deva-Latn-1997"
|
@@ -1,114 +0,0 @@
|
|
1
|
-
---
|
2
|
-
authority_id: alalc
|
3
|
-
id: 1997
|
4
|
-
language: iso-639-2:mkd
|
5
|
-
source_script: Cyrl
|
6
|
-
destination_script: Latn
|
7
|
-
name: Serbian and Macedonian Romanization, ALA-LC 1997 System
|
8
|
-
url: http://catdir.loc.gov/catdir/cpso/romanization/serbian.pdf
|
9
|
-
creation_date: 1997
|
10
|
-
description: ALA-LC Romanization table for Serbian and Macedonian.
|
11
|
-
|
12
|
-
notes:
|
13
|
-
- Special characters in romanization
|
14
|
-
Đ - D with crossbar (upper case). USMARC hexadecimal code A3.
|
15
|
-
đ - d with crossbar (lower case). USMARC hexadecimal code B3.
|
16
|
-
|
17
|
-
- Character modifiers in romanization
|
18
|
-
´ - acute. USMARC hexadecimal code E2.
|
19
|
-
ˇ - hachek. USMARC hexadecimal code E9.
|
20
|
-
|
21
|
-
tests:
|
22
|
-
- source: Општина Ердут
|
23
|
-
expected: Opština Erdut
|
24
|
-
- source: Општина Двор
|
25
|
-
expected: Opština Dvor
|
26
|
-
- source: ЛУЃЕ луѓе
|
27
|
-
expected: LUǴE luǵe
|
28
|
-
- source: ЅВЕЗДА ѕвезда Ѕвезда
|
29
|
-
expected: DZVEZDA dzvezda Dzvezda
|
30
|
-
- source: ЌАРУВАЊЕ ќарување
|
31
|
-
expected: ḰARUVANJE ḱaruvanje
|
32
|
-
|
33
|
-
map:
|
34
|
-
postrules:
|
35
|
-
# DZ
|
36
|
-
- pattern: "((?<=[[:upper:]])Dz(?=[[:upper:]])?|(?<=[[:upper:]])?Dz(?=[[:upper:]]))"
|
37
|
-
result: "DZ"
|
38
|
-
#LJ
|
39
|
-
- pattern: "((?<=[[:upper:]])Lj(?=[[:upper:]])?|(?<=[[:upper:]])?Lj(?=[[:upper:]]))"
|
40
|
-
result: "LJ"
|
41
|
-
#NJ
|
42
|
-
- pattern: "((?<=[[:upper:]])Nj(?=[[:upper:]])?|(?<=[[:upper:]])?Nj(?=[[:upper:]]))"
|
43
|
-
result: "NJ"
|
44
|
-
#DŽ
|
45
|
-
- pattern: "((?<=[[:upper:]])Dž(?=[[:upper:]])?|(?<=[[:upper:]])?Dž(?=[[:upper:]]))"
|
46
|
-
result: "DŽ"
|
47
|
-
|
48
|
-
characters:
|
49
|
-
"\u0410": "A"
|
50
|
-
"\u0411": "B"
|
51
|
-
"\u0412": "V"
|
52
|
-
"\u0413": "G"
|
53
|
-
"\u0403": "\u01F4" # Ǵ
|
54
|
-
"\u0414": "D"
|
55
|
-
"\u0402": "\u0110" # Đ
|
56
|
-
"\u0415": "E"
|
57
|
-
"\u0416": "\u005a\u030c" # Ž
|
58
|
-
"\u0417": "Z"
|
59
|
-
"\u0405": "Dz"
|
60
|
-
"\u0418": "I"
|
61
|
-
"\u0408": "J"
|
62
|
-
"\u041A": "K"
|
63
|
-
"\u040C": "\u1E30" # Ḱ
|
64
|
-
"\u041B": "L"
|
65
|
-
"\u0409": "Lj"
|
66
|
-
"\u041C": "M"
|
67
|
-
"\u041D": "N"
|
68
|
-
"\u040A": "Nj"
|
69
|
-
"\u041E": "O"
|
70
|
-
"\u041F": "P"
|
71
|
-
"\u0420": "R"
|
72
|
-
"\u0421": "S"
|
73
|
-
"\u0422": "T"
|
74
|
-
"\u040B": "\u0043\u0301" # Ć
|
75
|
-
"\u0423": "U"
|
76
|
-
"\u0424": "F"
|
77
|
-
"\u0425": "H"
|
78
|
-
"\u0426": "C"
|
79
|
-
"\u0427": "\u0043\u030c" # Č
|
80
|
-
"\u040F": "D\u007a\u030c" # Dž
|
81
|
-
"\u0428": "\u0053\u030c" # Š
|
82
|
-
"\u0430": "a"
|
83
|
-
"\u0431": "b"
|
84
|
-
"\u0432": "v"
|
85
|
-
"\u0433": "g"
|
86
|
-
"\u0453": "\u01F5" # ǵ
|
87
|
-
"\u0434": "d"
|
88
|
-
"\u0452": "\u0111" # đ
|
89
|
-
"\u0435": "e"
|
90
|
-
"\u0436": "\u007a\u030c" # ž
|
91
|
-
"\u0437": "z"
|
92
|
-
"\u0455": "dz"
|
93
|
-
"\u0438": "i"
|
94
|
-
"\u0458": "j"
|
95
|
-
"\u043A": "k"
|
96
|
-
"\u045C": "\u1E31" # ḱ
|
97
|
-
"\u043B": "l"
|
98
|
-
"\u0459": "lj"
|
99
|
-
"\u043C": "m"
|
100
|
-
"\u043D": "n"
|
101
|
-
"\u045A": "nj"
|
102
|
-
"\u043E": "o"
|
103
|
-
"\u043F": "p"
|
104
|
-
"\u0440": "r"
|
105
|
-
"\u0441": "s"
|
106
|
-
"\u0442": "t"
|
107
|
-
"\u045B": "\u0063\u0301" # ć
|
108
|
-
"\u0443": "u"
|
109
|
-
"\u0444": "f"
|
110
|
-
"\u0445": "h"
|
111
|
-
"\u0446": "c"
|
112
|
-
"\u0447": "\u0063\u030c" # č
|
113
|
-
"\u045F": "d\u007a\u030c" # dž
|
114
|
-
"\u0448": "\u0073\u030c" # š
|
@@ -1,103 +0,0 @@
|
|
1
|
-
---
|
2
|
-
authority_id: alalc
|
3
|
-
id: 2013
|
4
|
-
language: iso-639-2:mkd
|
5
|
-
source_script: Cyrl
|
6
|
-
destination_script: Latn
|
7
|
-
name: Macedonian Romanization, ALA-LC 2013 System
|
8
|
-
url: https://www.loc.gov/catdir/cpso/romanization/macedonian.pdf
|
9
|
-
creation_date: 2013
|
10
|
-
description: ALA-LC Romanization table for Macedonian.
|
11
|
-
|
12
|
-
tests:
|
13
|
-
- source: Општина Ердут
|
14
|
-
expected: Opština Erdut
|
15
|
-
- source: Општина Двор
|
16
|
-
expected: Opština Dvor
|
17
|
-
- source: ЛУЃЕ луѓе
|
18
|
-
expected: LUǴE luǵe
|
19
|
-
- source: ЅВЕЗДА ѕвезда Ѕвезда
|
20
|
-
expected: DZVEZDA dzvezda Dzvezda
|
21
|
-
- source: ЌАРУВАЊЕ ќарување
|
22
|
-
expected: ḰARUVANJE ḱaruvanje
|
23
|
-
|
24
|
-
map:
|
25
|
-
postrules:
|
26
|
-
# DZ
|
27
|
-
- pattern: "((?<=[[:upper:]])Dz(?=[[:upper:]])?|(?<=[[:upper:]])?Dz(?=[[:upper:]]))"
|
28
|
-
result: "DZ"
|
29
|
-
#LJ
|
30
|
-
- pattern: "((?<=[[:upper:]])Lj(?=[[:upper:]])?|(?<=[[:upper:]])?Lj(?=[[:upper:]]))"
|
31
|
-
result: "LJ"
|
32
|
-
#NJ
|
33
|
-
- pattern: "((?<=[[:upper:]])Nj(?=[[:upper:]])?|(?<=[[:upper:]])?Nj(?=[[:upper:]]))"
|
34
|
-
result: "NJ"
|
35
|
-
#DŽ
|
36
|
-
- pattern: "((?<=[[:upper:]])Dž(?=[[:upper:]])?|(?<=[[:upper:]])?Dž(?=[[:upper:]]))"
|
37
|
-
result: "DŽ"
|
38
|
-
|
39
|
-
characters:
|
40
|
-
"\u0410": "A"
|
41
|
-
"\u0411": "B"
|
42
|
-
"\u0412": "V"
|
43
|
-
"\u0413": "G"
|
44
|
-
"\u0403": "\u01F4" # Ǵ
|
45
|
-
"\u0414": "D"
|
46
|
-
"\u0402": "\u0110" # Đ
|
47
|
-
"\u0415": "E"
|
48
|
-
"\u0416": "\u005a\u030c" # Ž
|
49
|
-
"\u0417": "Z"
|
50
|
-
"\u0405": "Dz"
|
51
|
-
"\u0418": "I"
|
52
|
-
"\u0408": "J"
|
53
|
-
"\u041A": "K"
|
54
|
-
"\u040C": "\u1E30" # Ḱ
|
55
|
-
"\u041B": "L"
|
56
|
-
"\u0409": "Lj"
|
57
|
-
"\u041C": "M"
|
58
|
-
"\u041D": "N"
|
59
|
-
"\u040A": "Nj"
|
60
|
-
"\u041E": "O"
|
61
|
-
"\u041F": "P"
|
62
|
-
"\u0420": "R"
|
63
|
-
"\u0421": "S"
|
64
|
-
"\u0422": "T"
|
65
|
-
"\u0423": "U"
|
66
|
-
"\u0424": "F"
|
67
|
-
"\u0425": "H"
|
68
|
-
"\u0426": "C"
|
69
|
-
"\u0427": "\u0043\u030c" # Č
|
70
|
-
"\u040F": "D\u007a\u030c" # Dž
|
71
|
-
"\u0428": "\u0053\u030c" # Š
|
72
|
-
"\u0430": "a"
|
73
|
-
"\u0431": "b"
|
74
|
-
"\u0432": "v"
|
75
|
-
"\u0433": "g"
|
76
|
-
"\u0453": "\u01F5" # ǵ
|
77
|
-
"\u0434": "d"
|
78
|
-
"\u0452": "\u0111" # đ
|
79
|
-
"\u0435": "e"
|
80
|
-
"\u0436": "\u007a\u030c" # ž
|
81
|
-
"\u0437": "z"
|
82
|
-
"\u0455": "dz"
|
83
|
-
"\u0438": "i"
|
84
|
-
"\u0458": "j"
|
85
|
-
"\u043A": "k"
|
86
|
-
"\u045C": "\u1E31" # ḱ
|
87
|
-
"\u043B": "l"
|
88
|
-
"\u0459": "lj"
|
89
|
-
"\u043C": "m"
|
90
|
-
"\u043D": "n"
|
91
|
-
"\u045A": "nj"
|
92
|
-
"\u043E": "o"
|
93
|
-
"\u043F": "p"
|
94
|
-
"\u0440": "r"
|
95
|
-
"\u0441": "s"
|
96
|
-
"\u0442": "t"
|
97
|
-
"\u0443": "u"
|
98
|
-
"\u0444": "f"
|
99
|
-
"\u0445": "h"
|
100
|
-
"\u0446": "c"
|
101
|
-
"\u0447": "\u0063\u030c" # č
|
102
|
-
"\u045F": "d\u007a\u030c" # dž
|
103
|
-
"\u0448": "\u0073\u030c" # š
|