interscript 0.1.9 → 2.0.5
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/.gitignore +11 -0
- data/.rspec +3 -0
- data/Gemfile +29 -0
- data/LICENSE.adoc +31 -0
- data/README.md +3 -0
- data/Rakefile +53 -0
- data/bin/console +14 -0
- data/bin/interscript +5 -0
- data/bin/maps_analyze_staging +168 -0
- data/bin/maps_debug_compilers +58 -0
- data/bin/maps_debug_ordering +88 -0
- data/bin/maps_debug_ruby_compile +24 -0
- data/bin/maps_debug_step_by_step +44 -0
- data/bin/maps_optimize_order +112 -0
- data/bin/maps_v1_analyze_regexps +45 -0
- data/bin/maps_v1_to_v2 +426 -0
- data/bin/setup +8 -0
- data/exe/interscript +6 -0
- data/interscript.gemspec +31 -0
- data/lib/interscript.rb +80 -135
- data/lib/interscript/command.rb +5 -5
- data/lib/interscript/compiler.rb +22 -0
- data/lib/interscript/compiler/javascript.rb +292 -0
- data/lib/interscript/compiler/ruby.rb +262 -0
- data/lib/interscript/dsl.rb +67 -0
- data/lib/interscript/dsl/aliases.rb +23 -0
- data/lib/interscript/dsl/document.rb +46 -0
- data/lib/interscript/dsl/group.rb +45 -0
- data/lib/interscript/dsl/group/parallel.rb +6 -0
- data/lib/interscript/dsl/items.rb +89 -0
- data/lib/interscript/dsl/metadata.rb +26 -0
- data/lib/interscript/dsl/stage.rb +6 -0
- data/lib/interscript/dsl/symbol_mm.rb +11 -0
- data/lib/interscript/dsl/tests.rb +12 -0
- data/lib/interscript/interpreter.rb +251 -0
- data/lib/interscript/node.rb +25 -0
- data/lib/interscript/node/alias_def.rb +15 -0
- data/lib/interscript/node/dependency.rb +13 -0
- data/lib/interscript/node/document.rb +45 -0
- data/lib/interscript/node/group.rb +34 -0
- data/lib/interscript/node/group/parallel.rb +9 -0
- data/lib/interscript/node/group/sequential.rb +2 -0
- data/lib/interscript/node/item.rb +52 -0
- data/lib/interscript/node/item/alias.rb +42 -0
- data/lib/interscript/node/item/any.rb +61 -0
- data/lib/interscript/node/item/capture.rb +50 -0
- data/lib/interscript/node/item/group.rb +51 -0
- data/lib/interscript/node/item/repeat.rb +40 -0
- data/lib/interscript/node/item/stage.rb +23 -0
- data/lib/interscript/node/item/string.rb +51 -0
- data/lib/interscript/node/metadata.rb +18 -0
- data/lib/interscript/node/rule.rb +6 -0
- data/lib/interscript/node/rule/funcall.rb +18 -0
- data/lib/interscript/node/rule/run.rb +15 -0
- data/lib/interscript/node/rule/sub.rb +65 -0
- data/lib/interscript/node/stage.rb +19 -0
- data/lib/interscript/node/tests.rb +15 -0
- data/lib/interscript/stdlib.rb +211 -0
- data/lib/interscript/utils/regexp_converter.rb +283 -0
- data/lib/interscript/version.rb +1 -1
- data/requirements.txt +1 -0
- metadata +73 -458
- data/README.adoc +0 -296
- data/aliases.json +0 -1
- data/lib/g2pwrapper.py +0 -34
- data/lib/interscript/fs.rb +0 -96
- data/lib/interscript/mapping.rb +0 -144
- data/lib/interscript/opal.rb +0 -196
- data/lib/interscript/opal/entrypoint.rb +0 -20
- data/lib/interscript/opal/exports.rb +0 -11
- data/lib/interscript/opal/maps.js.erb +0 -8
- data/lib/model-7 +0 -0
- data/lib/tha-pt-b-7 +0 -0
- data/maps/acadsin-zho-Hani-Latn-2002.yaml +0 -38916
- data/maps/alalc-amh-Ethi-Latn-1997.yaml +0 -513
- data/maps/alalc-amh-Ethi-Latn-2011.yaml +0 -138
- data/maps/alalc-ara-Arab-Latn-1997.yaml +0 -1287
- data/maps/alalc-asm-Deva-Latn-1997.yaml +0 -259
- data/maps/alalc-asm-Deva-Latn-2012.yaml +0 -55
- data/maps/alalc-aze-Arab-Latn-1997.yaml +0 -376
- data/maps/alalc-aze-Cyrl-Latn-1997.yaml +0 -145
- data/maps/alalc-bel-Cyrl-Latn-1997.yaml +0 -129
- data/maps/alalc-ben-Beng-Latn-1997.yaml +0 -291
- data/maps/alalc-ben-Beng-Latn-2017.yaml +0 -130
- data/maps/alalc-bul-Cyrl-Latn-1997.yaml +0 -98
- data/maps/alalc-div-Thaa-Latn-1997.yaml +0 -211
- data/maps/alalc-ell-Grek-Latn-1997.yaml +0 -628
- data/maps/alalc-ell-Grek-Latn-2010.yaml +0 -626
- data/maps/alalc-guj-Gujr-Latn-1997.yaml +0 -266
- data/maps/alalc-guj-Gujr-Latn-2011.yaml +0 -64
- data/maps/alalc-hin-Deva-Latn-1997.yaml +0 -303
- data/maps/alalc-hin-Deva-Latn-2011.yaml +0 -65
- data/maps/alalc-kan-Kana-Latn-1997.yaml +0 -274
- data/maps/alalc-kan-Kana-Latn-2011.yaml +0 -63
- data/maps/alalc-kat-Geok-Latn-1997.yaml +0 -111
- data/maps/alalc-kat-Geor-Latn-1997.yaml +0 -150
- data/maps/alalc-kor-Hang-Latn-1997.yaml +0 -98
- data/maps/alalc-mal-Mlym-Latn-1997.yaml +0 -303
- data/maps/alalc-mal-Mlym-Latn-2012.yaml +0 -73
- data/maps/alalc-mar-Deva-Latn-1997.yaml +0 -189
- data/maps/alalc-mar-Deva-Latn-2011.yaml +0 -45
- data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +0 -114
- data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +0 -103
- data/maps/alalc-mon-Cyrl-Latn-1997.yaml +0 -220
- data/maps/alalc-ori-Orya-Latn-1997.yaml +0 -284
- data/maps/alalc-ori-Orya-Latn-2011.yaml +0 -67
- data/maps/alalc-pan-Guru-Latn-1997.yaml +0 -256
- data/maps/alalc-pan-Guru-Latn-2011.yaml +0 -78
- data/maps/alalc-per-Arab-Latn-1997.yaml +0 -375
- data/maps/alalc-pli-Deva-Latn-2012.yaml +0 -144
- data/maps/alalc-pra-Deva-Latn-2012.yaml +0 -47
- data/maps/alalc-rus-Cyrl-Latn-1997.yaml +0 -225
- data/maps/alalc-rus-Cyrl-Latn-2012.yaml +0 -162
- data/maps/alalc-san-Deva-Latn-2012.yaml +0 -241
- data/maps/alalc-sin-Sinh-Latn-1997.yaml +0 -292
- data/maps/alalc-sin-Sinh-Latn-2011.yaml +0 -71
- data/maps/alalc-srp-Cyrl-Latn-1997.yaml +0 -118
- data/maps/alalc-srp-Cyrl-Latn-2013.yaml +0 -135
- data/maps/alalc-tam-Taml-Latn-1997.yaml +0 -62
- data/maps/alalc-tam-Taml-Latn-2011.yaml +0 -58
- data/maps/alalc-tel-Telu-Latn-1997.yaml +0 -284
- data/maps/alalc-tel-Telu-Latn-2011.yaml +0 -64
- data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +0 -145
- data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +0 -16
- data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +0 -283
- data/maps/az-aze-Cyrl-Latn-1939.yaml +0 -105
- data/maps/az-aze-Cyrl-Latn-1958.yaml +0 -45
- data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +0 -174
- data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +0 -169
- data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +0 -292
- data/maps/bgn-kor-Hang-Latn-1943.yaml +0 -35
- data/maps/bgn-kor-Kore-Latn-1943.yaml +0 -31
- data/maps/bgna-bul-Cyrl-Latn-2006.yaml +0 -208
- data/maps/bgna-bul-Cyrl-Latn-2009.yaml +0 -208
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +0 -532
- data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +0 -598
- data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +0 -108
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +0 -111
- data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +0 -188
- data/maps/bgnpcgn-bal-Arab-Latn-2008.yaml +0 -329
- data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +0 -289
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +0 -119
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +0 -42
- data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +0 -184
- data/maps/bgnpcgn-div-Thaa-Latn-1988.yaml +0 -75
- data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +0 -705
- data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +0 -23
- data/maps/bgnpcgn-far-Latn-Latn-1964.yaml +0 -28
- data/maps/bgnpcgn-fas-Arab-Latn-1956.yaml +0 -96
- data/maps/bgnpcgn-isl-Latn-Latn-1964.yaml +0 -37
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +0 -257
- data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +0 -131
- data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +0 -42
- data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.yaml +0 -247
- data/maps/bgnpcgn-kir-Cyrl-Latn-1979.yaml +0 -218
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +0 -253
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +0 -48
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +0 -48
- data/maps/bgnpcgn-kur-Arab-Latn-2007.yaml +0 -249
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +0 -163
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +0 -190
- data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +0 -223
- data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +0 -230
- data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +0 -338
- data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +0 -673
- data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +0 -459
- data/maps/bgnpcgn-pus-Arab-Latn-1968.yaml +0 -377
- data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +0 -168
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +0 -318
- data/maps/bgnpcgn-srp-Cyrl-Latn-1962.yaml +0 -73
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +0 -170
- data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +0 -220
- data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +0 -240
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +0 -166
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +0 -119
- data/maps/bgnpcgn-urd-Arab-Latn-2007.yaml +0 -459
- data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +0 -127
- data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +0 -82
- data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +0 -7456
- data/maps/bis-asm-Beng-Latn-13194-1991.yaml +0 -159
- data/maps/bis-ben-Beng-Latn-13194-1991.yaml +0 -156
- data/maps/bis-dev-Deva-Latn-13194-1991.yaml +0 -184
- data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +0 -181
- data/maps/bis-kan-Kana-Latn-13194-1991.yaml +0 -173
- data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +0 -176
- data/maps/bis-ori-Orya-Latn-13194-1991.yaml +0 -175
- data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +0 -175
- data/maps/bis-tel-Telu-Latn-13194-1991.yaml +0 -170
- data/maps/bis-tml-Taml-Latn-13194-1991.yaml +0 -155
- data/maps/by-bel-Cyrl-Latn-1998.yaml +0 -172
- data/maps/by-bel-Cyrl-Latn-2007.yaml +0 -115
- data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +0 -899
- data/maps/din-hin-Deva-Latn-33904-2018.yaml +0 -100
- data/maps/din-kat-Geor-Latn-32707-2010.yaml +0 -145
- data/maps/din-mar-Deva-Latn-33904-2018.yaml +0 -84
- data/maps/din-nep-Deva-Latn-33904-2018.yaml +0 -119
- data/maps/din-pli-Deva-Latn-33904-2018.yaml +0 -75
- data/maps/din-pra-Deva-Latn-33904-2018.yaml +0 -63
- data/maps/din-san-Deva-Latn-33904-2018.yaml +0 -338
- data/maps/din-tam-Taml-Latn-33903-2016.yaml +0 -213
- data/maps/dos-nep-Deva-Latn-1997.yaml +0 -47
- data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +0 -684
- data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +0 -680
- data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +0 -19
- data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +0 -31
- data/maps/ggg-kat-Geor-Latn-2002.yaml +0 -92
- data/maps/gki-bel-Cyrl-Latn-1992.yaml +0 -33
- data/maps/gki-bel-Cyrl-Latn-2000.yaml +0 -201
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +0 -190
- data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +0 -157
- data/maps/hk-yue-Hani-Latn-1888.yaml +0 -38497
- data/maps/icao-bel-Cyrl-Latn-9303.yaml +0 -136
- data/maps/icao-bul-Cyrl-Latn-9303.yaml +0 -118
- data/maps/icao-fas-Arab-Latn-9303.yaml +0 -103
- data/maps/icao-heb-Hebr-Latn-9303.yaml +0 -151
- data/maps/icao-mkd-Cyrl-Latn-9303.yaml +0 -117
- data/maps/icao-rus-Cyrl-Latn-9303.yaml +0 -117
- data/maps/icao-srp-Cyrl-Latn-9303.yaml +0 -117
- data/maps/icao-ukr-Cyrl-Latn-9303.yaml +0 -119
- data/maps/iso-ara-Arab-Latn-233-1984.yaml +0 -323
- data/maps/iso-asm-Beng-Latn-15919-2001.yaml +0 -75
- data/maps/iso-ben-Beng-Latn-15919-2001.yaml +0 -175
- data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +0 -613
- data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +0 -44
- data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +0 -220
- data/maps/iso-hin-Deva-Latn-15919-2001.yaml +0 -87
- data/maps/iso-inc-Deva-Latn-15919-2001.yaml +0 -61
- data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +0 -66
- data/maps/iso-kan-Kana-Latn-15919-2001.yaml +0 -220
- data/maps/iso-kat-Geor-Latn-9984-1996.yaml +0 -145
- data/maps/iso-kor-Hang-Latn-1996-method1.yaml +0 -240
- data/maps/iso-kor-Hang-Latn-1996-method2.yaml +0 -226
- data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +0 -281
- data/maps/iso-mar-Deva-Latn-15919-2001.yaml +0 -75
- data/maps/iso-nep-Deva-Latn-15919-2001.yaml +0 -87
- data/maps/iso-ori-Orya-Latn-15919-2001.yaml +0 -193
- data/maps/iso-pan-Guru-Latn-15919-2001.yaml +0 -222
- data/maps/iso-pli-Beng-Latn-15919-2001.yaml +0 -73
- data/maps/iso-pli-Deva-Latn-15919-2001.yaml +0 -74
- data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +0 -219
- data/maps/iso-pli-Thai-Latn-15919-2001.yaml +0 -55
- data/maps/iso-pra-Deva-Latn-15919-2001.yaml +0 -59
- data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +0 -366
- data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +0 -271
- data/maps/iso-san-Deva-Latn-15919-2001.yaml +0 -220
- data/maps/iso-tam-Taml-Latn-15919-2001.yaml +0 -159
- data/maps/iso-tel-Telu-Latn-15919-2001.yaml +0 -220
- data/maps/iso-tha-Thai-Latn-11940-1998.yaml +0 -109
- data/maps/kp-kor-Hang-Latn-2002.yaml +0 -909
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +0 -44820
- data/maps/masm-mon-Cyrl-Latn-5217-2012.yaml +0 -163
- data/maps/masm-mon-Latn-Cyrl-5217-2012.yaml +0 -200
- data/maps/mext-jpn-Hrkt-Latn-1954.yaml +0 -411
- data/maps/moct-kor-Hang-Latn-2000.yaml +0 -807
- data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +0 -541
- data/maps/mv-div-Thaa-Latn-1987.yaml +0 -200
- data/maps/mvd-bel-Cyrl-Latn-2008.yaml +0 -225
- data/maps/mvd-bel-Cyrl-Latn-2010.yaml +0 -63
- data/maps/mvd-rus-Cyrl-Latn-2008.yaml +0 -109
- data/maps/mvd-rus-Cyrl-Latn-2010.yaml +0 -37
- data/maps/odni-ara-Arab-Latn-2004.yaml +0 -137
- data/maps/odni-ara-Arab-Latn-2015.yaml +0 -315
- data/maps/odni-aze-Cyrl-Latn-2015.yaml +0 -144
- data/maps/odni-bel-Cyrl-Latn-2015.yaml +0 -148
- data/maps/odni-bul-Cyrl-Latn-2005.yaml +0 -90
- data/maps/odni-bul-Cyrl-Latn-2015.yaml +0 -96
- data/maps/odni-che-Cyrl-Latn-2015.yaml +0 -169
- data/maps/odni-fas-Arab-Latn-2004.yaml +0 -276
- data/maps/odni-fas-Arab-Latn-2015.yaml +0 -406
- data/maps/odni-hin-Deva-Latn-2004.yaml +0 -182
- data/maps/odni-hin-Deva-Latn-2015.yaml +0 -258
- data/maps/odni-kat-Geor-Latn-2015.yaml +0 -87
- data/maps/odni-kaz-Cyrl-Latn-2015.yaml +0 -148
- data/maps/odni-kir-Cyrl-Latn-2015.yaml +0 -136
- data/maps/odni-kor-Hang-Latn-2015.yaml +0 -375
- data/maps/odni-mkd-Cyrl-Latn-2005.yaml +0 -21
- data/maps/odni-mkd-Cyrl-Latn-2015.yaml +0 -122
- data/maps/odni-prs-Arab-Latn-2004.yaml +0 -123
- data/maps/odni-prs-Arab-Latn-2015.yaml +0 -228
- data/maps/odni-rus-Cyrl-Latn-2015.yaml +0 -77
- data/maps/odni-srp-Cyrl-Latn-2005.yaml +0 -36
- data/maps/odni-srp-Cyrl-Latn-2015.yaml +0 -129
- data/maps/odni-tat-Cyrl-Latn-2015.yaml +0 -142
- data/maps/odni-tgk-Cyrl-Latn-2015.yaml +0 -148
- data/maps/odni-tuk-Cyrl-Latn-2015.yaml +0 -170
- data/maps/odni-uig-Cyrl-Latn-2015.yaml +0 -138
- data/maps/odni-ukr-Cyrl-Latn-2015.yaml +0 -161
- data/maps/odni-urd-Arab-Latn-2015.yaml +0 -221
- data/maps/odni-uzb-Cyrl-Latn-2015.yaml +0 -166
- data/maps/royin-tha-Thai-Latn-1939-generic.yaml +0 -90
- data/maps/royin-tha-Thai-Latn-1968.yaml +0 -183
- data/maps/royin-tha-Thai-Latn-1999-chained.yaml +0 -180
- data/maps/royin-tha-Thai-Latn-1999.yaml +0 -80
- data/maps/sac-zho-Hans-Latn-1979.yaml +0 -24763
- data/maps/sasm-mon-Mong-Latn-general-1978.yaml +0 -389
- data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +0 -354
- data/maps/ses-ara-Arab-Latn-1930.yaml +0 -283
- data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +0 -222
- data/maps/ua-ukr-Cyrl-Latn-1996.yaml +0 -197
- data/maps/ua-ukr-Cyrl-Latn-2007.yaml +0 -75
- data/maps/ua-ukr-Cyrl-Latn-2010.yaml +0 -192
- data/maps/un-amh-Ethi-Latn-2016.yaml +0 -602
- data/maps/un-ara-Arab-Latn-1971.yaml +0 -139
- data/maps/un-ara-Arab-Latn-1972.yaml +0 -159
- data/maps/un-ara-Arab-Latn-2017.yaml +0 -420
- data/maps/un-asm-Beng-Latn-1972.yaml +0 -223
- data/maps/un-bel-Cyrl-Latn-2007.yaml +0 -114
- data/maps/un-ben-Beng-Latn-2016.yaml +0 -534
- data/maps/un-ell-Grek-Latn-1987-phonetic.yaml +0 -780
- data/maps/un-ell-Grek-Latn-1987-tl.yaml +0 -31
- data/maps/un-ell-Grek-Latn-1987-ts.yaml +0 -19
- data/maps/un-guj-Gujr-Latn-1972.yaml +0 -229
- data/maps/un-hin-Deva-Latn-2016.yaml +0 -316
- data/maps/un-kan-Kana-Latn-2016.yaml +0 -254
- data/maps/un-mal-Mlym-Latn-1972.yaml +0 -251
- data/maps/un-mar-Deva-Latn-2016.yaml +0 -102
- data/maps/un-mon-Mong-Latn-general-2013.yaml +0 -264
- data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +0 -264
- data/maps/un-nep-Deva-Latn-1972.yaml +0 -269
- data/maps/un-nep-Deva-Latn-2013.yaml +0 -74
- data/maps/un-ori-Orya-Latn-1972.yaml +0 -247
- data/maps/un-pan-Guru-Latn-1972.yaml +0 -402
- data/maps/un-prs-Arab-Latn-1967.yaml +0 -236
- data/maps/un-rus-Cyrl-Latn-1987.yaml +0 -166
- data/maps/un-tam-Taml-Latn-1972.yaml +0 -194
- data/maps/un-tel-Telu-Latn-1972.yaml +0 -270
- data/maps/un-ukr-Cyrl-Latn-1998.yaml +0 -53
- data/maps/un-ukr-Cyrl-Latn-2012.yaml +0 -162
- data/maps/un-urd-Arab-Latn-1972.yaml +0 -405
- data/maps/var-amh-Ethi-Latn-eae-2003.yaml +0 -466
- data/maps/var-gez-Ethi-Latn-eae-2003.yaml +0 -76
- data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +0 -221
- data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +0 -406
- data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +0 -386
- data/maps/var-kor-Hang-Hang-jamo.yaml +0 -11193
- data/maps/var-kor-Hang-Latn-mr-1939.yaml +0 -1054
- data/maps/var-kor-Kore-Hang-2013.yaml +0 -59754
- data/maps/var-kor-Kore-Latn-mr-1939.yaml +0 -36
- data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +0 -43
- data/maps/var-mon-Mong-Latn-1930.yaml +0 -102
- data/maps/var-mon-Mong-Latn-lessing.yaml +0 -272
- data/maps/var-mon-Mong-Latn-vpmc.yaml +0 -274
- data/maps/var-pra-Deva-Latn-iast-1912.yaml +0 -30
- data/maps/var-san-Deva-Latn-iast-1912.yaml +0 -149
- data/maps/var-tha-Thai-Thai-phonemic.yaml +0 -59
- data/maps/var-tha-Thai-Zsym-ipa.yaml +0 -301
- data/maps/var-zho-Hani-Latn-wd-1979.yaml +0 -38912
- data/spec/interscript/filenames_spec.rb +0 -21
- data/spec/interscript/mapping_spec.rb +0 -42
- data/spec/interscript_spec.rb +0 -37
- data/spec/spec_helper.rb +0 -3
@@ -1,65 +0,0 @@
|
|
1
|
-
---
|
2
|
-
authority_id: alalc
|
3
|
-
id: 2011
|
4
|
-
language: iso-639-2:hin
|
5
|
-
source_script: Deva
|
6
|
-
destination_script: Latn
|
7
|
-
name: Hindi Romanization, 2011
|
8
|
-
url: https://www.loc.gov/catdir/cpso/romanization/hindi.pdf
|
9
|
-
creation_date: 1997
|
10
|
-
description: |
|
11
|
-
ALA-LC Romanization table for Hindi
|
12
|
-
|
13
|
-
notes:
|
14
|
-
|
15
|
-
- Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
|
16
|
-
vowels following a consonant can be found in grammars; no distinction between the two is
|
17
|
-
made in transliteration.
|
18
|
-
|
19
|
-
- |
|
20
|
-
The vowel a is implicit after all consonants and consonant clusters and is supplied in
|
21
|
-
transliteration, with the following exceptions:
|
22
|
-
|
23
|
-
a) when another vowel is indicated by its appropriate sign; and
|
24
|
-
b) when the absence of any vowel is indicated by the subscript sign ( ◌् ) called halanta or
|
25
|
-
virāma.
|
26
|
-
|
27
|
-
- |
|
28
|
-
Exception: Anusvāra is transliterated by:
|
29
|
-
|
30
|
-
a) ṅ before gutturals,
|
31
|
-
b) ñ before palatals,
|
32
|
-
c) ṇ before cerebrals,
|
33
|
-
d) n before dentals, and
|
34
|
-
e) m before labials.
|
35
|
-
|
36
|
-
- Anunāsika before guttural, palatal, cerebral, and dental occlusives is transliterated n̐. Before
|
37
|
-
labials, sibilants, semivowels, aspirates, vowels, and in final position it is transliterated m̐.
|
38
|
-
|
39
|
-
- When doubled, avagraha is transliterated by two apostrophes ( ’’ ).
|
40
|
-
|
41
|
-
tests:
|
42
|
-
- source: "इस चुनौतीपूर्ण समय में 'वर्क फ्रॉम होम’ सामान्य बन चुका है"
|
43
|
-
expected: "is cunăutīpūrṇ samay meṃ 'vark phrôm homa’ sāmāny ban cukā hai"
|
44
|
-
- source: "दिल्ली में त्योहार पर खरीददारी करने निकले बड़ी संख्या में लोग, कई जगहों पर लगा भीषण जाम"
|
45
|
-
expected: "dillī meṃ tyohār par kharīdadārī karane nikale baṛī saṃkhyā meṃ loga, kaī jagahoṃ par lagā bhīshaṇ jāma"
|
46
|
-
- source: "सरकार ने पेंशन भोगियों को लाइफ सर्टिफिकेट जमा कराने के मामले में दी बड़ी राहत"
|
47
|
-
expected: "sarakār ne peṃśan bhogiyoṃ ko lāiph sarṭiphikeṭ jamā karāne ke māmale meṃ dī baṛī rāhata"
|
48
|
-
- source: "कांग्रेस ने माना उसके लचर प्रदर्शन ने डुबोई महागठबंधन की लुटिया, पार्टी में उठने लगी आत्ममंथन की आवाज"
|
49
|
-
expected: "kāṃgres ne mānā usake lacar pradarśan ne ḍuboī mahāgaṭhabandhan kī luṭiyā, pārṭī meṃ uṭhane lagī ātmamanthan kī āvāja"
|
50
|
-
- source: "डिजिटल पेमेंट सिस्टम ने छोटे-मध्यम कारोबारों का दिया साथ, कोरोना की परेशानियों को किया कम"
|
51
|
-
expected: "ḍijiṭal pemeṃṭ sisṭam ne choṭe-madhyam kārobāroṃ kā diyā sātha, koronā kī pareśāniyoṃ ko kiyā kama"
|
52
|
-
- source: "छोटे व्यापारियों को ढूंढें, उनसे खरीदें और उनका साथ दें"
|
53
|
-
expected: "choṭe vyāpāriyoṃ ko ḍhūṃḍheṃ, unase kharīdeṃ ăur unakā sāth deṃ"
|
54
|
-
- source: "भारत के साथ साझीदारी को महत्व देंगे बाइडन, ओबामा प्रशासन में रहीं वरिष्ठ अधिकारी एलिसा ने जताई उम्मीद"
|
55
|
-
expected: "bhārat ke sāth sājhīdārī ko mahatv deṃge bāiḍana, obāmā praśāsan meṃ rahīṃ varishṭh adhikārī elisā ne jatāī ummīda"
|
56
|
-
- source: "दो महीने से कोमा में था युवक, चिकन की चर्चा सुनते ही आया होश"
|
57
|
-
expected: "do mahīne se komā meṃ thā yuvaka, cikan kī carcā sunate hī āyā hośa"
|
58
|
-
- source: "कोरोना के टीके पर खुशखबरी, भारत पहुंची रूसी वैक्सीन की पहली खेप"
|
59
|
-
expected: "koronā ke ṭīke par khuśakhabarī, bhārat pahuṃcī rūsī vaiksīn kī pahalī khepa"
|
60
|
-
- source: "दिल्ली के गांधी नगर स्थित एक दुकान में लगी भीषण आग, दमकल की 20 गाड़ियां मौके पर"
|
61
|
-
expected: "dillī ke gāṃdhī nagar sthit ek dukān meṃ lagī bhīshaṇ āga, damakal kī 20 gāṛiyāṃ măuke para"
|
62
|
-
|
63
|
-
map:
|
64
|
-
|
65
|
-
inherit: "alalc-hin-Deva-Latn-1997"
|
@@ -1,274 +0,0 @@
|
|
1
|
-
---
|
2
|
-
authority_id: alalc
|
3
|
-
id: 1997
|
4
|
-
language: iso-639-2:kan
|
5
|
-
source_script: Kana
|
6
|
-
destination_script: Latn
|
7
|
-
name: Kannada Romanization, 1997
|
8
|
-
url: http://catdir.loc.gov/catdir/cpso/romanization/kannada.pdf
|
9
|
-
creation_date: 1997
|
10
|
-
description: |
|
11
|
-
ALA-LC Romanization table for Kannada
|
12
|
-
|
13
|
-
notes:
|
14
|
-
|
15
|
-
- Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
|
16
|
-
vowels following a consonant can be found in grammars; no distinction between the two is
|
17
|
-
made in transliteration.
|
18
|
-
|
19
|
-
- |
|
20
|
-
The vowel a is implicit after all consonants and consonant clusters and is supplied in
|
21
|
-
transliteration, with the following exceptions:
|
22
|
-
|
23
|
-
a) when another vowel is indicated by its appropriate sign; and
|
24
|
-
b) when the absence of any vowel is indicated by the superscript sign (◌್).
|
25
|
-
|
26
|
-
- |
|
27
|
-
Exception: Anusvāra is transliterated by:
|
28
|
-
|
29
|
-
a) ṅ before gutturals,
|
30
|
-
b) ñ before palatals,
|
31
|
-
c) ṇ before cerebrals,
|
32
|
-
d) n before dentals, and
|
33
|
-
e) m before labials.
|
34
|
-
|
35
|
-
|
36
|
-
tests:
|
37
|
-
- source: "ಕರ್ಣಾಟಕ"
|
38
|
-
expected: "karṇāṭaka"
|
39
|
-
- source: "ಬೆಂಗಳೂರು"
|
40
|
-
expected: "beṅgaḷūru"
|
41
|
-
- source: "ಉಡುಪಿಯಲ್ಲಿ ಪ್ರಪ್ರಥಮ ಬಾರಿಗೆ ಪ್ರಾರಂಭವಾಗಿರುವ ದೇಶಿ ಉತ್ಪನ್ನಗಳ ಮಳಿಗೆ"
|
42
|
-
expected: "uḍupiyalli praprathama bārige prāraṃbhavāgiruva dēśi utpannagaḷa maḷige"
|
43
|
-
- source: "ದೇವರ ಹೆಸರು ಬಳಸಿ ಆನ್ಲೈನ್ ಬೆಟ್ಟಿಂಗ್!"
|
44
|
-
expected: "dēvara hesaru baḷasi ānlain beṭṭiṃg!"
|
45
|
-
- source: "ಚಿಕ್ಕಮಗಳೂರು : ಪುಷ್ಪ ಸಮರ್ಪಣೆ ವೇಳೆ ಮಗಳನ್ನ ನೆನೆದು ಕಣ್ಣೀರಿಟ್ಟ ಮೃತ ಪೇದೆ ತಾಯಿ"
|
46
|
-
expected: "cikkamagaḷūru : puṣpa samarpaṇe vēḷe magaḷanna nenedu kaṇṇīriṭṭa mṛta pēde tāyi"
|
47
|
-
- source: "ಸ್ವಾಮಿತ್ವ: ಹೊಸ ಯೋಜನೆಯಿಂದ ನಮಗೆ ಏನು ಲಾಭ ?"
|
48
|
-
expected: "svāmitva: hosa yōjaneyinda namage ēnu lābha ?"
|
49
|
-
- source: "ಮರಳು ಸಾಗಾಣಿಕೆ ವ್ಯವಹಾರ ಆಗಬಾರದು :ಅಧಿಕಾರಿಗಳಿಗೆ ಖಡಕ್ ಸೂಚನೆ ನೀಡಿದ ಜಿಲ್ಲಾಧಿಕಾರಿ"
|
50
|
-
expected: "maraḷu sāgāṇike vyavahāra āgabāradu :adhikārigaḷige khaḍak sūcane nīḍida jillādhikāri"
|
51
|
-
- source: "ಹಾವೇರಿ ಜಿಲ್ಲೆಯಲ್ಲಿ ೯೭ ಜನರಲ್ಲಿ ಕೋವಿಡ್ ಸೋಂಕು ಪತ್ತೆ ; 54 ಮಂದಿ ಗುಣಮುಖ"
|
52
|
-
expected: "hāvēri jilleyalli 97 janaralli kōviḍ sōṃku patte ; 54 maṃdi guṇamukha"
|
53
|
-
- source: "ಸಿಂದಗಿ ಐಸಿಐಸಿಐ ಬ್ಯಾಂಕ್ ಸೆಕ್ಯುರಿಟಿ ಗಾರ್ಡ್ ಹತ್ಯೆ ಪ್ರಕರಣ ಭೇದಿಸಿದ ಪೊಲೀಸರು"
|
54
|
-
expected: "sindagi aisiaisiai byāṃk sekyuriṭi gārḍ hatye prakaraṇa bhēdisida polīsaru"
|
55
|
-
- source: "ಬ್ಯಾಂಕರ್ಗಳೊಂದಿಗೆ ಡಿವಿ ಸಭೆ : ಆಧ್ಯತಾ ವಲಯ, ಸಾಲ ಯೋಜನೆ ತ್ವರಿತ ಮಂಜೂರಿಗೆ ಸೂಚನೆ"
|
56
|
-
expected: "byāṅkargaḷoṃdige ḍivi sabhe : ādhyatā valaya, sāla yōjane tvarita maṃjūrige sūcane"
|
57
|
-
- source: "ಪೊಲೀಸ್ ಇಲಾಖೆ ಸಮಗ್ರ ಅಭಿವೃದ್ಧಿ; ಡಿಜಿಪಿ ನೇತೃತ್ವದಲ್ಲಿ ಸಮಿತಿ ರಚನೆ: ಬೊಮ್ಮಾಯಿ"
|
58
|
-
expected: "polīs ilākhe samagra abhivṛddhi; ḍijipi nētṛtvadalli samiti racane: beūmmāyi"
|
59
|
-
- source: "ಕೆಟ್ಟಿರುವ ರಸ್ತೆಗಳ ದುರಸ್ತಿಗೆ ಸರಕಾರದ ಯೋಜನೆ"
|
60
|
-
expected: "keṭṭiruva rastegaḷa durastige sarakārada yōjane"
|
61
|
-
|
62
|
-
map:
|
63
|
-
|
64
|
-
|
65
|
-
rules:
|
66
|
-
# to cover diacritic and vowel less consonants rule II
|
67
|
-
- pattern: ([ಕ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
68
|
-
result: 'k'
|
69
|
-
- pattern: ([ಖ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
70
|
-
result: 'kh'
|
71
|
-
- pattern: ([ಗ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
72
|
-
result: 'g'
|
73
|
-
- pattern: ([ಘ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
74
|
-
result: 'gh'
|
75
|
-
- pattern: ([ಙ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
76
|
-
result: 'ṅ'
|
77
|
-
- pattern: ([ಚ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
78
|
-
result: 'c'
|
79
|
-
- pattern: ([ಛ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
80
|
-
result: 'ch'
|
81
|
-
- pattern: ([ಜ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
82
|
-
result: 'j'
|
83
|
-
- pattern: ([ಝ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
84
|
-
result: 'jh'
|
85
|
-
- pattern: ([ಞ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
86
|
-
result: 'ñ'
|
87
|
-
- pattern: ([ಟ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
88
|
-
result: 'ṭ'
|
89
|
-
- pattern: ([ಠ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
90
|
-
result: 'ṭh'
|
91
|
-
- pattern: ([ಡ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
92
|
-
result: 'ḍ'
|
93
|
-
- pattern: ([ಢ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
94
|
-
result: 'ḍh'
|
95
|
-
- pattern: ([ಣ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
96
|
-
result: 'ṇ'
|
97
|
-
- pattern: ([ತ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
98
|
-
result: 't'
|
99
|
-
- pattern: ([ಥ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
100
|
-
result: 'th'
|
101
|
-
- pattern: ([ದ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
102
|
-
result: 'd'
|
103
|
-
- pattern: ([ಧ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
104
|
-
result: 'dh'
|
105
|
-
- pattern: ([ನ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
106
|
-
result: 'n'
|
107
|
-
- pattern: ([ಪ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
108
|
-
result: 'p'
|
109
|
-
- pattern: ([ಫ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
110
|
-
result: 'ph'
|
111
|
-
- pattern: ([ಬ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
112
|
-
result: 'b'
|
113
|
-
- pattern: ([ಭ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
114
|
-
result: 'bh'
|
115
|
-
- pattern: ([ಮ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
116
|
-
result: 'm'
|
117
|
-
- pattern: ([ಯ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
118
|
-
result: 'y'
|
119
|
-
- pattern: ([ರ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
120
|
-
result: 'r'
|
121
|
-
- pattern: ([ಱ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
122
|
-
result: 'ṟ'
|
123
|
-
- pattern: ([ಲ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
124
|
-
result: 'l'
|
125
|
-
- pattern: ([ಳ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
126
|
-
result: 'ḷ'
|
127
|
-
- pattern: ([ೞ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
128
|
-
result: 'l̤'
|
129
|
-
- pattern: ([ವ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
130
|
-
result: 'v'
|
131
|
-
- pattern: ([ಶ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
132
|
-
result: 'ś'
|
133
|
-
- pattern: ([ಷ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
134
|
-
result: 'ṣ'
|
135
|
-
- pattern: ([ಸ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
136
|
-
result: 's'
|
137
|
-
- pattern: ([ಹ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
138
|
-
result: 'h'
|
139
|
-
|
140
|
-
# rule[III]
|
141
|
-
- pattern: \u0C82(?=[ಕಖಗಘಙ])
|
142
|
-
result: ṅ
|
143
|
-
- pattern: \u0C82(?=[ಚಛಜಝಞ])
|
144
|
-
result: ñ
|
145
|
-
- pattern: \u0C82(?=[ಟಠಡಢಣ])
|
146
|
-
result: ṇ
|
147
|
-
- pattern: \u0C82(?=[ತಥದಧನ])
|
148
|
-
result: n
|
149
|
-
|
150
|
-
characters:
|
151
|
-
'ಅ': 'a'
|
152
|
-
'ಆ': 'ā'
|
153
|
-
'ಇ': 'i'
|
154
|
-
'ಈ': 'ī'
|
155
|
-
'ಉ': 'u'
|
156
|
-
'ಊ': 'ū'
|
157
|
-
'ಋ': 'ṛ'
|
158
|
-
'ೠ': 'ṝ'
|
159
|
-
|
160
|
-
'ಌ': 'ḻ'
|
161
|
-
|
162
|
-
'ಎ': 'e'
|
163
|
-
'ಏ': 'ē'
|
164
|
-
'ಐ': 'ai'
|
165
|
-
|
166
|
-
'ಒ': 'o'
|
167
|
-
'ಓ': 'ō'
|
168
|
-
'ಔ': 'au'
|
169
|
-
|
170
|
-
# Gutturals
|
171
|
-
'ಕ': 'ka'
|
172
|
-
'ಖ': 'kha'
|
173
|
-
'ಗ': 'ga'
|
174
|
-
'ಘ': 'gha'
|
175
|
-
'ಙ': 'ṅa'
|
176
|
-
|
177
|
-
# Palatals
|
178
|
-
'ಚ': 'ca'
|
179
|
-
'ಛ': 'cha'
|
180
|
-
'ಜ': 'ja'
|
181
|
-
'ಝ': 'jha'
|
182
|
-
'ಞ': 'ña'
|
183
|
-
|
184
|
-
# Cerebrals
|
185
|
-
'ಟ': 'ṭa'
|
186
|
-
'ಠ': 'ṭha'
|
187
|
-
'ಡ': 'ḍa'
|
188
|
-
'ಢ': 'ḍha'
|
189
|
-
'ಣ': 'ṇa'
|
190
|
-
|
191
|
-
# Dentals
|
192
|
-
'ತ': 'ta'
|
193
|
-
'ಥ': 'tha'
|
194
|
-
'ದ': 'da'
|
195
|
-
'ಧ': 'dha'
|
196
|
-
'ನ': 'na'
|
197
|
-
|
198
|
-
# Labials
|
199
|
-
'ಪ': 'pa'
|
200
|
-
'ಫ': 'pha'
|
201
|
-
'ಬ': 'ba'
|
202
|
-
'ಭ': 'bha'
|
203
|
-
'ಮ': 'ma'
|
204
|
-
|
205
|
-
# Semivowels
|
206
|
-
'ಯ': 'ya'
|
207
|
-
'ರ': 'ra'
|
208
|
-
'ಱ': 'ṟa'
|
209
|
-
'ಲ': 'la'
|
210
|
-
'ಳ': 'ḷa'
|
211
|
-
'ೞ': 'l̤a'
|
212
|
-
|
213
|
-
|
214
|
-
'ವ': 'va'
|
215
|
-
|
216
|
-
# Sibilants
|
217
|
-
'ಶ': 'śa'
|
218
|
-
'ಷ': 'ṣa'
|
219
|
-
'ಸ': 'sa'
|
220
|
-
|
221
|
-
|
222
|
-
# Aspirate
|
223
|
-
'ಹ': 'ha'
|
224
|
-
|
225
|
-
|
226
|
-
# Bisarga
|
227
|
-
'ಃ': 'ḥ'
|
228
|
-
|
229
|
-
# Anusvāra
|
230
|
-
'ಂ': 'ṃ'
|
231
|
-
|
232
|
-
'\u0cbc': '' #nukta
|
233
|
-
|
234
|
-
# Medials # Needed for connecting constants
|
235
|
-
'ಾ': "ā"
|
236
|
-
'ಿ': "i"
|
237
|
-
'ೀ': "ī"
|
238
|
-
'ು': "u"
|
239
|
-
'ೂ': "ū"
|
240
|
-
'ೃ': "ṛ"
|
241
|
-
'ೄ': "ṝ"
|
242
|
-
'\u0CE2': 'ḻ' # KANNADA VOWEL SIGN VOCALIC L ( ೢ)
|
243
|
-
|
244
|
-
|
245
|
-
'ೆ': "e"
|
246
|
-
'ೇ': "ē"
|
247
|
-
'ೈ': "ai"
|
248
|
-
|
249
|
-
|
250
|
-
'ೊ': 'o'
|
251
|
-
'ೋ': 'ō'
|
252
|
-
'ೌ': 'au'
|
253
|
-
|
254
|
-
|
255
|
-
'्': ''
|
256
|
-
'़': ''
|
257
|
-
'್': '' # used for pronounciation without vowel
|
258
|
-
"": '' # no need for zero with joiner
|
259
|
-
"": '' # no need for zero with non joiner
|
260
|
-
|
261
|
-
|
262
|
-
|
263
|
-
# Digits
|
264
|
-
|
265
|
-
'೦': '0'
|
266
|
-
'೧': '1'
|
267
|
-
'೨': '2'
|
268
|
-
'೩': '3'
|
269
|
-
'೪': '4'
|
270
|
-
'೫': '5'
|
271
|
-
'೬': '6'
|
272
|
-
'೭': '7'
|
273
|
-
'೮': '8'
|
274
|
-
'೯': '9'
|
@@ -1,63 +0,0 @@
|
|
1
|
-
---
|
2
|
-
authority_id: alalc
|
3
|
-
id: 2011
|
4
|
-
language: iso-639-2:kan
|
5
|
-
source_script: Kana
|
6
|
-
destination_script: Latn
|
7
|
-
name: Kannada Romanization, 2011
|
8
|
-
url: http://catdir.loc.gov/catdir/cpso/romanization/kannada.pdf
|
9
|
-
creation_date: 2011
|
10
|
-
description: |
|
11
|
-
ALA-LC Romanization table for Kannada
|
12
|
-
|
13
|
-
notes:
|
14
|
-
|
15
|
-
- Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
|
16
|
-
vowels following a consonant can be found in grammars; no distinction between the two is
|
17
|
-
made in transliteration.
|
18
|
-
|
19
|
-
- |
|
20
|
-
The vowel a is implicit after all consonants and consonant clusters and is supplied in
|
21
|
-
transliteration, with the following exceptions:
|
22
|
-
|
23
|
-
a) when another vowel is indicated by its appropriate sign; and
|
24
|
-
b) when the absence of any vowel is indicated by the superscript sign (◌್).
|
25
|
-
|
26
|
-
- |
|
27
|
-
Exception: Anusvāra is transliterated by:
|
28
|
-
|
29
|
-
a) ṅ before gutturals,
|
30
|
-
b) ñ before palatals,
|
31
|
-
c) ṇ before cerebrals,
|
32
|
-
d) n before dentals, and
|
33
|
-
e) m before labials.
|
34
|
-
|
35
|
-
|
36
|
-
tests:
|
37
|
-
- source: "ಕರ್ಣಾಟಕ"
|
38
|
-
expected: "karṇāṭaka"
|
39
|
-
- source: "ಬೆಂಗಳೂರು"
|
40
|
-
expected: "beṅgaḷūru"
|
41
|
-
- source: "ಭಾರತದಲ್ಲಿ ಗಾಳಿ ಕಲುಷಿತವಾಗಿದೆ: ಹವಾಮಾನ ಬದಲಾವಣೆ ಸಮರ್ಥನೆಗೆ ಭಾರತವನ್ನು ಟೀಕಿಸಿದ ಟ್ರಂಪ್"
|
42
|
-
expected: "bhāratadalli gāḷi kaluṣitavāgide: havāmāna badalāvaṇe samarthanege bhāratavannu ṭīkisida ṭraṃp"
|
43
|
-
- source: "ಅಮೆರಿಕ ಅಧ್ಯಕ್ಷೀಯ ಚುನಾವಣೆ ಅಂತಿಮ ಚರ್ಚೆ: ಭಾರತದ ವಿರುದ್ಧ ಟ್ರಂಪ್ ಆರೋಪವೇನು?!"
|
44
|
-
expected: "amerika adhyakṣīya cunāvaṇe aṃtima carce: bhāratada viruddha ṭraṃp ārōpavēnu?!"
|
45
|
-
- source: "ಹೇಗಿದೆ ಅಮೆರಿಕನ್ ಚುನಾವಣ ಕಣ?"
|
46
|
-
expected: "hēgide amerikan cunāvaṇa kaṇa?"
|
47
|
-
- source: "ಫ್ರೀಜರ್ ನಲ್ಲಿಟ್ಟ ನೂಡಲ್ಸ್ ತಿಂದು ಒಂದೇ ಕುಟುಂಬದ ೯ ಮಂದಿ ಸಾವು: ೩ ಮಕ್ಕಳು ಅಪಾಯದಿಂದ ಪಾರು"
|
48
|
-
expected: "phrījar nalliṭṭa nūḍals tiṃdu oṃdē kuṭuṃbada 9 maṃdi sāvu: 3 makkaḷu apāyadinda pāru"
|
49
|
-
- source: "ಉಡುಪಿಯಲ್ಲಿ ಪ್ರಪ್ರಥಮ ಬಾರಿಗೆ ಪ್ರಾರಂಭವಾಗಿರುವ ದೇಶಿ ಉತ್ಪನ್ನಗಳ ಮಳಿಗೆ"
|
50
|
-
expected: "uḍupiyalli praprathama bārige prāraṃbhavāgiruva dēśi utpannagaḷa maḷige"
|
51
|
-
- source: "ಚಿಕ್ಕಮಗಳೂರು : ಪುಷ್ಪ ಸಮರ್ಪಣೆ ವೇಳೆ ಮಗಳನ್ನ ನೆನೆದು ಕಣ್ಣೀರಿಟ್ಟ ಮೃತ ಪೇದೆ ತಾಯಿ"
|
52
|
-
expected: "cikkamagaḷūru : puṣpa samarpaṇe vēḷe magaḷanna nenedu kaṇṇīriṭṭa mṛta pēde tāyi"
|
53
|
-
- source: "ಸಮಂಗಳೂರು: ಡ್ರಗ್ಸ್ ಜಾಗೃತಿ ಬರಹದಿಂದ ಗಮನಸೆಳೆಯುತ್ತಿದೆ ಸಿಟಿ ಬಸ್"
|
54
|
-
expected: "samaṅgaḷūru: ḍrags jāgṛti barahadinda gamanaseḷeyuttide siṭi bas"
|
55
|
-
- source: "ಪುರಸಭೆ, ಪಪಂ ಅಧ್ಯಕ್ಷ-ಉಪಾಧ್ಯಕ್ಷ ಚುನಾವಣೆಗೆ ಹೈಕೋರ್ಟ್ ಅಸ್ತು"
|
56
|
-
expected: "purasabhe, papaṃ adhyakṣa-upādhyakṣa cunāvaṇege haikōrṭ astu"
|
57
|
-
- source: "ಅಮೆರಿಕ ಅಧ್ಯಕ್ಷೀಯ ಚುನಾವಣೆ ಅಂತಿಮ ಚರ್ಚೆ: ಭಾರತದ ವಿರುದ್ಧ ಟ್ರಂಪ್ ಆರೋಪವೇನು?"
|
58
|
-
expected: "amerika adhyakṣīya cunāvaṇe aṃtima carce: bhāratada viruddha ṭraṃp ārōpavēnu?"
|
59
|
-
- source: "ಮನೆ ಕುಸಿದು ತಂದೆ ಮತ್ತು ಮಗ ಸಾವು, ಇನ್ನಿಬ್ಬರಿಗೆ ಗಾಯ: ಸ್ಥಳಕ್ಕೆ ಶಾಸಕರ ಭೇಟಿ"
|
60
|
-
expected: "mane kusidu taṃde mattu maga sāvu, innibbarige gāya: sthaḷakke śāsakara bhēṭi"
|
61
|
-
|
62
|
-
map:
|
63
|
-
inherit: 'alalc-kan-Kana-Latn-1997'
|
@@ -1,111 +0,0 @@
|
|
1
|
-
---
|
2
|
-
authority_id: alalc
|
3
|
-
id: 1997
|
4
|
-
language: iso-639-2:kat
|
5
|
-
source_script: Geok
|
6
|
-
destination_script: Latn
|
7
|
-
name: ALA-LC Georgian System (1997)
|
8
|
-
url: https://www.loc.gov/catdir/cpso/romanization/georgian.pdf
|
9
|
-
creation_date: 1997
|
10
|
-
confirmation_date: 1997
|
11
|
-
description: |
|
12
|
-
Values are shown for the Khutsuri alphabet.
|
13
|
-
|
14
|
-
notes:
|
15
|
-
|
16
|
-
tests:
|
17
|
-
|
18
|
-
- source: ႼႨႢႬႨ
|
19
|
-
expected: CIGNI
|
20
|
-
|
21
|
-
- source: ⴜⴈⴂⴌⴈ
|
22
|
-
expected: cigni
|
23
|
-
|
24
|
-
- source: ႱႭႪႭႫႭႬ
|
25
|
-
expected: SOLOMON
|
26
|
-
|
27
|
-
- source: ⴑⴍⴊⴍⴋⴍⴌ
|
28
|
-
expected: solomon
|
29
|
-
|
30
|
-
- source: ႠႡႰႠჀႠႫ
|
31
|
-
expected: ABRAHAM
|
32
|
-
|
33
|
-
map:
|
34
|
-
characters:
|
35
|
-
'\u10a0' : 'A' # Ⴀ
|
36
|
-
'\u10a1' : 'B' # Ⴁ
|
37
|
-
'\u10a2' : 'G' # Ⴂ
|
38
|
-
'\u10a3' : 'D' # Ⴃ
|
39
|
-
'\u10a4' : 'E' # Ⴄ
|
40
|
-
'\u10a5' : 'V' # Ⴅ
|
41
|
-
'\u10a6' : 'Z' # Ⴆ
|
42
|
-
'\u10a7' : 'Tʻ' # Ⴇ
|
43
|
-
'\u10a8' : 'I' # Ⴈ
|
44
|
-
'\u10a9' : 'K' # Ⴉ
|
45
|
-
'\u10aa' : 'L' # Ⴊ
|
46
|
-
'\u10ab' : 'M' # Ⴋ
|
47
|
-
'\u10ac' : 'N' # Ⴌ
|
48
|
-
'\u10ad' : 'O' # Ⴍ
|
49
|
-
'\u10ae' : 'P' # Ⴎ
|
50
|
-
'\u10af' : 'Ž' # Ⴏ
|
51
|
-
'\u10b0' : 'R' # Ⴐ
|
52
|
-
'\u10b1' : 'S' # Ⴑ
|
53
|
-
'\u10b2' : 'T' # Ⴒ
|
54
|
-
'\u10b3' : 'U' # Ⴓ
|
55
|
-
'\u10b4' : 'Pʻ' # Ⴔ
|
56
|
-
'\u10b5' : 'Kʻ' # Ⴕ
|
57
|
-
'\u10b6' : 'Ġ' # Ⴖ
|
58
|
-
'\u10b7' : 'Q' # Ⴗ
|
59
|
-
'\u10b8' : 'Š' # Ⴘ
|
60
|
-
'\u10b9' : 'Čʻ' # Ⴙ
|
61
|
-
'\u10ba' : 'Cʻ' # Ⴚ
|
62
|
-
'\u10bb' : 'Ż' # Ⴛ
|
63
|
-
'\u10bc' : 'C' # Ⴜ
|
64
|
-
'\u10bd' : 'Č' # Ⴝ
|
65
|
-
'\u10be' : 'X' # Ⴞ
|
66
|
-
'\u10bf' : 'J' # Ⴟ
|
67
|
-
'\u10c0' : 'H' # Ⴠ
|
68
|
-
'\u10c1' : 'Ē' # Ⴡ
|
69
|
-
'\u10c2' : 'Y' # Ⴢ
|
70
|
-
'\u10c3' : 'W' # Ⴣ
|
71
|
-
'\u10c4' : 'X̣' # Ⴤ
|
72
|
-
'\u10c5' : 'Ō' # Ⴥ
|
73
|
-
|
74
|
-
'\u2d00' : 'a' # ⴀ
|
75
|
-
'\u2d01' : 'b' # ⴁ
|
76
|
-
'\u2d02' : 'g' # ⴂ
|
77
|
-
'\u2d03' : 'd' # ⴃ
|
78
|
-
'\u2d04' : 'e' # ⴄ
|
79
|
-
'\u2d05' : 'v' # ⴅ
|
80
|
-
'\u2d06' : 'z' # ⴆ
|
81
|
-
'\u2d07' : 'tʻ' # ⴇ
|
82
|
-
'\u2d08' : 'i' # ⴈ
|
83
|
-
'\u2d09' : 'k' # ⴉ
|
84
|
-
'\u2d0a' : 'l' # ⴊ
|
85
|
-
'\u2d0b' : 'm' # ⴋ
|
86
|
-
'\u2d0c' : 'n' # ⴌ
|
87
|
-
'\u2d0d' : 'o' # ⴍ
|
88
|
-
'\u2d0e' : 'p' # ⴎ
|
89
|
-
'\u2d0f' : 'ž' # ⴏ
|
90
|
-
'\u2d10' : 'r' # ⴐ
|
91
|
-
'\u2d11' : 's' # ⴑ
|
92
|
-
'\u2d12' : 't' # ⴒ
|
93
|
-
'\u2d13' : 'u' # ⴓ
|
94
|
-
'\u2d14' : 'pʻ' # ⴔ
|
95
|
-
'\u2d15' : 'kʻ' # ⴕ
|
96
|
-
'\u2d16' : 'ġ' # ⴖ
|
97
|
-
'\u2d17' : 'q' # ⴗ
|
98
|
-
'\u2d18' : 'š' # ⴘ
|
99
|
-
'\u2d19' : 'čʻ' # ⴙ
|
100
|
-
'\u2d1a' : 'cʻ' # ⴚ
|
101
|
-
'\u2d1b' : 'ż' # ⴛ
|
102
|
-
'\u2d1c' : 'c' # ⴜ
|
103
|
-
'\u2d1d' : 'č' # ⴝ
|
104
|
-
'\u2d1e' : 'x' # ⴞ
|
105
|
-
'\u2d1f' : 'j' # ⴟ
|
106
|
-
'\u2d20' : 'h' # ⴠ
|
107
|
-
'\u2d21' : 'ē' # ⴡ
|
108
|
-
'\u2d22' : 'y' # ⴢ
|
109
|
-
'\u2d23' : 'w' # ⴣ
|
110
|
-
'\u2d24' : 'x̣' # ⴤ
|
111
|
-
'\u2d25' : 'ō' # ⴥ
|