interscript 0.1.9 → 2.0.5
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/.gitignore +11 -0
- data/.rspec +3 -0
- data/Gemfile +29 -0
- data/LICENSE.adoc +31 -0
- data/README.md +3 -0
- data/Rakefile +53 -0
- data/bin/console +14 -0
- data/bin/interscript +5 -0
- data/bin/maps_analyze_staging +168 -0
- data/bin/maps_debug_compilers +58 -0
- data/bin/maps_debug_ordering +88 -0
- data/bin/maps_debug_ruby_compile +24 -0
- data/bin/maps_debug_step_by_step +44 -0
- data/bin/maps_optimize_order +112 -0
- data/bin/maps_v1_analyze_regexps +45 -0
- data/bin/maps_v1_to_v2 +426 -0
- data/bin/setup +8 -0
- data/exe/interscript +6 -0
- data/interscript.gemspec +31 -0
- data/lib/interscript.rb +80 -135
- data/lib/interscript/command.rb +5 -5
- data/lib/interscript/compiler.rb +22 -0
- data/lib/interscript/compiler/javascript.rb +292 -0
- data/lib/interscript/compiler/ruby.rb +262 -0
- data/lib/interscript/dsl.rb +67 -0
- data/lib/interscript/dsl/aliases.rb +23 -0
- data/lib/interscript/dsl/document.rb +46 -0
- data/lib/interscript/dsl/group.rb +45 -0
- data/lib/interscript/dsl/group/parallel.rb +6 -0
- data/lib/interscript/dsl/items.rb +89 -0
- data/lib/interscript/dsl/metadata.rb +26 -0
- data/lib/interscript/dsl/stage.rb +6 -0
- data/lib/interscript/dsl/symbol_mm.rb +11 -0
- data/lib/interscript/dsl/tests.rb +12 -0
- data/lib/interscript/interpreter.rb +251 -0
- data/lib/interscript/node.rb +25 -0
- data/lib/interscript/node/alias_def.rb +15 -0
- data/lib/interscript/node/dependency.rb +13 -0
- data/lib/interscript/node/document.rb +45 -0
- data/lib/interscript/node/group.rb +34 -0
- data/lib/interscript/node/group/parallel.rb +9 -0
- data/lib/interscript/node/group/sequential.rb +2 -0
- data/lib/interscript/node/item.rb +52 -0
- data/lib/interscript/node/item/alias.rb +42 -0
- data/lib/interscript/node/item/any.rb +61 -0
- data/lib/interscript/node/item/capture.rb +50 -0
- data/lib/interscript/node/item/group.rb +51 -0
- data/lib/interscript/node/item/repeat.rb +40 -0
- data/lib/interscript/node/item/stage.rb +23 -0
- data/lib/interscript/node/item/string.rb +51 -0
- data/lib/interscript/node/metadata.rb +18 -0
- data/lib/interscript/node/rule.rb +6 -0
- data/lib/interscript/node/rule/funcall.rb +18 -0
- data/lib/interscript/node/rule/run.rb +15 -0
- data/lib/interscript/node/rule/sub.rb +65 -0
- data/lib/interscript/node/stage.rb +19 -0
- data/lib/interscript/node/tests.rb +15 -0
- data/lib/interscript/stdlib.rb +211 -0
- data/lib/interscript/utils/regexp_converter.rb +283 -0
- data/lib/interscript/version.rb +1 -1
- data/requirements.txt +1 -0
- metadata +73 -458
- data/README.adoc +0 -296
- data/aliases.json +0 -1
- data/lib/g2pwrapper.py +0 -34
- data/lib/interscript/fs.rb +0 -96
- data/lib/interscript/mapping.rb +0 -144
- data/lib/interscript/opal.rb +0 -196
- data/lib/interscript/opal/entrypoint.rb +0 -20
- data/lib/interscript/opal/exports.rb +0 -11
- data/lib/interscript/opal/maps.js.erb +0 -8
- data/lib/model-7 +0 -0
- data/lib/tha-pt-b-7 +0 -0
- data/maps/acadsin-zho-Hani-Latn-2002.yaml +0 -38916
- data/maps/alalc-amh-Ethi-Latn-1997.yaml +0 -513
- data/maps/alalc-amh-Ethi-Latn-2011.yaml +0 -138
- data/maps/alalc-ara-Arab-Latn-1997.yaml +0 -1287
- data/maps/alalc-asm-Deva-Latn-1997.yaml +0 -259
- data/maps/alalc-asm-Deva-Latn-2012.yaml +0 -55
- data/maps/alalc-aze-Arab-Latn-1997.yaml +0 -376
- data/maps/alalc-aze-Cyrl-Latn-1997.yaml +0 -145
- data/maps/alalc-bel-Cyrl-Latn-1997.yaml +0 -129
- data/maps/alalc-ben-Beng-Latn-1997.yaml +0 -291
- data/maps/alalc-ben-Beng-Latn-2017.yaml +0 -130
- data/maps/alalc-bul-Cyrl-Latn-1997.yaml +0 -98
- data/maps/alalc-div-Thaa-Latn-1997.yaml +0 -211
- data/maps/alalc-ell-Grek-Latn-1997.yaml +0 -628
- data/maps/alalc-ell-Grek-Latn-2010.yaml +0 -626
- data/maps/alalc-guj-Gujr-Latn-1997.yaml +0 -266
- data/maps/alalc-guj-Gujr-Latn-2011.yaml +0 -64
- data/maps/alalc-hin-Deva-Latn-1997.yaml +0 -303
- data/maps/alalc-hin-Deva-Latn-2011.yaml +0 -65
- data/maps/alalc-kan-Kana-Latn-1997.yaml +0 -274
- data/maps/alalc-kan-Kana-Latn-2011.yaml +0 -63
- data/maps/alalc-kat-Geok-Latn-1997.yaml +0 -111
- data/maps/alalc-kat-Geor-Latn-1997.yaml +0 -150
- data/maps/alalc-kor-Hang-Latn-1997.yaml +0 -98
- data/maps/alalc-mal-Mlym-Latn-1997.yaml +0 -303
- data/maps/alalc-mal-Mlym-Latn-2012.yaml +0 -73
- data/maps/alalc-mar-Deva-Latn-1997.yaml +0 -189
- data/maps/alalc-mar-Deva-Latn-2011.yaml +0 -45
- data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +0 -114
- data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +0 -103
- data/maps/alalc-mon-Cyrl-Latn-1997.yaml +0 -220
- data/maps/alalc-ori-Orya-Latn-1997.yaml +0 -284
- data/maps/alalc-ori-Orya-Latn-2011.yaml +0 -67
- data/maps/alalc-pan-Guru-Latn-1997.yaml +0 -256
- data/maps/alalc-pan-Guru-Latn-2011.yaml +0 -78
- data/maps/alalc-per-Arab-Latn-1997.yaml +0 -375
- data/maps/alalc-pli-Deva-Latn-2012.yaml +0 -144
- data/maps/alalc-pra-Deva-Latn-2012.yaml +0 -47
- data/maps/alalc-rus-Cyrl-Latn-1997.yaml +0 -225
- data/maps/alalc-rus-Cyrl-Latn-2012.yaml +0 -162
- data/maps/alalc-san-Deva-Latn-2012.yaml +0 -241
- data/maps/alalc-sin-Sinh-Latn-1997.yaml +0 -292
- data/maps/alalc-sin-Sinh-Latn-2011.yaml +0 -71
- data/maps/alalc-srp-Cyrl-Latn-1997.yaml +0 -118
- data/maps/alalc-srp-Cyrl-Latn-2013.yaml +0 -135
- data/maps/alalc-tam-Taml-Latn-1997.yaml +0 -62
- data/maps/alalc-tam-Taml-Latn-2011.yaml +0 -58
- data/maps/alalc-tel-Telu-Latn-1997.yaml +0 -284
- data/maps/alalc-tel-Telu-Latn-2011.yaml +0 -64
- data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +0 -145
- data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +0 -16
- data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +0 -283
- data/maps/az-aze-Cyrl-Latn-1939.yaml +0 -105
- data/maps/az-aze-Cyrl-Latn-1958.yaml +0 -45
- data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +0 -174
- data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +0 -169
- data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +0 -292
- data/maps/bgn-kor-Hang-Latn-1943.yaml +0 -35
- data/maps/bgn-kor-Kore-Latn-1943.yaml +0 -31
- data/maps/bgna-bul-Cyrl-Latn-2006.yaml +0 -208
- data/maps/bgna-bul-Cyrl-Latn-2009.yaml +0 -208
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +0 -532
- data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +0 -598
- data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +0 -108
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +0 -111
- data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +0 -188
- data/maps/bgnpcgn-bal-Arab-Latn-2008.yaml +0 -329
- data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +0 -289
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +0 -119
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +0 -42
- data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +0 -184
- data/maps/bgnpcgn-div-Thaa-Latn-1988.yaml +0 -75
- data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +0 -705
- data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +0 -23
- data/maps/bgnpcgn-far-Latn-Latn-1964.yaml +0 -28
- data/maps/bgnpcgn-fas-Arab-Latn-1956.yaml +0 -96
- data/maps/bgnpcgn-isl-Latn-Latn-1964.yaml +0 -37
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +0 -257
- data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +0 -131
- data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +0 -42
- data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.yaml +0 -247
- data/maps/bgnpcgn-kir-Cyrl-Latn-1979.yaml +0 -218
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +0 -253
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +0 -48
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +0 -48
- data/maps/bgnpcgn-kur-Arab-Latn-2007.yaml +0 -249
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +0 -163
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +0 -190
- data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +0 -223
- data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +0 -230
- data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +0 -338
- data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +0 -673
- data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +0 -459
- data/maps/bgnpcgn-pus-Arab-Latn-1968.yaml +0 -377
- data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +0 -168
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +0 -318
- data/maps/bgnpcgn-srp-Cyrl-Latn-1962.yaml +0 -73
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +0 -170
- data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +0 -220
- data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +0 -240
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +0 -166
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +0 -119
- data/maps/bgnpcgn-urd-Arab-Latn-2007.yaml +0 -459
- data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +0 -127
- data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +0 -82
- data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +0 -7456
- data/maps/bis-asm-Beng-Latn-13194-1991.yaml +0 -159
- data/maps/bis-ben-Beng-Latn-13194-1991.yaml +0 -156
- data/maps/bis-dev-Deva-Latn-13194-1991.yaml +0 -184
- data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +0 -181
- data/maps/bis-kan-Kana-Latn-13194-1991.yaml +0 -173
- data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +0 -176
- data/maps/bis-ori-Orya-Latn-13194-1991.yaml +0 -175
- data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +0 -175
- data/maps/bis-tel-Telu-Latn-13194-1991.yaml +0 -170
- data/maps/bis-tml-Taml-Latn-13194-1991.yaml +0 -155
- data/maps/by-bel-Cyrl-Latn-1998.yaml +0 -172
- data/maps/by-bel-Cyrl-Latn-2007.yaml +0 -115
- data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +0 -899
- data/maps/din-hin-Deva-Latn-33904-2018.yaml +0 -100
- data/maps/din-kat-Geor-Latn-32707-2010.yaml +0 -145
- data/maps/din-mar-Deva-Latn-33904-2018.yaml +0 -84
- data/maps/din-nep-Deva-Latn-33904-2018.yaml +0 -119
- data/maps/din-pli-Deva-Latn-33904-2018.yaml +0 -75
- data/maps/din-pra-Deva-Latn-33904-2018.yaml +0 -63
- data/maps/din-san-Deva-Latn-33904-2018.yaml +0 -338
- data/maps/din-tam-Taml-Latn-33903-2016.yaml +0 -213
- data/maps/dos-nep-Deva-Latn-1997.yaml +0 -47
- data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +0 -684
- data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +0 -680
- data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +0 -19
- data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +0 -31
- data/maps/ggg-kat-Geor-Latn-2002.yaml +0 -92
- data/maps/gki-bel-Cyrl-Latn-1992.yaml +0 -33
- data/maps/gki-bel-Cyrl-Latn-2000.yaml +0 -201
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +0 -190
- data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +0 -157
- data/maps/hk-yue-Hani-Latn-1888.yaml +0 -38497
- data/maps/icao-bel-Cyrl-Latn-9303.yaml +0 -136
- data/maps/icao-bul-Cyrl-Latn-9303.yaml +0 -118
- data/maps/icao-fas-Arab-Latn-9303.yaml +0 -103
- data/maps/icao-heb-Hebr-Latn-9303.yaml +0 -151
- data/maps/icao-mkd-Cyrl-Latn-9303.yaml +0 -117
- data/maps/icao-rus-Cyrl-Latn-9303.yaml +0 -117
- data/maps/icao-srp-Cyrl-Latn-9303.yaml +0 -117
- data/maps/icao-ukr-Cyrl-Latn-9303.yaml +0 -119
- data/maps/iso-ara-Arab-Latn-233-1984.yaml +0 -323
- data/maps/iso-asm-Beng-Latn-15919-2001.yaml +0 -75
- data/maps/iso-ben-Beng-Latn-15919-2001.yaml +0 -175
- data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +0 -613
- data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +0 -44
- data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +0 -220
- data/maps/iso-hin-Deva-Latn-15919-2001.yaml +0 -87
- data/maps/iso-inc-Deva-Latn-15919-2001.yaml +0 -61
- data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +0 -66
- data/maps/iso-kan-Kana-Latn-15919-2001.yaml +0 -220
- data/maps/iso-kat-Geor-Latn-9984-1996.yaml +0 -145
- data/maps/iso-kor-Hang-Latn-1996-method1.yaml +0 -240
- data/maps/iso-kor-Hang-Latn-1996-method2.yaml +0 -226
- data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +0 -281
- data/maps/iso-mar-Deva-Latn-15919-2001.yaml +0 -75
- data/maps/iso-nep-Deva-Latn-15919-2001.yaml +0 -87
- data/maps/iso-ori-Orya-Latn-15919-2001.yaml +0 -193
- data/maps/iso-pan-Guru-Latn-15919-2001.yaml +0 -222
- data/maps/iso-pli-Beng-Latn-15919-2001.yaml +0 -73
- data/maps/iso-pli-Deva-Latn-15919-2001.yaml +0 -74
- data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +0 -219
- data/maps/iso-pli-Thai-Latn-15919-2001.yaml +0 -55
- data/maps/iso-pra-Deva-Latn-15919-2001.yaml +0 -59
- data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +0 -366
- data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +0 -271
- data/maps/iso-san-Deva-Latn-15919-2001.yaml +0 -220
- data/maps/iso-tam-Taml-Latn-15919-2001.yaml +0 -159
- data/maps/iso-tel-Telu-Latn-15919-2001.yaml +0 -220
- data/maps/iso-tha-Thai-Latn-11940-1998.yaml +0 -109
- data/maps/kp-kor-Hang-Latn-2002.yaml +0 -909
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +0 -44820
- data/maps/masm-mon-Cyrl-Latn-5217-2012.yaml +0 -163
- data/maps/masm-mon-Latn-Cyrl-5217-2012.yaml +0 -200
- data/maps/mext-jpn-Hrkt-Latn-1954.yaml +0 -411
- data/maps/moct-kor-Hang-Latn-2000.yaml +0 -807
- data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +0 -541
- data/maps/mv-div-Thaa-Latn-1987.yaml +0 -200
- data/maps/mvd-bel-Cyrl-Latn-2008.yaml +0 -225
- data/maps/mvd-bel-Cyrl-Latn-2010.yaml +0 -63
- data/maps/mvd-rus-Cyrl-Latn-2008.yaml +0 -109
- data/maps/mvd-rus-Cyrl-Latn-2010.yaml +0 -37
- data/maps/odni-ara-Arab-Latn-2004.yaml +0 -137
- data/maps/odni-ara-Arab-Latn-2015.yaml +0 -315
- data/maps/odni-aze-Cyrl-Latn-2015.yaml +0 -144
- data/maps/odni-bel-Cyrl-Latn-2015.yaml +0 -148
- data/maps/odni-bul-Cyrl-Latn-2005.yaml +0 -90
- data/maps/odni-bul-Cyrl-Latn-2015.yaml +0 -96
- data/maps/odni-che-Cyrl-Latn-2015.yaml +0 -169
- data/maps/odni-fas-Arab-Latn-2004.yaml +0 -276
- data/maps/odni-fas-Arab-Latn-2015.yaml +0 -406
- data/maps/odni-hin-Deva-Latn-2004.yaml +0 -182
- data/maps/odni-hin-Deva-Latn-2015.yaml +0 -258
- data/maps/odni-kat-Geor-Latn-2015.yaml +0 -87
- data/maps/odni-kaz-Cyrl-Latn-2015.yaml +0 -148
- data/maps/odni-kir-Cyrl-Latn-2015.yaml +0 -136
- data/maps/odni-kor-Hang-Latn-2015.yaml +0 -375
- data/maps/odni-mkd-Cyrl-Latn-2005.yaml +0 -21
- data/maps/odni-mkd-Cyrl-Latn-2015.yaml +0 -122
- data/maps/odni-prs-Arab-Latn-2004.yaml +0 -123
- data/maps/odni-prs-Arab-Latn-2015.yaml +0 -228
- data/maps/odni-rus-Cyrl-Latn-2015.yaml +0 -77
- data/maps/odni-srp-Cyrl-Latn-2005.yaml +0 -36
- data/maps/odni-srp-Cyrl-Latn-2015.yaml +0 -129
- data/maps/odni-tat-Cyrl-Latn-2015.yaml +0 -142
- data/maps/odni-tgk-Cyrl-Latn-2015.yaml +0 -148
- data/maps/odni-tuk-Cyrl-Latn-2015.yaml +0 -170
- data/maps/odni-uig-Cyrl-Latn-2015.yaml +0 -138
- data/maps/odni-ukr-Cyrl-Latn-2015.yaml +0 -161
- data/maps/odni-urd-Arab-Latn-2015.yaml +0 -221
- data/maps/odni-uzb-Cyrl-Latn-2015.yaml +0 -166
- data/maps/royin-tha-Thai-Latn-1939-generic.yaml +0 -90
- data/maps/royin-tha-Thai-Latn-1968.yaml +0 -183
- data/maps/royin-tha-Thai-Latn-1999-chained.yaml +0 -180
- data/maps/royin-tha-Thai-Latn-1999.yaml +0 -80
- data/maps/sac-zho-Hans-Latn-1979.yaml +0 -24763
- data/maps/sasm-mon-Mong-Latn-general-1978.yaml +0 -389
- data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +0 -354
- data/maps/ses-ara-Arab-Latn-1930.yaml +0 -283
- data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +0 -222
- data/maps/ua-ukr-Cyrl-Latn-1996.yaml +0 -197
- data/maps/ua-ukr-Cyrl-Latn-2007.yaml +0 -75
- data/maps/ua-ukr-Cyrl-Latn-2010.yaml +0 -192
- data/maps/un-amh-Ethi-Latn-2016.yaml +0 -602
- data/maps/un-ara-Arab-Latn-1971.yaml +0 -139
- data/maps/un-ara-Arab-Latn-1972.yaml +0 -159
- data/maps/un-ara-Arab-Latn-2017.yaml +0 -420
- data/maps/un-asm-Beng-Latn-1972.yaml +0 -223
- data/maps/un-bel-Cyrl-Latn-2007.yaml +0 -114
- data/maps/un-ben-Beng-Latn-2016.yaml +0 -534
- data/maps/un-ell-Grek-Latn-1987-phonetic.yaml +0 -780
- data/maps/un-ell-Grek-Latn-1987-tl.yaml +0 -31
- data/maps/un-ell-Grek-Latn-1987-ts.yaml +0 -19
- data/maps/un-guj-Gujr-Latn-1972.yaml +0 -229
- data/maps/un-hin-Deva-Latn-2016.yaml +0 -316
- data/maps/un-kan-Kana-Latn-2016.yaml +0 -254
- data/maps/un-mal-Mlym-Latn-1972.yaml +0 -251
- data/maps/un-mar-Deva-Latn-2016.yaml +0 -102
- data/maps/un-mon-Mong-Latn-general-2013.yaml +0 -264
- data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +0 -264
- data/maps/un-nep-Deva-Latn-1972.yaml +0 -269
- data/maps/un-nep-Deva-Latn-2013.yaml +0 -74
- data/maps/un-ori-Orya-Latn-1972.yaml +0 -247
- data/maps/un-pan-Guru-Latn-1972.yaml +0 -402
- data/maps/un-prs-Arab-Latn-1967.yaml +0 -236
- data/maps/un-rus-Cyrl-Latn-1987.yaml +0 -166
- data/maps/un-tam-Taml-Latn-1972.yaml +0 -194
- data/maps/un-tel-Telu-Latn-1972.yaml +0 -270
- data/maps/un-ukr-Cyrl-Latn-1998.yaml +0 -53
- data/maps/un-ukr-Cyrl-Latn-2012.yaml +0 -162
- data/maps/un-urd-Arab-Latn-1972.yaml +0 -405
- data/maps/var-amh-Ethi-Latn-eae-2003.yaml +0 -466
- data/maps/var-gez-Ethi-Latn-eae-2003.yaml +0 -76
- data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +0 -221
- data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +0 -406
- data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +0 -386
- data/maps/var-kor-Hang-Hang-jamo.yaml +0 -11193
- data/maps/var-kor-Hang-Latn-mr-1939.yaml +0 -1054
- data/maps/var-kor-Kore-Hang-2013.yaml +0 -59754
- data/maps/var-kor-Kore-Latn-mr-1939.yaml +0 -36
- data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +0 -43
- data/maps/var-mon-Mong-Latn-1930.yaml +0 -102
- data/maps/var-mon-Mong-Latn-lessing.yaml +0 -272
- data/maps/var-mon-Mong-Latn-vpmc.yaml +0 -274
- data/maps/var-pra-Deva-Latn-iast-1912.yaml +0 -30
- data/maps/var-san-Deva-Latn-iast-1912.yaml +0 -149
- data/maps/var-tha-Thai-Thai-phonemic.yaml +0 -59
- data/maps/var-tha-Thai-Zsym-ipa.yaml +0 -301
- data/maps/var-zho-Hani-Latn-wd-1979.yaml +0 -38912
- data/spec/interscript/filenames_spec.rb +0 -21
- data/spec/interscript/mapping_spec.rb +0 -42
- data/spec/interscript_spec.rb +0 -37
- data/spec/spec_helper.rb +0 -3
@@ -1,254 +0,0 @@
|
|
1
|
-
---
|
2
|
-
authority_id: ungegn
|
3
|
-
id: 2016
|
4
|
-
language: iso-639-2:kan
|
5
|
-
source_script: Kana
|
6
|
-
destination_script: Latn
|
7
|
-
name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Kannada Romanization, 1972
|
8
|
-
url: https://www.eki.ee/wgrs/rom1_kn.pdf
|
9
|
-
creation_date: 1972
|
10
|
-
confirmation_date: 2016
|
11
|
-
description: |
|
12
|
-
The United Nations recommended system was approved in 1972 (II/11) and amended in 1977
|
13
|
-
(III/12), based on a report prepared by D. N. Sharma. The tables and their corrections were
|
14
|
-
published in volume II of the conference reports.
|
15
|
-
|
16
|
-
There is no evidence of the use of the system either in India or in international cartographic
|
17
|
-
products.
|
18
|
-
|
19
|
-
Kannada uses an alphasyllabic script whereby each character represents a syllable rather than
|
20
|
-
one sound. Vowels and diphthongs are marked in two ways: as independent characters (used
|
21
|
-
syllable-initially) and in an abbreviated form, to denote vowels after consonants. The
|
22
|
-
romanization table is unambiguous. The system is mostly reversible but there may exist some
|
23
|
-
ambiguities in the romanization of vowels (independent vs. abbreviated characters) and
|
24
|
-
consonants (combinations with subscript consonants vs. character sequences).
|
25
|
-
|
26
|
-
notes:
|
27
|
-
- |
|
28
|
-
While most consonants have a diacritic in the upper right corner of the character (like ಕ),
|
29
|
-
some do not, e.g. ಖ kha, ಜ ja, ನ na, ಬ ba, ಲ la.
|
30
|
-
- |
|
31
|
-
Combinations with r as the first component are written by adding a special symbol after the
|
32
|
-
second consonant: ರ್ಗ rga.
|
33
|
-
|
34
|
-
|
35
|
-
tests:
|
36
|
-
- source: "ಕರ್ಣಾಟಕ"
|
37
|
-
expected: "karṇāṭaka"
|
38
|
-
- source: "ಬೆಂಗಳೂರು"
|
39
|
-
expected: "bĕṁgaḷūru"
|
40
|
-
- source: "ಮಹಾರಾಷ್ಟ್ರದ ಯಾವುದೇ ಪ್ರಕರಣದ ತನಿಖೆಗೆ ಇನ್ನು ಸಿಬಿಐ ಪಡೆಯಬೇಕು ಅನುಮತಿ"
|
41
|
-
expected: "mahārāṣhṭrada yāvude prakaraṇada tanikhĕgĕ innu sibiai paḍĕyabeku anumati"
|
42
|
-
- source: "ಹರಕು ಬಾಯಿ: ಈಶ್ವರಪ್ಪಗೆ ಶಾಸಕ ಯತ್ನಾಳ ತಿರುಗೇಟು"
|
43
|
-
expected: "haraku bāyi: īshvarappagĕ shāsaka yatnāḷa tirugeṭu"
|
44
|
-
- source: "ಹಾಥರಸ್ ಪ್ರಕರಣ: ೨೯ರಂದು ರಾಷ್ಟ್ರವ್ಯಾಪಿ ಪ್ರತಿಭಟನೆಗೆ ಮಹಿಳಾ ಸಂಘಟನೆಗಳ ಕರೆ"
|
45
|
-
expected: "hātharas prakaraṇa: 29raṁdu rāṣhṭravyāpi pratibhaṭanĕgĕ mahiḷā saṁghaṭanĕgaḷa karĕ"
|
46
|
-
- source: "ಪೊಲೀಸ್ ಮಕ್ಕಳ ಶಾಲೆ ಮುಚ್ಚುವ ಯತ್ನಕ್ಕೆ ಹೊರಟ್ಟಿ ತೀವ್ರ ವಿರೋಧ"
|
47
|
-
expected: "pŏlīs makkaḷa shālĕ muchchuva yatnakkĕ hŏraṭṭi tīvra virodha"
|
48
|
-
- source: "ಅಮೆರಿಕ ಅಧ್ಯಕ್ಷೀಯ ಚುನಾವಣೆ: ಟ್ರಂಪ್–ಬೈಡನ್ ಅಂತಿಮ ಮುಖಾಮುಖಿಗೆ ವೇದಿಕೆ ಸಿದ್ಧ"
|
49
|
-
expected: "amĕrika adhyakṣhīya chunāvaṇĕ: ṭraṁp–baiḍan aṁtima mukhāmukhigĕ vedikĕ siddha"
|
50
|
-
- source: "ಅಂಜನಾದ್ರಿ ಆಂಜನೇಯನ ದರ್ಶನ ಪಡೆದ ಪವರ್ ಸ್ಟಾರ್ ಪುನೀತ್ ರಾಜ್ ಕುಮಾರ್"
|
51
|
-
expected: "aṁjanādri āṁjaneyana darshana paḍĕda pavar sṭār punīt rāj kumār"
|
52
|
-
- source: "ಇನ್ನು ಹಿಂದೂ ದೇವಸ್ಥಾನದ ಧಾರ್ಮಿಕ ಕಾರ್ಯದಲ್ಲಿ ಭಾಗಿಯಾಗಿದ್ದಕ್ಕೆ ಮೋಯಿದ್ದೀನ್ ಬಾವಾಗೆ ಬೆದರಿಕೆ ಒಡ್ಡಲಾಗಿದೆ"
|
53
|
-
expected: "innu hiṁdū devasthānada dhārmika kāryadalli bhāgiyāgiddakkĕ moyiddīn bāvāgĕ bĕdarikĕ ŏḍḍalāgidĕ"
|
54
|
-
- source: "ಇದು ಮೋದಿ ದೇಶ - ದನ ತಿಂದು ಹೋದ್ರೆ ಹುಷಾರ್ : ದೇಗುಲಕ್ಕೆ ಹೋಗಿದ್ದ ಬಾವಾಗೆ ಬೆದರಿಕೆ"
|
55
|
-
expected: "idu modi desha - dana tiṁdu hodrĕ huṣhār : degulakkĕ hogidda bāvāgĕ bĕdarikĕ"
|
56
|
-
|
57
|
-
map:
|
58
|
-
|
59
|
-
rules:
|
60
|
-
# to cover diacritic and vowel-less consonants
|
61
|
-
- pattern: ([ಕ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
62
|
-
result: 'k'
|
63
|
-
- pattern: ([ಖ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
64
|
-
result: 'kh'
|
65
|
-
- pattern: ([ಗ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
66
|
-
result: 'g'
|
67
|
-
- pattern: ([ಘ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
68
|
-
result: 'gh'
|
69
|
-
- pattern: ([ಙ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
70
|
-
result: 'ṅ'
|
71
|
-
- pattern: ([ಚ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
72
|
-
result: 'ch'
|
73
|
-
- pattern: ([ಛ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
74
|
-
result: 'chh'
|
75
|
-
- pattern: ([ಜ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
76
|
-
result: 'j'
|
77
|
-
- pattern: ([ಝ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
78
|
-
result: 'jh'
|
79
|
-
- pattern: ([ಞ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
80
|
-
result: 'ñ'
|
81
|
-
- pattern: ([ಟ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
82
|
-
result: 'ṭ'
|
83
|
-
- pattern: ([ಠ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
84
|
-
result: 'ṭh'
|
85
|
-
- pattern: ([ಡ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
86
|
-
result: 'ḍ'
|
87
|
-
- pattern: ([ಢ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
88
|
-
result: 'ḍh'
|
89
|
-
- pattern: ([ಣ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
90
|
-
result: 'ṇ'
|
91
|
-
- pattern: ([ತ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
92
|
-
result: 't'
|
93
|
-
- pattern: ([ಥ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
94
|
-
result: 'th'
|
95
|
-
- pattern: ([ದ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
96
|
-
result: 'd'
|
97
|
-
- pattern: ([ಧ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
98
|
-
result: 'dh'
|
99
|
-
- pattern: ([ನ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
100
|
-
result: 'n'
|
101
|
-
- pattern: ([ಪ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
102
|
-
result: 'p'
|
103
|
-
- pattern: ([ಫ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
104
|
-
result: 'ph'
|
105
|
-
- pattern: ([ಬ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
106
|
-
result: 'b'
|
107
|
-
- pattern: ([ಭ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
108
|
-
result: 'bh'
|
109
|
-
- pattern: ([ಮ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
110
|
-
result: 'm'
|
111
|
-
- pattern: ([ಯ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
112
|
-
result: 'y'
|
113
|
-
- pattern: ([ರ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
114
|
-
result: 'r'
|
115
|
-
- pattern: ([ಲ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
116
|
-
result: 'l'
|
117
|
-
- pattern: ([ಳ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
118
|
-
result: 'ḷ'
|
119
|
-
- pattern: ([ವ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
120
|
-
result: 'v'
|
121
|
-
- pattern: ([ಶ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
122
|
-
result: 'sh'
|
123
|
-
- pattern: ([ಷ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
124
|
-
result: 'ṣh'
|
125
|
-
- pattern: ([ಸ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
126
|
-
result: 's'
|
127
|
-
- pattern: ([ಹ]=?)(?=[\u0cbe\u0cbf\u0cc0\u0cc1\u0cc2\u0cc3\u0cc6\u0cc7\u0cc8\u0cca\u0ccb\u0ccc\u0ccd])
|
128
|
-
result: 'h'
|
129
|
-
|
130
|
-
characters:
|
131
|
-
'ಅ': 'a'
|
132
|
-
'ಆ': 'ā'
|
133
|
-
'ಇ': 'i'
|
134
|
-
'ಈ': 'ī'
|
135
|
-
'ಉ': 'u'
|
136
|
-
'ಊ': 'ū'
|
137
|
-
'ಋ': 'ṛ'
|
138
|
-
|
139
|
-
'ಎ': 'ĕ'
|
140
|
-
'ಏ': 'e'
|
141
|
-
'ಐ': 'ai'
|
142
|
-
|
143
|
-
'ಒ': 'ŏ'
|
144
|
-
'ಓ': 'o'
|
145
|
-
'ಔ': 'au'
|
146
|
-
|
147
|
-
# Gutturals
|
148
|
-
'ಕ': 'ka'
|
149
|
-
'ಖ': 'kha'
|
150
|
-
'ಗ': 'ga'
|
151
|
-
'ಘ': 'gha'
|
152
|
-
'ಙ': 'ṅa'
|
153
|
-
|
154
|
-
# Palatals
|
155
|
-
'ಚ': 'cha'
|
156
|
-
'ಛ': 'chha'
|
157
|
-
'ಜ': 'ja'
|
158
|
-
'ಝ': 'jha'
|
159
|
-
'ಞ': 'ña'
|
160
|
-
|
161
|
-
# Cerebrals
|
162
|
-
'ಟ': 'ṭa'
|
163
|
-
'ಠ': 'ṭha'
|
164
|
-
'ಡ': 'ḍa'
|
165
|
-
'ಢ': 'ḍha'
|
166
|
-
'ಣ': 'ṇa'
|
167
|
-
|
168
|
-
# Dentals
|
169
|
-
'ತ': 'ta'
|
170
|
-
'ಥ': 'tha'
|
171
|
-
'ದ': 'da'
|
172
|
-
'ಧ': 'dha'
|
173
|
-
'ನ': 'na'
|
174
|
-
|
175
|
-
# Labials
|
176
|
-
'ಪ': 'pa'
|
177
|
-
'ಫ': 'pha'
|
178
|
-
'ಬ': 'ba'
|
179
|
-
'ಭ': 'bha'
|
180
|
-
'ಮ': 'ma'
|
181
|
-
|
182
|
-
# Semivowels
|
183
|
-
'ಯ': 'ya'
|
184
|
-
'ರ': 'ra'
|
185
|
-
'ಲ': 'la'
|
186
|
-
'ಳ': 'ḷa'
|
187
|
-
|
188
|
-
|
189
|
-
'ವ': 'va'
|
190
|
-
|
191
|
-
# Sibilants
|
192
|
-
'ಶ': 'sha'
|
193
|
-
'ಷ': 'ṣha'
|
194
|
-
'ಸ': 'sa'
|
195
|
-
|
196
|
-
|
197
|
-
# Aspirate
|
198
|
-
'ಹ': 'ha'
|
199
|
-
|
200
|
-
|
201
|
-
# Bisarga
|
202
|
-
'ಃ': 'ḥ'
|
203
|
-
|
204
|
-
# Anusvāra
|
205
|
-
'ಂ': 'ṁ'
|
206
|
-
|
207
|
-
'\u0cbc': '' #nukta
|
208
|
-
|
209
|
-
# Medials # Needed for connecting consonants
|
210
|
-
'ಾ': "ā"
|
211
|
-
'ಿ': "i"
|
212
|
-
'ೀ': "ī"
|
213
|
-
'ು': "u"
|
214
|
-
'ೂ': "ū"
|
215
|
-
'ೃ': "ṛ"
|
216
|
-
|
217
|
-
|
218
|
-
'ೆ': "ĕ"
|
219
|
-
'ೇ': "e"
|
220
|
-
'ೈ': "ai"
|
221
|
-
|
222
|
-
|
223
|
-
'ೊ': 'ŏ'
|
224
|
-
'ೋ': 'o'
|
225
|
-
'ೌ': 'au'
|
226
|
-
|
227
|
-
|
228
|
-
'्': ''
|
229
|
-
'़': ''
|
230
|
-
'್': '' # used for pronunciation without vowel
|
231
|
-
"": '' # no need for zero with joiner
|
232
|
-
"": '' # no need for zero with non joiner
|
233
|
-
|
234
|
-
|
235
|
-
|
236
|
-
# Digits
|
237
|
-
|
238
|
-
'೦': '0'
|
239
|
-
'೧': '1'
|
240
|
-
'೨': '2'
|
241
|
-
'೩': '3'
|
242
|
-
'೪': '4'
|
243
|
-
'೫': '5'
|
244
|
-
'೬': '6'
|
245
|
-
'೭': '7'
|
246
|
-
'೮': '8'
|
247
|
-
'೯': '9'
|
248
|
-
|
249
|
-
|
250
|
-
|
251
|
-
|
252
|
-
|
253
|
-
|
254
|
-
|
@@ -1,251 +0,0 @@
|
|
1
|
-
---
|
2
|
-
authority_id: un
|
3
|
-
id: 1972
|
4
|
-
language: iso-639-2:mal
|
5
|
-
source_script: Mlym
|
6
|
-
destination_script: Latn
|
7
|
-
name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES --Malayalam Romanization Version 4.0
|
8
|
-
url: https://www.eki.ee/wgrs/rom1_ml.htm
|
9
|
-
creation_date: 1972
|
10
|
-
confirmation_date: 2016
|
11
|
-
description: |
|
12
|
-
The United Nations recommended system was approved in 1972 (II/11) and amended in 1977 (III/12),
|
13
|
-
based on a report prepared by D. N. Sharma. The tables and their corrections were published in
|
14
|
-
volume II of the conference reports.
|
15
|
-
|
16
|
-
There is no evidence of the use of the system either in India or in international cartographic products.
|
17
|
-
|
18
|
-
Malayalam (Malayāḷam) uses an alphasyllabic script whereby each character represents a syllable rather
|
19
|
-
than one sound. Vowels and diphthongs are marked in two ways: as independent characters (used syllable-initially)
|
20
|
-
and in an abbreviated form, to denote vowels after consonants. The romanization table is unambiguous but now
|
21
|
-
outdated because since the 1970's a new orthography has been introduced and the use of many character
|
22
|
-
combinations and ligatures has been simplified. Nevertheless the user of the romanization table would have to
|
23
|
-
recognize many ligatures not given in the original table. The system is mostly reversible but there exist some
|
24
|
-
ambiguities in the romanization of vowels (independent vs. abbreviated characters) and
|
25
|
-
consonants (ligatures vs. character sequences), particularly in the case of older orthography.
|
26
|
-
|
27
|
-
|
28
|
-
notes:
|
29
|
-
- |
|
30
|
-
ടു For traditional script forms ഖു khu, മു mu, etc., exceptionally കു ku (ക്കു kku, ങ്കു ṅku), ഗു gu, ഛു chhu, ജു ju, ണു ṇu, തു tu, നു nu (ന്നു nnu), ഭു bhu, രു ru, ശു shu, ഹു hu
|
31
|
-
- |
|
32
|
-
ടൂ For traditional script forms ഖൂ khū, മൂ mū, etc., exceptionally കൂ kū, ഗൂ gū, ഛൂ chhū, ജൂ jū, ണൂ ṇū, തൂ tū, നൂ nū, ഭൂ bhū, രൂ rū, ശൂ shū, ഹൂ hū
|
33
|
-
- |
|
34
|
-
ടൃ Traditionally written in conjunction with the consonant character: കൃ kṛ.
|
35
|
-
- |
|
36
|
-
ടൗ In the older spelling: ൌ.
|
37
|
-
- |
|
38
|
-
ട് Indicates absence of the inherent short [a] vowel, e.g. ക് k, സ് s. Special, so-called chillu-forms of consonants with that symbol: ണ് ṇ, ന് n, ര് r, ല് l, ള് ḷ.
|
39
|
-
- |
|
40
|
-
റ Special ligature: റ്റ ṭ̈.
|
41
|
-
|
42
|
-
tests:
|
43
|
-
- source: "ചൈനയ്ക്കെതിരെ ലഡാക്കിൽ സദാസജ്ജം; യുഎസിൽനിന്ന് ൭൨,൫൦൦ സിഗ്–൧൬ റൈഫിൾ"
|
44
|
-
expected: "chainaykkĕtirĕ laḍākkil sadāsajjaṃ; yuĕsilninn 72,500 sig–16 ṟaiphiḷ"
|
45
|
-
- source: "സർഗഭൂമിക’യ്ക്കില്ല; ലളിതച്ചേച്ചി അങ്ങനെ പറഞ്ഞിട്ടുണ്ടാവില്ല: ആർഎൽവി രാമകൃഷ്ണൻ"
|
46
|
-
expected: "sargabhūmika’ykkilla; laḷitachchechchi aṅṅanĕ paṟaññiṭṭuṇṭāvilla: ārĕlvi rāmakṛṣhṇan"
|
47
|
-
- source: "സ്വർണക്കടത്ത്: ഫൈസൽ ഫരീദും റബിന്സും ദുബായിൽ അറസ്റ്റിലായെന്ന് എന്ഐഎ"
|
48
|
-
expected: "svarṇakkaṭatt: phaisal pharīduṃ ṟabinsuṃ dubāyil aṟasṟṟilāyĕnn ĕnaiĕ"
|
49
|
-
- source: "വരുമോ ചൈനയുടെ വാക്സീൻ?; ആഗോള ഉപയോഗത്തിന് ഡബ്ല്യുഎച്ച്ഒയുമായി ചർച്ച"
|
50
|
-
expected: "varumo chainayuṭĕ vāksīn?; āgoḷa upayogattin ḍablyuĕchchŏyumāyi charchcha"
|
51
|
-
- source: "കുട്ടികളുടെ മാനസിക പിരിമുറുക്കം മാറ്റാൻ പരിശീലനം; ക്ലാസുമായി പോക്സോ പ്രതി"
|
52
|
-
expected: "kuṭṭikaḷuṭĕ mānasika pirimuṟukkaṃ māṟṟān parishīlanaṃ; klāsumāyi pokso prati"
|
53
|
-
- source: "ആദ്യം അമിത് ഷാ, ഇപ്പോൾ മോദി; ബിജെപിയെ പുണരാൻ ജഗൻ; ആന്ധ്രയിലെ കരുനീക്കങ്ങൾ"
|
54
|
-
expected: "ādyaṃ amit ṣhā, ippoḷ modi; bijĕpiyĕ puṇarān jagan; āndhrayilĕ karunīkkaṅṅaḷ"
|
55
|
-
- source: "ലഹരിമരുന്ന് കേസ്: ബിനീഷ് കോടിയേരിയെ ഇഡി 6 മണിക്കൂർ ചോദ്യം ചെയ്തു"
|
56
|
-
expected: "laharimarunn kes: binīṣh koṭiyeriyĕ iḍi 6 maṇikkūr chodyaṃ chĕytu"
|
57
|
-
- source: "ഈന്തപ്പഴം വിതരണം ചെയ്തത് ശിവശങ്കര് പറഞ്ഞതു പ്രകാരം: ടി.വി അനുപമയുടെ മൊഴി"
|
58
|
-
expected: "īntappaḻaṃ vitaraṇaṃ chĕytat shivashaṅkar paṟaññatu prakāraṃ: ṭi.vi anupamayuṭĕ mŏḻi"
|
59
|
-
- source: "൫൦൦൦ മണിക്കൂർ കാത്തിരിക്കാൻ തയാറെന്ന് രാഹുൽ: ഒടുവിൽ വഴങ്ങി ഹരിയാന"
|
60
|
-
expected: "5000 maṇikkūr kāttirikkān tayāṟĕnn rāhul: ŏṭuvil vaḻaṅṅi hariyāna"
|
61
|
-
- source: "കാരണം ഷോര്ട്ട്സര്ക്യൂട്ടല്ല; കത്തിയത് ഫയല് മാത്രം, സാനിറ്റൈസര് ഉള്പ്പെടെ കത്തിയില്ല"
|
62
|
-
expected: "kāraṇaṃ ṣhorṭṭsarkyūṭṭalla; kattiyat phayal mātraṃ, sāniṟṟaisar uḷppĕṭĕ kattiyilla"
|
63
|
-
- source: "വിമൺ സയൻറിസ്റ്റ്സ് സ്കീം"
|
64
|
-
expected: "vimaṇ sayanṟisṟṟs skīṃ"
|
65
|
-
|
66
|
-
map:
|
67
|
-
|
68
|
-
rules:
|
69
|
-
- pattern: ([ക]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
70
|
-
result: 'k'
|
71
|
-
- pattern: ([ഖ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
72
|
-
result: 'kh'
|
73
|
-
- pattern: ([ഗ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
74
|
-
result: 'g'
|
75
|
-
- pattern: ([ഘ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
76
|
-
result: 'gh'
|
77
|
-
- pattern: ([ങ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
78
|
-
result: 'ṅ'
|
79
|
-
- pattern: ([ച]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
80
|
-
result: 'ch'
|
81
|
-
- pattern: ([ഛ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
82
|
-
result: 'chh'
|
83
|
-
- pattern: ([ജ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
84
|
-
result: 'j'
|
85
|
-
- pattern: ([ഝ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
86
|
-
result: 'jh'
|
87
|
-
- pattern: ([ഞ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
88
|
-
result: 'ñ'
|
89
|
-
- pattern: ([ട]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
90
|
-
result: 'ṭ'
|
91
|
-
- pattern: ([ഠ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
92
|
-
result: 'ṭh'
|
93
|
-
- pattern: ([ഡ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
94
|
-
result: 'ḍ'
|
95
|
-
- pattern: ([ഢ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
96
|
-
result: 'ḍh'
|
97
|
-
- pattern: ([ണ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
98
|
-
result: 'ṇ'
|
99
|
-
- pattern: ([ത]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
100
|
-
result: 't'
|
101
|
-
- pattern: ([ഥ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
102
|
-
result: 'th'
|
103
|
-
- pattern: ([ദ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
104
|
-
result: 'd'
|
105
|
-
- pattern: ([ധ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
106
|
-
result: 'dh'
|
107
|
-
- pattern: ([ന]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
108
|
-
result: 'n'
|
109
|
-
- pattern: ([പ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
110
|
-
result: 'p'
|
111
|
-
- pattern: ([ഫ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
112
|
-
result: 'ph'
|
113
|
-
- pattern: ([ബ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
114
|
-
result: 'b'
|
115
|
-
- pattern: ([ഭ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
116
|
-
result: 'bh'
|
117
|
-
- pattern: ([മ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
118
|
-
result: 'm'
|
119
|
-
- pattern: ([യ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
120
|
-
result: 'y'
|
121
|
-
- pattern: ([ര]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
122
|
-
result: 'r'
|
123
|
-
- pattern: ([ല]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
124
|
-
result: 'l'
|
125
|
-
- pattern: ([വ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
126
|
-
result: 'v'
|
127
|
-
- pattern: ([ശ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
128
|
-
result: 'sh'
|
129
|
-
- pattern: ([ഷ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
130
|
-
result: 'ṣh'
|
131
|
-
- pattern: ([സ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
132
|
-
result: 's'
|
133
|
-
- pattern: ([ഹ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
134
|
-
result: 'h'
|
135
|
-
- pattern: ([ള]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
136
|
-
result: 'ḷ'
|
137
|
-
- pattern: ([ഴ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
138
|
-
result: 'ḻ'
|
139
|
-
- pattern: ([റ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
140
|
-
result: 'ṟ'
|
141
|
-
- pattern: ([ക്ഷ]=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d43\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0d4d])
|
142
|
-
result: 'kṣh'
|
143
|
-
|
144
|
-
characters:
|
145
|
-
# I. Independent vowel characters
|
146
|
-
'അ': 'a'
|
147
|
-
'ആ': 'ā'
|
148
|
-
'ഇ': 'i'
|
149
|
-
'ഈ': 'ī'
|
150
|
-
'ഉ': 'u'
|
151
|
-
'ഊ': 'ū'
|
152
|
-
'ഋ': "ṛ"
|
153
|
-
'എ': 'ĕ'
|
154
|
-
'ഏ': 'e'
|
155
|
-
'ഐ': 'ai'
|
156
|
-
'ഒ': 'ŏ'
|
157
|
-
'ഓ': 'o'
|
158
|
-
'ഔ': 'au'
|
159
|
-
|
160
|
-
# II. Abbreviated vowel characters
|
161
|
-
'ാ': 'ā'
|
162
|
-
'ി': 'i'
|
163
|
-
'ീ': 'ī'
|
164
|
-
'ു': 'u'
|
165
|
-
'ൂ': 'ū'
|
166
|
-
'ൃ': "ṛ"
|
167
|
-
'െ': "ĕ"
|
168
|
-
'േ': "e"
|
169
|
-
'ൈ': "ai"
|
170
|
-
'ൊ': 'ŏ'
|
171
|
-
'ോ': 'o'
|
172
|
-
'ൌ': 'au'
|
173
|
-
|
174
|
-
# III. Other symbols
|
175
|
-
'ഃ': 'ḥ'
|
176
|
-
'ം': 'ṃ'
|
177
|
-
'്': ''
|
178
|
-
|
179
|
-
# IV. Consonant characters
|
180
|
-
'ക': 'ka'
|
181
|
-
'ഖ': 'kha'
|
182
|
-
'ഗ': 'ga'
|
183
|
-
'ഘ': 'gha'
|
184
|
-
'ങ': 'ṅa'
|
185
|
-
'ച': 'cha'
|
186
|
-
'ഛ': 'chha'
|
187
|
-
'ജ': 'ja'
|
188
|
-
'ഝ': 'jha'
|
189
|
-
'ഞ': 'ña'
|
190
|
-
'ട': 'ṭa'
|
191
|
-
'ഠ': 'ṭha'
|
192
|
-
'ഡ': 'ḍa'
|
193
|
-
'ഢ': 'ḍha'
|
194
|
-
'ണ': 'ṇa'
|
195
|
-
'ത': 'ta'
|
196
|
-
'ഥ': 'tha'
|
197
|
-
'ദ': 'da'
|
198
|
-
'ധ': 'dha'
|
199
|
-
'ന': 'na'
|
200
|
-
'പ': 'pa'
|
201
|
-
'ഫ': 'pha'
|
202
|
-
'ബ': 'ba'
|
203
|
-
'ഭ': 'bha'
|
204
|
-
'മ': 'ma'
|
205
|
-
'യ': 'ya'
|
206
|
-
'ര': 'ra'
|
207
|
-
'ല': 'la'
|
208
|
-
'വ': 'va'
|
209
|
-
'ശ': 'sha'
|
210
|
-
'ഷ': 'ṣha'
|
211
|
-
'സ': 'sa'
|
212
|
-
'ഹ': 'ha'
|
213
|
-
'ക്ഷ': 'kṣha'
|
214
|
-
'ള': 'ḷa'
|
215
|
-
'ഴ': 'ḻa'
|
216
|
-
'റ': 'ṟa'
|
217
|
-
'റ്റ': 'ṭ̈'
|
218
|
-
|
219
|
-
|
220
|
-
'्': ''
|
221
|
-
'़': ''
|
222
|
-
'ൗ': ''
|
223
|
-
"": '' # no need for zero with joiner
|
224
|
-
"": '' # no need for zero with non joiner
|
225
|
-
|
226
|
-
|
227
|
-
# numbers
|
228
|
-
'൦': '0'
|
229
|
-
'൧': '1'
|
230
|
-
'൨': '2'
|
231
|
-
'൩': '3'
|
232
|
-
'൪': '4'
|
233
|
-
'൫': '5'
|
234
|
-
'൬': '6'
|
235
|
-
'൭': '7'
|
236
|
-
'൮': '8'
|
237
|
-
'൯': '9'
|
238
|
-
'൰': '10'
|
239
|
-
'൱': '100'
|
240
|
-
'൲': '1000'
|
241
|
-
|
242
|
-
|
243
|
-
# chillu-forms of consonants note 5
|
244
|
-
'ൿ': 'k'
|
245
|
-
'ൺ': 'ṇ'
|
246
|
-
'ൻ': 'n'
|
247
|
-
'ൽ': 'l'
|
248
|
-
'ൾ': 'ḷ'
|
249
|
-
'ർ': 'r'
|
250
|
-
'സ്': 's'
|
251
|
-
|