interscript 0.1.9 → 2.0.5
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/.gitignore +11 -0
- data/.rspec +3 -0
- data/Gemfile +29 -0
- data/LICENSE.adoc +31 -0
- data/README.md +3 -0
- data/Rakefile +53 -0
- data/bin/console +14 -0
- data/bin/interscript +5 -0
- data/bin/maps_analyze_staging +168 -0
- data/bin/maps_debug_compilers +58 -0
- data/bin/maps_debug_ordering +88 -0
- data/bin/maps_debug_ruby_compile +24 -0
- data/bin/maps_debug_step_by_step +44 -0
- data/bin/maps_optimize_order +112 -0
- data/bin/maps_v1_analyze_regexps +45 -0
- data/bin/maps_v1_to_v2 +426 -0
- data/bin/setup +8 -0
- data/exe/interscript +6 -0
- data/interscript.gemspec +31 -0
- data/lib/interscript.rb +80 -135
- data/lib/interscript/command.rb +5 -5
- data/lib/interscript/compiler.rb +22 -0
- data/lib/interscript/compiler/javascript.rb +292 -0
- data/lib/interscript/compiler/ruby.rb +262 -0
- data/lib/interscript/dsl.rb +67 -0
- data/lib/interscript/dsl/aliases.rb +23 -0
- data/lib/interscript/dsl/document.rb +46 -0
- data/lib/interscript/dsl/group.rb +45 -0
- data/lib/interscript/dsl/group/parallel.rb +6 -0
- data/lib/interscript/dsl/items.rb +89 -0
- data/lib/interscript/dsl/metadata.rb +26 -0
- data/lib/interscript/dsl/stage.rb +6 -0
- data/lib/interscript/dsl/symbol_mm.rb +11 -0
- data/lib/interscript/dsl/tests.rb +12 -0
- data/lib/interscript/interpreter.rb +251 -0
- data/lib/interscript/node.rb +25 -0
- data/lib/interscript/node/alias_def.rb +15 -0
- data/lib/interscript/node/dependency.rb +13 -0
- data/lib/interscript/node/document.rb +45 -0
- data/lib/interscript/node/group.rb +34 -0
- data/lib/interscript/node/group/parallel.rb +9 -0
- data/lib/interscript/node/group/sequential.rb +2 -0
- data/lib/interscript/node/item.rb +52 -0
- data/lib/interscript/node/item/alias.rb +42 -0
- data/lib/interscript/node/item/any.rb +61 -0
- data/lib/interscript/node/item/capture.rb +50 -0
- data/lib/interscript/node/item/group.rb +51 -0
- data/lib/interscript/node/item/repeat.rb +40 -0
- data/lib/interscript/node/item/stage.rb +23 -0
- data/lib/interscript/node/item/string.rb +51 -0
- data/lib/interscript/node/metadata.rb +18 -0
- data/lib/interscript/node/rule.rb +6 -0
- data/lib/interscript/node/rule/funcall.rb +18 -0
- data/lib/interscript/node/rule/run.rb +15 -0
- data/lib/interscript/node/rule/sub.rb +65 -0
- data/lib/interscript/node/stage.rb +19 -0
- data/lib/interscript/node/tests.rb +15 -0
- data/lib/interscript/stdlib.rb +211 -0
- data/lib/interscript/utils/regexp_converter.rb +283 -0
- data/lib/interscript/version.rb +1 -1
- data/requirements.txt +1 -0
- metadata +73 -458
- data/README.adoc +0 -296
- data/aliases.json +0 -1
- data/lib/g2pwrapper.py +0 -34
- data/lib/interscript/fs.rb +0 -96
- data/lib/interscript/mapping.rb +0 -144
- data/lib/interscript/opal.rb +0 -196
- data/lib/interscript/opal/entrypoint.rb +0 -20
- data/lib/interscript/opal/exports.rb +0 -11
- data/lib/interscript/opal/maps.js.erb +0 -8
- data/lib/model-7 +0 -0
- data/lib/tha-pt-b-7 +0 -0
- data/maps/acadsin-zho-Hani-Latn-2002.yaml +0 -38916
- data/maps/alalc-amh-Ethi-Latn-1997.yaml +0 -513
- data/maps/alalc-amh-Ethi-Latn-2011.yaml +0 -138
- data/maps/alalc-ara-Arab-Latn-1997.yaml +0 -1287
- data/maps/alalc-asm-Deva-Latn-1997.yaml +0 -259
- data/maps/alalc-asm-Deva-Latn-2012.yaml +0 -55
- data/maps/alalc-aze-Arab-Latn-1997.yaml +0 -376
- data/maps/alalc-aze-Cyrl-Latn-1997.yaml +0 -145
- data/maps/alalc-bel-Cyrl-Latn-1997.yaml +0 -129
- data/maps/alalc-ben-Beng-Latn-1997.yaml +0 -291
- data/maps/alalc-ben-Beng-Latn-2017.yaml +0 -130
- data/maps/alalc-bul-Cyrl-Latn-1997.yaml +0 -98
- data/maps/alalc-div-Thaa-Latn-1997.yaml +0 -211
- data/maps/alalc-ell-Grek-Latn-1997.yaml +0 -628
- data/maps/alalc-ell-Grek-Latn-2010.yaml +0 -626
- data/maps/alalc-guj-Gujr-Latn-1997.yaml +0 -266
- data/maps/alalc-guj-Gujr-Latn-2011.yaml +0 -64
- data/maps/alalc-hin-Deva-Latn-1997.yaml +0 -303
- data/maps/alalc-hin-Deva-Latn-2011.yaml +0 -65
- data/maps/alalc-kan-Kana-Latn-1997.yaml +0 -274
- data/maps/alalc-kan-Kana-Latn-2011.yaml +0 -63
- data/maps/alalc-kat-Geok-Latn-1997.yaml +0 -111
- data/maps/alalc-kat-Geor-Latn-1997.yaml +0 -150
- data/maps/alalc-kor-Hang-Latn-1997.yaml +0 -98
- data/maps/alalc-mal-Mlym-Latn-1997.yaml +0 -303
- data/maps/alalc-mal-Mlym-Latn-2012.yaml +0 -73
- data/maps/alalc-mar-Deva-Latn-1997.yaml +0 -189
- data/maps/alalc-mar-Deva-Latn-2011.yaml +0 -45
- data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +0 -114
- data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +0 -103
- data/maps/alalc-mon-Cyrl-Latn-1997.yaml +0 -220
- data/maps/alalc-ori-Orya-Latn-1997.yaml +0 -284
- data/maps/alalc-ori-Orya-Latn-2011.yaml +0 -67
- data/maps/alalc-pan-Guru-Latn-1997.yaml +0 -256
- data/maps/alalc-pan-Guru-Latn-2011.yaml +0 -78
- data/maps/alalc-per-Arab-Latn-1997.yaml +0 -375
- data/maps/alalc-pli-Deva-Latn-2012.yaml +0 -144
- data/maps/alalc-pra-Deva-Latn-2012.yaml +0 -47
- data/maps/alalc-rus-Cyrl-Latn-1997.yaml +0 -225
- data/maps/alalc-rus-Cyrl-Latn-2012.yaml +0 -162
- data/maps/alalc-san-Deva-Latn-2012.yaml +0 -241
- data/maps/alalc-sin-Sinh-Latn-1997.yaml +0 -292
- data/maps/alalc-sin-Sinh-Latn-2011.yaml +0 -71
- data/maps/alalc-srp-Cyrl-Latn-1997.yaml +0 -118
- data/maps/alalc-srp-Cyrl-Latn-2013.yaml +0 -135
- data/maps/alalc-tam-Taml-Latn-1997.yaml +0 -62
- data/maps/alalc-tam-Taml-Latn-2011.yaml +0 -58
- data/maps/alalc-tel-Telu-Latn-1997.yaml +0 -284
- data/maps/alalc-tel-Telu-Latn-2011.yaml +0 -64
- data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +0 -145
- data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +0 -16
- data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +0 -283
- data/maps/az-aze-Cyrl-Latn-1939.yaml +0 -105
- data/maps/az-aze-Cyrl-Latn-1958.yaml +0 -45
- data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +0 -174
- data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +0 -169
- data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +0 -292
- data/maps/bgn-kor-Hang-Latn-1943.yaml +0 -35
- data/maps/bgn-kor-Kore-Latn-1943.yaml +0 -31
- data/maps/bgna-bul-Cyrl-Latn-2006.yaml +0 -208
- data/maps/bgna-bul-Cyrl-Latn-2009.yaml +0 -208
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +0 -532
- data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +0 -598
- data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +0 -108
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +0 -111
- data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +0 -188
- data/maps/bgnpcgn-bal-Arab-Latn-2008.yaml +0 -329
- data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +0 -289
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +0 -119
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +0 -42
- data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +0 -184
- data/maps/bgnpcgn-div-Thaa-Latn-1988.yaml +0 -75
- data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +0 -705
- data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +0 -23
- data/maps/bgnpcgn-far-Latn-Latn-1964.yaml +0 -28
- data/maps/bgnpcgn-fas-Arab-Latn-1956.yaml +0 -96
- data/maps/bgnpcgn-isl-Latn-Latn-1964.yaml +0 -37
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +0 -257
- data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +0 -131
- data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +0 -42
- data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.yaml +0 -247
- data/maps/bgnpcgn-kir-Cyrl-Latn-1979.yaml +0 -218
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +0 -253
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +0 -48
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +0 -48
- data/maps/bgnpcgn-kur-Arab-Latn-2007.yaml +0 -249
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +0 -163
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +0 -190
- data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +0 -223
- data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +0 -230
- data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +0 -338
- data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +0 -673
- data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +0 -459
- data/maps/bgnpcgn-pus-Arab-Latn-1968.yaml +0 -377
- data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +0 -168
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +0 -318
- data/maps/bgnpcgn-srp-Cyrl-Latn-1962.yaml +0 -73
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +0 -170
- data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +0 -220
- data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +0 -240
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +0 -166
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +0 -119
- data/maps/bgnpcgn-urd-Arab-Latn-2007.yaml +0 -459
- data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +0 -127
- data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +0 -82
- data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +0 -7456
- data/maps/bis-asm-Beng-Latn-13194-1991.yaml +0 -159
- data/maps/bis-ben-Beng-Latn-13194-1991.yaml +0 -156
- data/maps/bis-dev-Deva-Latn-13194-1991.yaml +0 -184
- data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +0 -181
- data/maps/bis-kan-Kana-Latn-13194-1991.yaml +0 -173
- data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +0 -176
- data/maps/bis-ori-Orya-Latn-13194-1991.yaml +0 -175
- data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +0 -175
- data/maps/bis-tel-Telu-Latn-13194-1991.yaml +0 -170
- data/maps/bis-tml-Taml-Latn-13194-1991.yaml +0 -155
- data/maps/by-bel-Cyrl-Latn-1998.yaml +0 -172
- data/maps/by-bel-Cyrl-Latn-2007.yaml +0 -115
- data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +0 -899
- data/maps/din-hin-Deva-Latn-33904-2018.yaml +0 -100
- data/maps/din-kat-Geor-Latn-32707-2010.yaml +0 -145
- data/maps/din-mar-Deva-Latn-33904-2018.yaml +0 -84
- data/maps/din-nep-Deva-Latn-33904-2018.yaml +0 -119
- data/maps/din-pli-Deva-Latn-33904-2018.yaml +0 -75
- data/maps/din-pra-Deva-Latn-33904-2018.yaml +0 -63
- data/maps/din-san-Deva-Latn-33904-2018.yaml +0 -338
- data/maps/din-tam-Taml-Latn-33903-2016.yaml +0 -213
- data/maps/dos-nep-Deva-Latn-1997.yaml +0 -47
- data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +0 -684
- data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +0 -680
- data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +0 -19
- data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +0 -31
- data/maps/ggg-kat-Geor-Latn-2002.yaml +0 -92
- data/maps/gki-bel-Cyrl-Latn-1992.yaml +0 -33
- data/maps/gki-bel-Cyrl-Latn-2000.yaml +0 -201
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +0 -190
- data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +0 -157
- data/maps/hk-yue-Hani-Latn-1888.yaml +0 -38497
- data/maps/icao-bel-Cyrl-Latn-9303.yaml +0 -136
- data/maps/icao-bul-Cyrl-Latn-9303.yaml +0 -118
- data/maps/icao-fas-Arab-Latn-9303.yaml +0 -103
- data/maps/icao-heb-Hebr-Latn-9303.yaml +0 -151
- data/maps/icao-mkd-Cyrl-Latn-9303.yaml +0 -117
- data/maps/icao-rus-Cyrl-Latn-9303.yaml +0 -117
- data/maps/icao-srp-Cyrl-Latn-9303.yaml +0 -117
- data/maps/icao-ukr-Cyrl-Latn-9303.yaml +0 -119
- data/maps/iso-ara-Arab-Latn-233-1984.yaml +0 -323
- data/maps/iso-asm-Beng-Latn-15919-2001.yaml +0 -75
- data/maps/iso-ben-Beng-Latn-15919-2001.yaml +0 -175
- data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +0 -613
- data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +0 -44
- data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +0 -220
- data/maps/iso-hin-Deva-Latn-15919-2001.yaml +0 -87
- data/maps/iso-inc-Deva-Latn-15919-2001.yaml +0 -61
- data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +0 -66
- data/maps/iso-kan-Kana-Latn-15919-2001.yaml +0 -220
- data/maps/iso-kat-Geor-Latn-9984-1996.yaml +0 -145
- data/maps/iso-kor-Hang-Latn-1996-method1.yaml +0 -240
- data/maps/iso-kor-Hang-Latn-1996-method2.yaml +0 -226
- data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +0 -281
- data/maps/iso-mar-Deva-Latn-15919-2001.yaml +0 -75
- data/maps/iso-nep-Deva-Latn-15919-2001.yaml +0 -87
- data/maps/iso-ori-Orya-Latn-15919-2001.yaml +0 -193
- data/maps/iso-pan-Guru-Latn-15919-2001.yaml +0 -222
- data/maps/iso-pli-Beng-Latn-15919-2001.yaml +0 -73
- data/maps/iso-pli-Deva-Latn-15919-2001.yaml +0 -74
- data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +0 -219
- data/maps/iso-pli-Thai-Latn-15919-2001.yaml +0 -55
- data/maps/iso-pra-Deva-Latn-15919-2001.yaml +0 -59
- data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +0 -366
- data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +0 -271
- data/maps/iso-san-Deva-Latn-15919-2001.yaml +0 -220
- data/maps/iso-tam-Taml-Latn-15919-2001.yaml +0 -159
- data/maps/iso-tel-Telu-Latn-15919-2001.yaml +0 -220
- data/maps/iso-tha-Thai-Latn-11940-1998.yaml +0 -109
- data/maps/kp-kor-Hang-Latn-2002.yaml +0 -909
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +0 -44820
- data/maps/masm-mon-Cyrl-Latn-5217-2012.yaml +0 -163
- data/maps/masm-mon-Latn-Cyrl-5217-2012.yaml +0 -200
- data/maps/mext-jpn-Hrkt-Latn-1954.yaml +0 -411
- data/maps/moct-kor-Hang-Latn-2000.yaml +0 -807
- data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +0 -541
- data/maps/mv-div-Thaa-Latn-1987.yaml +0 -200
- data/maps/mvd-bel-Cyrl-Latn-2008.yaml +0 -225
- data/maps/mvd-bel-Cyrl-Latn-2010.yaml +0 -63
- data/maps/mvd-rus-Cyrl-Latn-2008.yaml +0 -109
- data/maps/mvd-rus-Cyrl-Latn-2010.yaml +0 -37
- data/maps/odni-ara-Arab-Latn-2004.yaml +0 -137
- data/maps/odni-ara-Arab-Latn-2015.yaml +0 -315
- data/maps/odni-aze-Cyrl-Latn-2015.yaml +0 -144
- data/maps/odni-bel-Cyrl-Latn-2015.yaml +0 -148
- data/maps/odni-bul-Cyrl-Latn-2005.yaml +0 -90
- data/maps/odni-bul-Cyrl-Latn-2015.yaml +0 -96
- data/maps/odni-che-Cyrl-Latn-2015.yaml +0 -169
- data/maps/odni-fas-Arab-Latn-2004.yaml +0 -276
- data/maps/odni-fas-Arab-Latn-2015.yaml +0 -406
- data/maps/odni-hin-Deva-Latn-2004.yaml +0 -182
- data/maps/odni-hin-Deva-Latn-2015.yaml +0 -258
- data/maps/odni-kat-Geor-Latn-2015.yaml +0 -87
- data/maps/odni-kaz-Cyrl-Latn-2015.yaml +0 -148
- data/maps/odni-kir-Cyrl-Latn-2015.yaml +0 -136
- data/maps/odni-kor-Hang-Latn-2015.yaml +0 -375
- data/maps/odni-mkd-Cyrl-Latn-2005.yaml +0 -21
- data/maps/odni-mkd-Cyrl-Latn-2015.yaml +0 -122
- data/maps/odni-prs-Arab-Latn-2004.yaml +0 -123
- data/maps/odni-prs-Arab-Latn-2015.yaml +0 -228
- data/maps/odni-rus-Cyrl-Latn-2015.yaml +0 -77
- data/maps/odni-srp-Cyrl-Latn-2005.yaml +0 -36
- data/maps/odni-srp-Cyrl-Latn-2015.yaml +0 -129
- data/maps/odni-tat-Cyrl-Latn-2015.yaml +0 -142
- data/maps/odni-tgk-Cyrl-Latn-2015.yaml +0 -148
- data/maps/odni-tuk-Cyrl-Latn-2015.yaml +0 -170
- data/maps/odni-uig-Cyrl-Latn-2015.yaml +0 -138
- data/maps/odni-ukr-Cyrl-Latn-2015.yaml +0 -161
- data/maps/odni-urd-Arab-Latn-2015.yaml +0 -221
- data/maps/odni-uzb-Cyrl-Latn-2015.yaml +0 -166
- data/maps/royin-tha-Thai-Latn-1939-generic.yaml +0 -90
- data/maps/royin-tha-Thai-Latn-1968.yaml +0 -183
- data/maps/royin-tha-Thai-Latn-1999-chained.yaml +0 -180
- data/maps/royin-tha-Thai-Latn-1999.yaml +0 -80
- data/maps/sac-zho-Hans-Latn-1979.yaml +0 -24763
- data/maps/sasm-mon-Mong-Latn-general-1978.yaml +0 -389
- data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +0 -354
- data/maps/ses-ara-Arab-Latn-1930.yaml +0 -283
- data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +0 -222
- data/maps/ua-ukr-Cyrl-Latn-1996.yaml +0 -197
- data/maps/ua-ukr-Cyrl-Latn-2007.yaml +0 -75
- data/maps/ua-ukr-Cyrl-Latn-2010.yaml +0 -192
- data/maps/un-amh-Ethi-Latn-2016.yaml +0 -602
- data/maps/un-ara-Arab-Latn-1971.yaml +0 -139
- data/maps/un-ara-Arab-Latn-1972.yaml +0 -159
- data/maps/un-ara-Arab-Latn-2017.yaml +0 -420
- data/maps/un-asm-Beng-Latn-1972.yaml +0 -223
- data/maps/un-bel-Cyrl-Latn-2007.yaml +0 -114
- data/maps/un-ben-Beng-Latn-2016.yaml +0 -534
- data/maps/un-ell-Grek-Latn-1987-phonetic.yaml +0 -780
- data/maps/un-ell-Grek-Latn-1987-tl.yaml +0 -31
- data/maps/un-ell-Grek-Latn-1987-ts.yaml +0 -19
- data/maps/un-guj-Gujr-Latn-1972.yaml +0 -229
- data/maps/un-hin-Deva-Latn-2016.yaml +0 -316
- data/maps/un-kan-Kana-Latn-2016.yaml +0 -254
- data/maps/un-mal-Mlym-Latn-1972.yaml +0 -251
- data/maps/un-mar-Deva-Latn-2016.yaml +0 -102
- data/maps/un-mon-Mong-Latn-general-2013.yaml +0 -264
- data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +0 -264
- data/maps/un-nep-Deva-Latn-1972.yaml +0 -269
- data/maps/un-nep-Deva-Latn-2013.yaml +0 -74
- data/maps/un-ori-Orya-Latn-1972.yaml +0 -247
- data/maps/un-pan-Guru-Latn-1972.yaml +0 -402
- data/maps/un-prs-Arab-Latn-1967.yaml +0 -236
- data/maps/un-rus-Cyrl-Latn-1987.yaml +0 -166
- data/maps/un-tam-Taml-Latn-1972.yaml +0 -194
- data/maps/un-tel-Telu-Latn-1972.yaml +0 -270
- data/maps/un-ukr-Cyrl-Latn-1998.yaml +0 -53
- data/maps/un-ukr-Cyrl-Latn-2012.yaml +0 -162
- data/maps/un-urd-Arab-Latn-1972.yaml +0 -405
- data/maps/var-amh-Ethi-Latn-eae-2003.yaml +0 -466
- data/maps/var-gez-Ethi-Latn-eae-2003.yaml +0 -76
- data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +0 -221
- data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +0 -406
- data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +0 -386
- data/maps/var-kor-Hang-Hang-jamo.yaml +0 -11193
- data/maps/var-kor-Hang-Latn-mr-1939.yaml +0 -1054
- data/maps/var-kor-Kore-Hang-2013.yaml +0 -59754
- data/maps/var-kor-Kore-Latn-mr-1939.yaml +0 -36
- data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +0 -43
- data/maps/var-mon-Mong-Latn-1930.yaml +0 -102
- data/maps/var-mon-Mong-Latn-lessing.yaml +0 -272
- data/maps/var-mon-Mong-Latn-vpmc.yaml +0 -274
- data/maps/var-pra-Deva-Latn-iast-1912.yaml +0 -30
- data/maps/var-san-Deva-Latn-iast-1912.yaml +0 -149
- data/maps/var-tha-Thai-Thai-phonemic.yaml +0 -59
- data/maps/var-tha-Thai-Zsym-ipa.yaml +0 -301
- data/maps/var-zho-Hani-Latn-wd-1979.yaml +0 -38912
- data/spec/interscript/filenames_spec.rb +0 -21
- data/spec/interscript/mapping_spec.rb +0 -42
- data/spec/interscript_spec.rb +0 -37
- data/spec/spec_helper.rb +0 -3
@@ -1,75 +0,0 @@
|
|
1
|
-
---
|
2
|
-
authority_id: din
|
3
|
-
id: 33904-2018
|
4
|
-
language: iso-639-2:pli
|
5
|
-
source_script: Deva
|
6
|
-
destination_script: Latn
|
7
|
-
name: "DIN 33904:2018-10 Information and documentation - Romanization Devanagari, Pali"
|
8
|
-
url: https://www.beuth.de/en/standard/din-33904/293049024
|
9
|
-
creation_date: 2018
|
10
|
-
description: |
|
11
|
-
Pali system.
|
12
|
-
|
13
|
-
This standard specifies the transliteration of all languages of the Devanāgarī characters into Latin letters firmly.
|
14
|
-
It is suitable for any application.
|
15
|
-
|
16
|
-
notes:
|
17
|
-
- |
|
18
|
-
Vowels:
|
19
|
-
The Ardhacandra ॅ is often used to denote English vowels:
|
20
|
-
EXAMPLE
|
21
|
-
बॅट bêṭa (bat)
|
22
|
-
डॉक्टर ḍôkṭara (doctor)
|
23
|
-
- |
|
24
|
-
Consonants:
|
25
|
-
|
26
|
-
Since the Devanāgarī script is a syllabic script, it becomes -a inherent in the consonant.
|
27
|
-
Always written during transliteration, also in the final part
|
28
|
-
EXAMPLE 1
|
29
|
-
पुस्तक pustaka
|
30
|
-
|
31
|
-
A line under the consonant, the so-called Virāma, means in the Devanāgarī script that that inherent -a not applicable.
|
32
|
-
EXAMPLE 2
|
33
|
-
वाक् vāk
|
34
|
-
|
35
|
-
The anusvāra is always represented with -ṃ-.
|
36
|
-
EXAMPLE 3
|
37
|
-
संसकरण saṃskaraṇa
|
38
|
-
|
39
|
-
Before k, kh, g, gh, c, ch, j, jh, ṭ, ṭh, ḍ, ḍh, t, th, d, dh, p, ph, b, bh, the anusvāra becomes the class nasal transformed.
|
40
|
-
EXAMPLE 4
|
41
|
-
तंघी kaṃghī becomes kaṅghī
|
42
|
-
पंजाबी paṃjābī becomes pañjābī
|
43
|
-
पंडित paṃḍita becomes paṇḍita
|
44
|
-
संधी saṃdhī becomes sandhī
|
45
|
-
दिसंबर disaṃbara becomes disambara
|
46
|
-
|
47
|
-
Anunāsika or Candrabindu signals the nasalization of vowels
|
48
|
-
|
49
|
-
EXAMPLE 5
|
50
|
-
माँ māṁ
|
51
|
-
|
52
|
-
tests:
|
53
|
-
- source: "तेन खो पन समयेन वेसालिया अविदूरे कलन्दगामो नाम अत्थि"
|
54
|
-
expected: "tena kho pana samayena vesāliyā avidūre kalandagāmo nāma atthi"
|
55
|
-
- source: "तत्थ सुदिन्नो नाम कलन्दपुत्तो सेट्ठिपुत्तो होति"
|
56
|
-
expected: "tattha sudinno nāma kalandaputto seṭṭhiputto hoti"
|
57
|
-
- source: "अथ खो सुदिन्नो कलन्दपुत्तो सम्बहुलेहि"
|
58
|
-
expected: "atha kho sudinno kalandaputto sambahulehi"
|
59
|
-
- source: "तथा चतुर्भिः पुरुषः परीक्ष्यते त्यागेन शीलेन गुणेन कर्मणा"
|
60
|
-
expected: "tathā caturbhiḥ puruṣaḥ parīkṣyate tyāgena śīlena guṇena karmaṇā"
|
61
|
-
- source: "अथ खो सुदिन्नो कलन्दपुत्तो अचिरवुट्ठिताय परिसाय येन भगवा तेनुपसङ्कमि; उपसङ्कमित्वा भगवन्तं अभिवादेत्वा एकमन्तं निसीदि"
|
62
|
-
expected: "atha kho sudinno kalandaputto aciravuṭṭhitāya parisāya yena bhagavā tenupasaṅkami; upasaṅkamitvā bhagavantaṃ abhivādetvā ekamantaṃ nisīdi"
|
63
|
-
- source: "अथ खो सुदिन्नस्स कलन्दपुत्तस्स मातापितरो सुदिन्नं कलन्दपुत्तं एतदवोचुं"
|
64
|
-
expected: "atha kho sudinnassa kalandaputtassa mātāpitaro sudinnaṃ kalandaputtaṃ etadavocuṃ"
|
65
|
-
- source: "त्वं खोसि, तात सुदिन्न, अम्हाकं एकपुत्तको पियो मनापो सुखेधितो सुखपरिहतो"
|
66
|
-
expected: "tvaṃ khosi, tāta sudinna, amhākaṃ ekaputtako piyo manāpo sukhedhito sukhaparihato"
|
67
|
-
- source: "न त्वं, तात सुदिन्न, किञ्चि दुक्खस्स जानासि"
|
68
|
-
expected: "na tvaṃ, tāta sudinna, kiñci dukkhassa jānāsi"
|
69
|
-
- source: "अनुञ्ञातोम्हि किर मातापितूहि अगारस्मा अनगारियं पब्बज्जाया’’ति, हट्ठो उदग्गो पाणिना गत्तानि परिपुञ्छन्तो वुट्ठासि"
|
70
|
-
expected: "anuññātomhi kira mātāpitūhi agārasmā anagāriyaṃ pabbajjāyā’’ti, haṭṭho udaggo pāṇinā gattāni paripuñchanto vuṭṭhāsi"
|
71
|
-
|
72
|
-
|
73
|
-
map:
|
74
|
-
|
75
|
-
inherit: 'din-san-Deva-Latn-33904-2018'
|
@@ -1,63 +0,0 @@
|
|
1
|
-
---
|
2
|
-
authority_id: din
|
3
|
-
id: 33904-2018
|
4
|
-
language: iso-639-2:pra
|
5
|
-
source_script: Deva
|
6
|
-
destination_script: Latn
|
7
|
-
name: "DIN 33904:2018-10 Information and documentation - Romanization Devanagari, Prakit"
|
8
|
-
url: https://www.beuth.de/en/standard/din-33904/293049024
|
9
|
-
creation_date: 2018
|
10
|
-
description: |
|
11
|
-
Prakit system.
|
12
|
-
|
13
|
-
This standard specifies the transliteration of all languages of the Devanāgarī characters into Latin letters firmly.
|
14
|
-
It is suitable for any application.
|
15
|
-
|
16
|
-
notes:
|
17
|
-
- |
|
18
|
-
Vowels:
|
19
|
-
The Ardhacandra ॅ is often used to denote English vowels:
|
20
|
-
EXAMPLE
|
21
|
-
बॅट bêṭa (bat)
|
22
|
-
डॉक्टर ḍôkṭara (doctor)
|
23
|
-
- |
|
24
|
-
Consonants:
|
25
|
-
|
26
|
-
Since the Devanāgarī script is a syllabic script, it becomes -a inherent in the consonant.
|
27
|
-
Always written during transliteration, also in the final part
|
28
|
-
EXAMPLE 1
|
29
|
-
पुस्तक pustaka
|
30
|
-
|
31
|
-
A line under the consonant, the so-called Virāma, means in the Devanāgarī script that that inherent -a not applicable.
|
32
|
-
EXAMPLE 2
|
33
|
-
वाक् vāk
|
34
|
-
|
35
|
-
The anusvāra is always represented with -ṃ-.
|
36
|
-
EXAMPLE 3
|
37
|
-
संसकरण saṃskaraṇa
|
38
|
-
|
39
|
-
Before k, kh, g, gh, c, ch, j, jh, ṭ, ṭh, ḍ, ḍh, t, th, d, dh, p, ph, b, bh, the anusvāra becomes the class nasal transformed.
|
40
|
-
EXAMPLE 4
|
41
|
-
तंघी kaṃghī becomes kaṅghī
|
42
|
-
पंजाबी paṃjābī becomes pañjābī
|
43
|
-
पंडित paṃḍita becomes paṇḍita
|
44
|
-
संधी saṃdhī becomes sandhī
|
45
|
-
दिसंबर disaṃbara becomes disambara
|
46
|
-
|
47
|
-
Anunāsika or Candrabindu signals the nasalization of vowels
|
48
|
-
|
49
|
-
EXAMPLE 5
|
50
|
-
माँ māṁ
|
51
|
-
|
52
|
-
tests:
|
53
|
-
- source: "सृष्टिस्थितिविनाशानां शक्तिभूते सनातनि"
|
54
|
-
expected: "sṛṣṭisthitivināśānāṃ śaktibhūte sanātani"
|
55
|
-
- source: "गुणाश्रये गुणमये नारायणि नमोऽस्तु ते"
|
56
|
-
expected: "guṇāśraye guṇamaye nārāyaṇi namo’stu te"
|
57
|
-
- source: "तेन समयेन बुद्धो भगवा सावत्थियं विहरति जेतवने अनाथपिण्डिकस्स आरामे"
|
58
|
-
expected: "tena samayena buddho bhagavā sāvatthiyaṃ viharati jetavane anāthapiṇḍikassa ārāme"
|
59
|
-
|
60
|
-
|
61
|
-
map:
|
62
|
-
|
63
|
-
inherit: 'din-san-Deva-Latn-33904-2018'
|
@@ -1,338 +0,0 @@
|
|
1
|
-
---
|
2
|
-
authority_id: din
|
3
|
-
id: 33904-2018
|
4
|
-
language: iso-639-2:san
|
5
|
-
source_script: Deva
|
6
|
-
destination_script: Latn
|
7
|
-
name: "DIN 33904:2018-10 Information and documentation - Romanization Devanagari, Sanskrit"
|
8
|
-
url: https://www.beuth.de/en/standard/din-33904/293049024
|
9
|
-
creation_date: 2018
|
10
|
-
description: |
|
11
|
-
Sanskrit system.
|
12
|
-
|
13
|
-
This standard specifies the transliteration of all languages of the Devanāgarī characters into Latin letters firmly.
|
14
|
-
It is suitable for any application.
|
15
|
-
|
16
|
-
notes:
|
17
|
-
- |
|
18
|
-
Vowels:
|
19
|
-
The Ardhacandra ॅ is often used to denote English vowels:
|
20
|
-
EXAMPLE
|
21
|
-
बॅट bêṭa (bat)
|
22
|
-
डॉक्टर ḍôkṭara (doctor)
|
23
|
-
- |
|
24
|
-
Consonants:
|
25
|
-
|
26
|
-
Since the Devanāgarī script is a syllabic script, it becomes -a inherent in the consonant.
|
27
|
-
Always written during transliteration, also in the final part
|
28
|
-
EXAMPLE 1
|
29
|
-
पुस्तक pustaka
|
30
|
-
|
31
|
-
A line under the consonant, the so-called Virāma, means in the Devanāgarī script that that inherent -a not applicable.
|
32
|
-
EXAMPLE 2
|
33
|
-
वाक् vāk
|
34
|
-
|
35
|
-
The anusvāra is always represented with -ṃ-.
|
36
|
-
EXAMPLE 3
|
37
|
-
संसकरण saṃskaraṇa
|
38
|
-
|
39
|
-
Before k, kh, g, gh, c, ch, j, jh, ṭ, ṭh, ḍ, ḍh, t, th, d, dh, p, ph, b, bh, the anusvāra becomes the class nasal transformed.
|
40
|
-
EXAMPLE 4
|
41
|
-
तंघी kaṃghī becomes kaṅghī
|
42
|
-
पंजाबी paṃjābī becomes pañjābī
|
43
|
-
पंडित paṃḍita becomes paṇḍita
|
44
|
-
संधी saṃdhī becomes sandhī
|
45
|
-
दिसंबर disaṃbara becomes disambara
|
46
|
-
|
47
|
-
Anunāsika or Candrabindu signals the nasalization of vowels
|
48
|
-
|
49
|
-
EXAMPLE 5
|
50
|
-
माँ māṁ
|
51
|
-
|
52
|
-
tests:
|
53
|
-
- source: "पुस्तक"
|
54
|
-
expected: "pustaka"
|
55
|
-
- source: "बॅट"
|
56
|
-
expected: "bêṭa"
|
57
|
-
- source: "वाक्"
|
58
|
-
expected: "vāk"
|
59
|
-
- source: "पंजाबी"
|
60
|
-
expected: "pañjābī"
|
61
|
-
- source: "डॉक्टर"
|
62
|
-
expected: "ḍôkṭara"
|
63
|
-
- source: "पंडित"
|
64
|
-
expected: "paṇḍita"
|
65
|
-
- source: "संधी"
|
66
|
-
expected: "sandhī"
|
67
|
-
- source: "दिसंबर"
|
68
|
-
expected: "disambara"
|
69
|
-
- source: "संसकरण"
|
70
|
-
expected: "saṃsakaraṇa"
|
71
|
-
- source: "माँ"
|
72
|
-
expected: "māṁ"
|
73
|
-
- source: "शुभाशुभपरित्यागी भक्तिमान्यः स मे प्रियः"
|
74
|
-
expected: "śubhāśubhaparityāgī bhaktimānyaḥ sa me priyaḥ"
|
75
|
-
- source: "सत्य -सत्यमेवेश्वरो लोके सत्ये धर्मः सदाश्रितः"
|
76
|
-
expected: "satya -satyameveśvaro loke satye dharmaḥ sadāśritaḥ"
|
77
|
-
- source: "सत्यमूलनि सर्वाणि सत्यान्नास्ति परं पदम्"
|
78
|
-
expected: "satyamūlani sarvāṇi satyānnāsti paraṃ padam"
|
79
|
-
- source: "पिता माताग्निरात्मा च गुरुश्च भरतर्षभ"
|
80
|
-
expected: "pitā mātāgnirātmā ca guruśca bharatarṣabha"
|
81
|
-
- source: "०१२३४५६७८९"
|
82
|
-
expected: "0123456789"
|
83
|
-
|
84
|
-
map:
|
85
|
-
|
86
|
-
rules:
|
87
|
-
- pattern: \u0902(?=[कक़खख़गग़घङ])
|
88
|
-
result: ṅ
|
89
|
-
- pattern: \u0902(?=[चछजज़झञ])
|
90
|
-
result: ñ
|
91
|
-
- pattern: \u0902(?=[टट़ठडड़ढढ़ण])
|
92
|
-
result: ṇ
|
93
|
-
- pattern: \u0902(?=[तथदधन])
|
94
|
-
result: n
|
95
|
-
- pattern: \u0902(?=[पफबभम])
|
96
|
-
result: m
|
97
|
-
|
98
|
-
- pattern: \u0902(?=[कखगघचछजझतथदधपफबभटठडढ])
|
99
|
-
result: "ñ"
|
100
|
-
|
101
|
-
- pattern: ([क]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
102
|
-
result: 'k'
|
103
|
-
- pattern: ([ख]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
104
|
-
result: 'kh'
|
105
|
-
- pattern: ([ग]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
106
|
-
result: 'g'
|
107
|
-
- pattern: ([घ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
108
|
-
result: 'gh'
|
109
|
-
- pattern: ([ङ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
110
|
-
result: 'ṅ'
|
111
|
-
- pattern: ([च]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
112
|
-
result: 'c'
|
113
|
-
- pattern: ([छ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
114
|
-
result: 'ch'
|
115
|
-
- pattern: ([ज]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
116
|
-
result: 'j'
|
117
|
-
- pattern: ([झ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
118
|
-
result: 'jh'
|
119
|
-
- pattern: ([ञ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
120
|
-
result: 'ñ'
|
121
|
-
- pattern: ([ट]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
122
|
-
result: 'ṭ'
|
123
|
-
- pattern: ([ठ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
124
|
-
result: 'ṭh'
|
125
|
-
- pattern: ([ड]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
126
|
-
result: 'ḍ'
|
127
|
-
- pattern: ([ढ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
128
|
-
result: 'ḍh'
|
129
|
-
- pattern: ([ण]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
130
|
-
result: 'ṇ'
|
131
|
-
- pattern: ([त]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
132
|
-
result: 't'
|
133
|
-
- pattern: ([थ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
134
|
-
result: 'th'
|
135
|
-
- pattern: ([द]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
136
|
-
result: 'd'
|
137
|
-
- pattern: ([ध]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
138
|
-
result: 'dh'
|
139
|
-
- pattern: ([न]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
140
|
-
result: 'n'
|
141
|
-
- pattern: ([प]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
142
|
-
result: 'p'
|
143
|
-
- pattern: ([फ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
144
|
-
result: 'ph'
|
145
|
-
- pattern: ([ब]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
146
|
-
result: 'b'
|
147
|
-
- pattern: ([भ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
148
|
-
result: 'bh'
|
149
|
-
- pattern: ([म]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
150
|
-
result: 'm'
|
151
|
-
- pattern: ([य]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
152
|
-
result: 'y'
|
153
|
-
- pattern: ([र]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
154
|
-
result: 'r'
|
155
|
-
- pattern: ([ल]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
156
|
-
result: 'l'
|
157
|
-
- pattern: ([ळ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
158
|
-
result: 'ḷ'
|
159
|
-
- pattern: ([व]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
160
|
-
result: 'v'
|
161
|
-
- pattern: ([श]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
162
|
-
result: 'ś'
|
163
|
-
- pattern: ([ष]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
164
|
-
result: 'ṣ'
|
165
|
-
- pattern: ([स]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
166
|
-
result: 's'
|
167
|
-
- pattern: ([ह]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C])
|
168
|
-
result: 'h'
|
169
|
-
|
170
|
-
characters:
|
171
|
-
|
172
|
-
# I. Vowels and Diphthongs (see Note 1)
|
173
|
-
|
174
|
-
'अ': 'a'
|
175
|
-
'आ': 'ā'
|
176
|
-
'इ': 'i'
|
177
|
-
'ई': 'ī'
|
178
|
-
'उ': 'u'
|
179
|
-
'ऊ': 'ū'
|
180
|
-
'ऋ': 'ṛ'
|
181
|
-
'ॠ': 'ṝ'
|
182
|
-
'ऌ': 'ḷ'
|
183
|
-
'ए': 'e'
|
184
|
-
'ऎ': 'ĕ'
|
185
|
-
'ऐ': 'ai'
|
186
|
-
'ओ': 'o'
|
187
|
-
'ऒ': 'ŏ'
|
188
|
-
'औ': 'au'
|
189
|
-
|
190
|
-
|
191
|
-
# II. Consonants (see Note 2)
|
192
|
-
# Gutturals
|
193
|
-
'क': 'ka'
|
194
|
-
'ख': 'kha'
|
195
|
-
'ग': 'ga'
|
196
|
-
'घ': 'gha'
|
197
|
-
'ङ': 'ṅa'
|
198
|
-
|
199
|
-
# Palatals
|
200
|
-
'च': 'ca'
|
201
|
-
'छ': 'cha'
|
202
|
-
'ज': 'ja'
|
203
|
-
'झ': 'jha'
|
204
|
-
'ञ': 'ña'
|
205
|
-
|
206
|
-
# Cerebrals
|
207
|
-
'ट': 'ṭa'
|
208
|
-
'ठ': 'ṭha'
|
209
|
-
'ड': 'ḍa'
|
210
|
-
'ढ': 'ḍha'
|
211
|
-
'ण': 'ṇa'
|
212
|
-
|
213
|
-
# Dentals
|
214
|
-
'त': 'ta'
|
215
|
-
'थ': 'tha'
|
216
|
-
'द': 'da'
|
217
|
-
'ध': 'dha'
|
218
|
-
'न': 'na'
|
219
|
-
|
220
|
-
# Labials
|
221
|
-
'प': 'pa'
|
222
|
-
'फ': 'pha'
|
223
|
-
'ब': 'ba'
|
224
|
-
'भ': 'bha'
|
225
|
-
'म': 'ma'
|
226
|
-
|
227
|
-
# Semivowels
|
228
|
-
'य': 'ya'
|
229
|
-
'र': 'ra'
|
230
|
-
'ल': 'la'
|
231
|
-
'ळ': 'ḷa'
|
232
|
-
'व': 'va'
|
233
|
-
|
234
|
-
# Sibilants
|
235
|
-
'श': 'śa'
|
236
|
-
'ष': 'ṣa'
|
237
|
-
'स': 'sa'
|
238
|
-
|
239
|
-
# Aspirate
|
240
|
-
'ह': 'ha'
|
241
|
-
|
242
|
-
# Anusvāra
|
243
|
-
'ं': 'ṃ'
|
244
|
-
|
245
|
-
# Bisarga
|
246
|
-
'ः': 'ḥ'
|
247
|
-
|
248
|
-
# Anunāsika
|
249
|
-
'ँ': 'ṁ'
|
250
|
-
|
251
|
-
# Abagraha
|
252
|
-
'ऽ': '’' # (apostrophe)
|
253
|
-
|
254
|
-
# Medials # Needed for connecting constants
|
255
|
-
'ा': "ā"
|
256
|
-
'ि': "i"
|
257
|
-
'ी': "ī"
|
258
|
-
'ु': "u"
|
259
|
-
'ू': "ū"
|
260
|
-
'ृ': "ṛ"
|
261
|
-
'ॄ': "ṝ"
|
262
|
-
'◌': "ṝ"
|
263
|
-
'ॢ': "ḷ"
|
264
|
-
'ॣ': "ḹ"
|
265
|
-
'े': "e"
|
266
|
-
'ै': "ai"
|
267
|
-
'ो': "o"
|
268
|
-
'ौ': "au"
|
269
|
-
'ॉ': "ô"
|
270
|
-
'ॅ': "ê"
|
271
|
-
'': ''# Used for joining
|
272
|
-
|
273
|
-
|
274
|
-
|
275
|
-
# For consonant Virāma
|
276
|
-
# Gutturals
|
277
|
-
'क्': 'k'
|
278
|
-
'ख्': 'kh'
|
279
|
-
'ग्': 'g'
|
280
|
-
'घ्': 'gh'
|
281
|
-
'ङ्': 'ṅ'
|
282
|
-
|
283
|
-
# Palatals
|
284
|
-
'च्': 'c'
|
285
|
-
'छ्': 'ch'
|
286
|
-
'ज्': 'j'
|
287
|
-
'झ्': 'jh'
|
288
|
-
'ञ्': 'ñ'
|
289
|
-
|
290
|
-
# Cerebrals
|
291
|
-
'ट्': 'ṭ'
|
292
|
-
'ठ्': 'ṭh'
|
293
|
-
'ड्': 'ḍ'
|
294
|
-
'ढ्': 'ḍh'
|
295
|
-
'ण्': 'ṇ'
|
296
|
-
|
297
|
-
# Dentals
|
298
|
-
'त्': 't'
|
299
|
-
'थ्': 'th'
|
300
|
-
'द्': 'd'
|
301
|
-
'ध्': 'dh'
|
302
|
-
'न्': 'n'
|
303
|
-
|
304
|
-
# Labials
|
305
|
-
'प्': 'p'
|
306
|
-
'फ्': 'ph'
|
307
|
-
'ब्': 'b'
|
308
|
-
'भ्': 'bh'
|
309
|
-
'म्': 'm'
|
310
|
-
|
311
|
-
# Semivowels
|
312
|
-
'य्': 'y'
|
313
|
-
'र्': 'r'
|
314
|
-
'ल्': 'l'
|
315
|
-
'ळ्': 'ḷ'
|
316
|
-
'व्': 'v'
|
317
|
-
|
318
|
-
# Sibilants
|
319
|
-
'श्': 'ś'
|
320
|
-
'ष्': 'ṣ'
|
321
|
-
'स्': 's'
|
322
|
-
|
323
|
-
# Aspirate
|
324
|
-
'ह्': 'h'
|
325
|
-
|
326
|
-
# digits
|
327
|
-
|
328
|
-
'०': '0'
|
329
|
-
'१': '1'
|
330
|
-
'२': '2'
|
331
|
-
'३': '3'
|
332
|
-
'४': '4'
|
333
|
-
'५': '5'
|
334
|
-
'६': '6'
|
335
|
-
'७': '7'
|
336
|
-
'८': '8'
|
337
|
-
'९': '9'
|
338
|
-
|