interscript 0.1.7 → 2.1.0b1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/.gitignore +11 -0
- data/.rspec +3 -0
- data/Gemfile +29 -0
- data/LICENSE.adoc +31 -0
- data/README.md +3 -0
- data/Rakefile +116 -0
- data/bin/console +14 -0
- data/bin/interscript +5 -0
- data/bin/maps_analyze_staging +168 -0
- data/bin/maps_debug_compilers +58 -0
- data/bin/maps_debug_ordering +88 -0
- data/bin/maps_debug_ruby_compile +24 -0
- data/bin/maps_debug_step_by_step +44 -0
- data/bin/maps_optimize_order +112 -0
- data/bin/maps_v1_analyze_regexps +45 -0
- data/bin/maps_v1_to_v2 +426 -0
- data/bin/setup +8 -0
- data/exe/interscript +6 -0
- data/interscript.gemspec +31 -0
- data/lib/interscript.rb +83 -133
- data/lib/interscript/command.rb +5 -5
- data/lib/interscript/compiler.rb +22 -0
- data/lib/interscript/compiler/javascript.rb +292 -0
- data/lib/interscript/compiler/ruby.rb +262 -0
- data/lib/interscript/dsl.rb +68 -0
- data/lib/interscript/dsl/aliases.rb +23 -0
- data/lib/interscript/dsl/document.rb +46 -0
- data/lib/interscript/dsl/group.rb +45 -0
- data/lib/interscript/dsl/group/parallel.rb +6 -0
- data/lib/interscript/dsl/items.rb +89 -0
- data/lib/interscript/dsl/metadata.rb +68 -0
- data/lib/interscript/dsl/stage.rb +6 -0
- data/lib/interscript/dsl/symbol_mm.rb +11 -0
- data/lib/interscript/dsl/tests.rb +12 -0
- data/lib/interscript/interpreter.rb +251 -0
- data/lib/interscript/node.rb +25 -0
- data/lib/interscript/node/alias_def.rb +15 -0
- data/lib/interscript/node/dependency.rb +13 -0
- data/lib/interscript/node/document.rb +45 -0
- data/lib/interscript/node/group.rb +34 -0
- data/lib/interscript/node/group/parallel.rb +9 -0
- data/lib/interscript/node/group/sequential.rb +2 -0
- data/lib/interscript/node/item.rb +52 -0
- data/lib/interscript/node/item/alias.rb +42 -0
- data/lib/interscript/node/item/any.rb +76 -0
- data/lib/interscript/node/item/capture.rb +50 -0
- data/lib/interscript/node/item/group.rb +51 -0
- data/lib/interscript/node/item/repeat.rb +40 -0
- data/lib/interscript/node/item/stage.rb +23 -0
- data/lib/interscript/node/item/string.rb +51 -0
- data/lib/interscript/node/metadata.rb +18 -0
- data/lib/interscript/node/rule.rb +6 -0
- data/lib/interscript/node/rule/funcall.rb +18 -0
- data/lib/interscript/node/rule/run.rb +15 -0
- data/lib/interscript/node/rule/sub.rb +68 -0
- data/lib/interscript/node/stage.rb +19 -0
- data/lib/interscript/node/tests.rb +15 -0
- data/lib/interscript/stdlib.rb +211 -0
- data/lib/interscript/utils/regexp_converter.rb +283 -0
- data/lib/interscript/version.rb +1 -1
- data/lib/interscript/visualize.rb +61 -0
- data/lib/interscript/visualize/group.html.erb +59 -0
- data/lib/interscript/visualize/json.rb +57 -0
- data/lib/interscript/visualize/map.html.erb +46 -0
- data/lib/interscript/visualize/nodes.rb +89 -0
- data/requirements.txt +1 -0
- metadata +78 -416
- data/README.adoc +0 -298
- data/lib/g2pwrapper.py +0 -34
- data/lib/interscript/fs.rb +0 -69
- data/lib/interscript/mapping.rb +0 -142
- data/lib/interscript/opal.rb +0 -57
- data/lib/interscript/opal/entrypoint.rb +0 -12
- data/lib/interscript/opal/map_translate.rb +0 -7
- data/lib/interscript/opal/maps.js.erb +0 -10
- data/lib/model-7 +0 -0
- data/lib/tha-pt-b-7 +0 -0
- data/maps/acadsin-zho-Hani-Latn-2002.yaml +0 -38916
- data/maps/alalc-amh-Ethi-Latn-1997.yaml +0 -513
- data/maps/alalc-amh-Ethi-Latn-2011.yaml +0 -138
- data/maps/alalc-ara-Arab-Latn-1997.yaml +0 -1287
- data/maps/alalc-asm-Deva-Latn-1997.yaml +0 -165
- data/maps/alalc-asm-Deva-Latn-2012.yaml +0 -40
- data/maps/alalc-aze-Cyrl-Latn-1997.yaml +0 -145
- data/maps/alalc-bel-Cyrl-Latn-1997.yaml +0 -129
- data/maps/alalc-ben-Beng-Latn-2017.yaml +0 -130
- data/maps/alalc-bul-Cyrl-Latn-1997.yaml +0 -98
- data/maps/alalc-ell-Grek-Latn-1997.yaml +0 -628
- data/maps/alalc-ell-Grek-Latn-2010.yaml +0 -626
- data/maps/alalc-guj-Gujr-Latn-1997.yaml +0 -266
- data/maps/alalc-guj-Gujr-Latn-2011.yaml +0 -64
- data/maps/alalc-hin-Deva-Latn-1997.yaml +0 -211
- data/maps/alalc-hin-Deva-Latn-2011.yaml +0 -47
- data/maps/alalc-kat-Geok-Latn-1997.yaml +0 -111
- data/maps/alalc-kat-Geor-Latn-1997.yaml +0 -150
- data/maps/alalc-kor-Hang-Latn-1997.yaml +0 -98
- data/maps/alalc-mal-Mlym-Latn-1997.yaml +0 -303
- data/maps/alalc-mal-Mlym-Latn-2012.yaml +0 -73
- data/maps/alalc-mar-Deva-Latn-1997.yaml +0 -189
- data/maps/alalc-mar-Deva-Latn-2011.yaml +0 -45
- data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +0 -114
- data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +0 -103
- data/maps/alalc-mon-Cyrl-Latn-1997.yaml +0 -220
- data/maps/alalc-pan-Guru-Latn-1997.yaml +0 -256
- data/maps/alalc-pan-Guru-Latn-2011.yaml +0 -78
- data/maps/alalc-per-Arab-Latn-1997.yaml +0 -375
- data/maps/alalc-pli-Deva-Latn-2012.yaml +0 -144
- data/maps/alalc-pra-Deva-Latn-2012.yaml +0 -47
- data/maps/alalc-rus-Cyrl-Latn-1997.yaml +0 -225
- data/maps/alalc-rus-Cyrl-Latn-2012.yaml +0 -162
- data/maps/alalc-san-Deva-Latn-2012.yaml +0 -172
- data/maps/alalc-sin-Sinh-Latn-1997.yaml +0 -292
- data/maps/alalc-sin-Sinh-Latn-2011.yaml +0 -71
- data/maps/alalc-srp-Cyrl-Latn-1997.yaml +0 -118
- data/maps/alalc-srp-Cyrl-Latn-2013.yaml +0 -135
- data/maps/alalc-tam-Taml-Latn-1997.yaml +0 -62
- data/maps/alalc-tam-Taml-Latn-2011.yaml +0 -58
- data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +0 -145
- data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +0 -16
- data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +0 -283
- data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +0 -174
- data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +0 -169
- data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +0 -292
- data/maps/bgn-kor-Hang-Latn-1943.yaml +0 -35
- data/maps/bgn-kor-Kore-Latn-1943.yaml +0 -31
- data/maps/bgna-bul-Cyrl-Latn-2006.yaml +0 -208
- data/maps/bgna-bul-Cyrl-Latn-2009.yaml +0 -208
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +0 -532
- data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +0 -596
- data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +0 -108
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +0 -104
- data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +0 -188
- data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +0 -289
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +0 -119
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +0 -42
- data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +0 -184
- data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +0 -705
- data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +0 -23
- data/maps/bgnpcgn-fas-Arab-Latn-1956.yaml +0 -96
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +0 -257
- data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +0 -131
- data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +0 -42
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +0 -253
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +0 -48
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +0 -48
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +0 -163
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +0 -190
- data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +0 -223
- data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +0 -230
- data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +0 -336
- data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +0 -639
- data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +0 -459
- data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +0 -168
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +0 -318
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +0 -170
- data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +0 -220
- data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +0 -240
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +0 -166
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +0 -119
- data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +0 -127
- data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +0 -82
- data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +0 -7456
- data/maps/bis-asm-Beng-Latn-13194-1991.yaml +0 -159
- data/maps/bis-ben-Beng-Latn-13194-1991.yaml +0 -156
- data/maps/bis-dev-Deva-Latn-13194-1991.yaml +0 -184
- data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +0 -181
- data/maps/bis-knd-Knda-Latn-13194-1991.yaml +0 -173
- data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +0 -176
- data/maps/bis-ori-Orya-Latn-13194-1991.yaml +0 -160
- data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +0 -175
- data/maps/bis-tel-Telu-Latn-13194-1991.yaml +0 -170
- data/maps/bis-tml-Taml-Latn-13194-1991.yaml +0 -155
- data/maps/by-bel-Cyrl-Latn-1998.yaml +0 -172
- data/maps/by-bel-Cyrl-Latn-2007.yaml +0 -115
- data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +0 -899
- data/maps/din-hin-Deva-Latn-33904-2018.yaml +0 -100
- data/maps/din-kat-Geor-Latn-32707-2010.yaml +0 -145
- data/maps/din-mar-Deva-Latn-33904-2018.yaml +0 -84
- data/maps/din-nep-Deva-Latn-33904-2018.yaml +0 -119
- data/maps/din-pli-Deva-Latn-33904-2018.yaml +0 -75
- data/maps/din-pra-Deva-Latn-33904-2018.yaml +0 -63
- data/maps/din-san-Deva-Latn-33904-2018.yaml +0 -338
- data/maps/din-tam-Taml-Latn-33903-2016.yaml +0 -213
- data/maps/dos-nep-Deva-Latn-1997.yaml +0 -47
- data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +0 -684
- data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +0 -680
- data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +0 -19
- data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +0 -31
- data/maps/ggg-kat-Geor-Latn-2002.yaml +0 -92
- data/maps/gki-bel-Cyrl-Latn-1992.yaml +0 -33
- data/maps/gki-bel-Cyrl-Latn-2000.yaml +0 -201
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +0 -190
- data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +0 -157
- data/maps/hk-yue-Hani-Latn-1888.yaml +0 -38497
- data/maps/icao-bel-Cyrl-Latn-9303.yaml +0 -136
- data/maps/icao-bul-Cyrl-Latn-9303.yaml +0 -118
- data/maps/icao-fas-Arab-Latn-9303.yaml +0 -103
- data/maps/icao-heb-Hebr-Latn-9303.yaml +0 -151
- data/maps/icao-mkd-Cyrl-Latn-9303.yaml +0 -117
- data/maps/icao-rus-Cyrl-Latn-9303.yaml +0 -117
- data/maps/icao-srp-Cyrl-Latn-9303.yaml +0 -117
- data/maps/icao-ukr-Cyrl-Latn-9303.yaml +0 -119
- data/maps/iso-ara-Arab-Latn-233-1984.yaml +0 -323
- data/maps/iso-asm-Beng-Latn-15919-2001.yaml +0 -75
- data/maps/iso-ben-Beng-Latn-15919-2001.yaml +0 -175
- data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +0 -613
- data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +0 -44
- data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +0 -220
- data/maps/iso-hin-Deva-Latn-15919-2001.yaml +0 -87
- data/maps/iso-inc-Deva-Latn-15919-2001.yaml +0 -61
- data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +0 -66
- data/maps/iso-kan-Knda-Latn-15919-2001.yaml +0 -220
- data/maps/iso-kat-Geor-Latn-9984-1996.yaml +0 -145
- data/maps/iso-kor-Hang-Latn-1996-method1.yaml +0 -240
- data/maps/iso-kor-Hang-Latn-1996-method2.yaml +0 -226
- data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +0 -281
- data/maps/iso-mar-Deva-Latn-15919-2001.yaml +0 -75
- data/maps/iso-nep-Deva-Latn-15919-2001.yaml +0 -87
- data/maps/iso-ori-Orya-Latn-15919-2001.yaml +0 -193
- data/maps/iso-pan-Guru-Latn-15919-2001.yaml +0 -222
- data/maps/iso-pli-Beng-Latn-15919-2001.yaml +0 -73
- data/maps/iso-pli-Deva-Latn-15919-2001.yaml +0 -74
- data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +0 -219
- data/maps/iso-pli-Thai-Latn-15919-2001.yaml +0 -55
- data/maps/iso-pra-Deva-Latn-15919-2001.yaml +0 -59
- data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +0 -366
- data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +0 -271
- data/maps/iso-san-Deva-Latn-15919-2001.yaml +0 -220
- data/maps/iso-tam-Taml-Latn-15919-2001.yaml +0 -159
- data/maps/iso-tel-Telu-Latn-15919-2001.yaml +0 -220
- data/maps/iso-tha-Thai-Latn-11940-1998.yaml +0 -109
- data/maps/kp-kor-Hang-Latn-2002.yaml +0 -909
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +0 -44820
- data/maps/mext-jpn-Hrkt-Latn-1954.yaml +0 -411
- data/maps/mns-mon-Cyrl-Latn-5217-2012.yaml +0 -163
- data/maps/mns-mon-Latn-Cyrl-5217-2012.yaml +0 -200
- data/maps/moct-kor-Hang-Latn-2000.yaml +0 -807
- data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +0 -541
- data/maps/mvd-bel-Cyrl-Latn-2008.yaml +0 -225
- data/maps/mvd-bel-Cyrl-Latn-2010.yaml +0 -63
- data/maps/mvd-rus-Cyrl-Latn-2008.yaml +0 -109
- data/maps/mvd-rus-Cyrl-Latn-2010.yaml +0 -37
- data/maps/odni-ara-Arab-Latn-2015.yaml +0 -425
- data/maps/odni-aze-Cyrl-Latn-2015.yaml +0 -144
- data/maps/odni-bel-Cyrl-Latn-2015.yaml +0 -148
- data/maps/odni-bul-Cyrl-Latn-2015.yaml +0 -96
- data/maps/odni-che-Cyrl-Latn-2015.yaml +0 -169
- data/maps/odni-fas-Arab-Latn-2015.yaml +0 -406
- data/maps/odni-hin-Deva-Latn-2015.yaml +0 -258
- data/maps/odni-kat-Geor-Latn-2015.yaml +0 -87
- data/maps/odni-kaz-Cyrl-Latn-2015.yaml +0 -148
- data/maps/odni-kir-Cyrl-Latn-2015.yaml +0 -136
- data/maps/odni-kor-Hang-Latn-2015.yaml +0 -375
- data/maps/odni-mkd-Cyrl-Latn-2015.yaml +0 -122
- data/maps/odni-per-Arab-Latn-2015.yaml +0 -228
- data/maps/odni-rus-Cyrl-Latn-2015.yaml +0 -77
- data/maps/odni-srp-Cyrl-Latn-2015.yaml +0 -129
- data/maps/odni-tat-Cyrl-Latn-2015.yaml +0 -142
- data/maps/odni-tgk-Cyrl-Latn-2015.yaml +0 -148
- data/maps/odni-uig-Cyrl-Latn-2015.yaml +0 -138
- data/maps/odni-ukr-Cyrl-Latn-2015.yaml +0 -157
- data/maps/odni-urd-Arab-Latn-2015.yaml +0 -221
- data/maps/odni-uzb-Cyrl-Latn-2015.yaml +0 -166
- data/maps/royin-tha-Thai-Latn-1939-generic.yaml +0 -90
- data/maps/royin-tha-Thai-Latn-1968.yaml +0 -183
- data/maps/royin-tha-Thai-Latn-1999-chained.yaml +0 -180
- data/maps/royin-tha-Thai-Latn-1999.yaml +0 -80
- data/maps/sac-zho-Hans-Latn-1979.yaml +0 -24763
- data/maps/sasm-mon-Mong-Latn-general-1978.yaml +0 -389
- data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +0 -354
- data/maps/ses-ara-Arab-Latn-1930.yaml +0 -283
- data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +0 -222
- data/maps/ua-ukr-Cyrl-Latn-1996.yaml +0 -197
- data/maps/ua-ukr-Cyrl-Latn-2007.yaml +0 -75
- data/maps/ua-ukr-Cyrl-Latn-2010.yaml +0 -192
- data/maps/un-amh-Ethi-Latn-2016.yaml +0 -602
- data/maps/un-ara-Arab-Latn-1971.yaml +0 -139
- data/maps/un-ara-Arab-Latn-1972.yaml +0 -159
- data/maps/un-ara-Arab-Latn-2017.yaml +0 -420
- data/maps/un-bel-Cyrl-Latn-2007.yaml +0 -114
- data/maps/un-ben-Beng-Latn-2016.yaml +0 -534
- data/maps/un-ell-Grek-Latn-1987-phonetic.yaml +0 -780
- data/maps/un-ell-Grek-Latn-1987-tl.yaml +0 -31
- data/maps/un-ell-Grek-Latn-1987-ts.yaml +0 -19
- data/maps/un-hin-Deva-Latn-2016.yaml +0 -222
- data/maps/un-mar-Deva-Latn-2016.yaml +0 -91
- data/maps/un-mon-Mong-Latn-general-2013.yaml +0 -264
- data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +0 -264
- data/maps/un-nep-Deva-Latn-1972.yaml +0 -350
- data/maps/un-nep-Deva-Latn-2013.yaml +0 -74
- data/maps/un-rus-Cyrl-Latn-1987.yaml +0 -166
- data/maps/un-ukr-Cyrl-Latn-1998.yaml +0 -53
- data/maps/un-ukr-Cyrl-Latn-2012.yaml +0 -162
- data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +0 -221
- data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +0 -406
- data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +0 -386
- data/maps/var-kor-Hang-Hang-jamo.yaml +0 -11193
- data/maps/var-kor-Hang-Latn-mr-1939.yaml +0 -1054
- data/maps/var-kor-Kore-Hang-2013.yaml +0 -59754
- data/maps/var-kor-Kore-Latn-mr-1939.yaml +0 -36
- data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +0 -43
- data/maps/var-mon-Mong-Latn-1930.yaml +0 -102
- data/maps/var-mon-Mong-Latn-lessing.yaml +0 -272
- data/maps/var-mon-Mong-Latn-vpmc.yaml +0 -274
- data/maps/var-pra-Deva-Latn-iast-1912.yaml +0 -30
- data/maps/var-san-Deva-Latn-iast-1912.yaml +0 -149
- data/maps/var-tha-Thai-Thai-phonemic.yaml +0 -59
- data/maps/var-tha-Thai-Zsym-ipa.yaml +0 -301
- data/maps/var-zho-Hani-Latn-wd-1979.yaml +0 -38912
- data/spec/interscript/filenames_spec.rb +0 -384
- data/spec/interscript/mapping_spec.rb +0 -42
- data/spec/interscript_spec.rb +0 -29
- data/spec/spec_helper.rb +0 -3
|
@@ -1,190 +0,0 @@
|
|
|
1
|
-
---
|
|
2
|
-
authority_id: bgnpcgn
|
|
3
|
-
id: 2013
|
|
4
|
-
language: iso-639-2:mkd
|
|
5
|
-
source_script: Cyrl
|
|
6
|
-
destination_script: Latn
|
|
7
|
-
name: Macedonian Romanization, BGN/PCGN 2013 System
|
|
8
|
-
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/811514/ROMANIZATION_OF_MACEDONIAN.pdf
|
|
9
|
-
creation_date: 2013
|
|
10
|
-
description: |
|
|
11
|
-
Macedonian was officially established as a written language in Yugoslavia during
|
|
12
|
-
World War II and is now the official language of North Macedonia.
|
|
13
|
-
This romanization system replaces the BGN/PCGN 1981 agreement and adheres
|
|
14
|
-
to the most widely-accepted standardization of Macedonian orthography.
|
|
15
|
-
|
|
16
|
-
notes:
|
|
17
|
-
- The Macedonian Cyrillic lowercase italic Д may sometimes be seen as g.
|
|
18
|
-
There is no specific Unicode encoding for this variant form so a comparable character
|
|
19
|
-
has been used here for illustrative purposes.
|
|
20
|
-
- The Macedonian Cyrillic lowercase italic Ѓ may sometimes be seen as ī.
|
|
21
|
-
There is no specific Unicode encoding for this variant form so a comparable character
|
|
22
|
-
has been used here for illustrative purposes.
|
|
23
|
-
- The Macedonian Cyrillic lowercase italic П may sometimes be seen as ū.
|
|
24
|
-
There is no specific Unicode encoding for this variant form so a comparable character
|
|
25
|
-
has been used here for illustrative purposes.
|
|
26
|
-
- The Macedonian Cyrillic lowercase italic Т may sometimes be seen as w̄.
|
|
27
|
-
There is no specific Unicode encoding for this variant form so a comparable character
|
|
28
|
-
has been used here for illustrative purposes.
|
|
29
|
-
- |
|
|
30
|
-
An inventory of letter-diacritic combinations, with their Unicode encoding,
|
|
31
|
-
in addition to the unmodified letters of the basic Roman script is:
|
|
32
|
-
| Ǵ (U+01F4) | ǵ (U+01F5) |
|
|
33
|
-
| Ž (U+017D) | ž (U+017E) |
|
|
34
|
-
| Dz (U+01F2)* | dz (U+01F3)* |
|
|
35
|
-
| Lj (U+01C8)* | lj (U+01C9)* |
|
|
36
|
-
| Nj (U+01CB)* | nj (U+01CC)* |
|
|
37
|
-
| Ḱ (U+1E30) | ḱ (U+1E31) |
|
|
38
|
-
| Č (U+010C) | č (U+010D) |
|
|
39
|
-
| Dž (U+01C5)* | dž (U+01C6)* |
|
|
40
|
-
| Š (U+0160) | š (U+0161) |
|
|
41
|
-
* Note that these characters can also be reproduced with individual letters (e.g. l+j).
|
|
42
|
-
- The Romanization column shows only lowercase forms but, when romanizing,
|
|
43
|
-
uppercase and lowercase Roman letters as appropriate should be used.
|
|
44
|
-
|
|
45
|
-
tests:
|
|
46
|
-
- source: Ѓенови Ливаѓе
|
|
47
|
-
expected: Ǵenovi Livaǵe
|
|
48
|
-
- source: ЛУЃЕ луѓе
|
|
49
|
-
expected: LUǴE luǵe
|
|
50
|
-
- source: ЅВЕЗДА ѕвезда Ѕвезда
|
|
51
|
-
expected: DZVEZDA dzvezda Dzvezda
|
|
52
|
-
- source: Јабежица
|
|
53
|
-
expected: Jabežica
|
|
54
|
-
- source: Љиќен и Бард
|
|
55
|
-
expected: Ljiḱen i Bard
|
|
56
|
-
- source: Ќамилов Чукар
|
|
57
|
-
expected: Ḱamilov Čukar
|
|
58
|
-
- source: Џавидин Кајнак
|
|
59
|
-
expected: Džavidin Kajnak
|
|
60
|
-
- source: Џамалџи
|
|
61
|
-
expected: Džamaldži
|
|
62
|
-
- source: Џибра Гури и Зи
|
|
63
|
-
expected: Džibra Guri i Zi
|
|
64
|
-
- source: Абазова Куќарица
|
|
65
|
-
expected: Abazova Kuḱarica
|
|
66
|
-
- source: Баба Анѓина Маала
|
|
67
|
-
expected: Baba Anǵina Maala
|
|
68
|
-
- source: Ваљановец
|
|
69
|
-
expected: Valjanovec
|
|
70
|
-
- source: Галал Једи Дереш
|
|
71
|
-
expected: Galal Jedi Dereš
|
|
72
|
-
- source: Дванаесет Клајнци
|
|
73
|
-
expected: Dvanaeset Klajnci
|
|
74
|
-
- source: Електродистрибуција Струга
|
|
75
|
-
expected: Elektrodistribucija Struga
|
|
76
|
-
- source: Железничка Станица Рајко Жинзифов
|
|
77
|
-
expected: Železnička Stanica Rajko Žinzifov
|
|
78
|
-
- source: Заедничко Речиште
|
|
79
|
-
expected: Zaedničko Rečište
|
|
80
|
-
- source: Испраена Плоча
|
|
81
|
-
expected: Ispraena Ploča
|
|
82
|
-
- source: Казнено-Поправна Установа Идризово
|
|
83
|
-
expected: Kazneno-Popravna Ustanova Idrizovo
|
|
84
|
-
- source: Лази и Зејнелит
|
|
85
|
-
expected: Lazi i Zejnelit
|
|
86
|
-
- source: Мавровско Езеро
|
|
87
|
-
expected: Mavrovsko Ezero
|
|
88
|
-
- source: Национален Парк Галичица
|
|
89
|
-
expected: Nacionalen Park Galičica
|
|
90
|
-
- source: Одморалиште Свети Стефан
|
|
91
|
-
expected: Odmoralište Sveti Stefan
|
|
92
|
-
- source: Планинарски Дом Караџица
|
|
93
|
-
expected: Planinarski Dom Karadžica
|
|
94
|
-
- source: Раса е Лисењит
|
|
95
|
-
expected: Rasa e Lisenjit
|
|
96
|
-
- source: Скочивирска Клисура
|
|
97
|
-
expected: Skočivirska Klisura
|
|
98
|
-
- source: Термо-електроцентрала Неготино
|
|
99
|
-
expected: Termo-elektrocentrala Negotino
|
|
100
|
-
- source: Узуновско Бресје
|
|
101
|
-
expected: Uzunovsko Bresje
|
|
102
|
-
- source: Фабрика Југохром
|
|
103
|
-
expected: Fabrika Jugohrom
|
|
104
|
-
- source: Хидроелектрана Сапунџица
|
|
105
|
-
expected: Hidroelektrana Sapundžica
|
|
106
|
-
- source: Цветковско Рамниште
|
|
107
|
-
expected: Cvetkovsko Ramnište
|
|
108
|
-
- source: Чалтанова Пештера
|
|
109
|
-
expected: Čaltanova Peštera
|
|
110
|
-
- source: Шкемби Вишнејц
|
|
111
|
-
expected: Škembi Višnejc
|
|
112
|
-
|
|
113
|
-
map:
|
|
114
|
-
postrules:
|
|
115
|
-
# DZ
|
|
116
|
-
- pattern: "((?<=[[:upper:]])Dz(?=[[:upper:]])?|(?<=[[:upper:]])?Dz(?=[[:upper:]]))"
|
|
117
|
-
result: "DZ"
|
|
118
|
-
#LJ
|
|
119
|
-
- pattern: "((?<=[[:upper:]])Lj(?=[[:upper:]])?|(?<=[[:upper:]])?Lj(?=[[:upper:]]))"
|
|
120
|
-
result: "LJ"
|
|
121
|
-
#NJ
|
|
122
|
-
- pattern: "((?<=[[:upper:]])Nj(?=[[:upper:]])?|(?<=[[:upper:]])?Nj(?=[[:upper:]]))"
|
|
123
|
-
result: "NJ"
|
|
124
|
-
#DŽ
|
|
125
|
-
- pattern: "((?<=[[:upper:]])Dž(?=[[:upper:]])?|(?<=[[:upper:]])?Dž(?=[[:upper:]]))"
|
|
126
|
-
result: "DŽ"
|
|
127
|
-
|
|
128
|
-
characters:
|
|
129
|
-
"\u0410": "A"
|
|
130
|
-
"\u0411": "B"
|
|
131
|
-
"\u0412": "V"
|
|
132
|
-
"\u0413": "G"
|
|
133
|
-
"\u0414": "D"
|
|
134
|
-
"\u0403": "\u01F4" # Ǵ
|
|
135
|
-
"\u0415": "E"
|
|
136
|
-
"\u0416": "\u005a\u030c" # Ž
|
|
137
|
-
"\u0417": "Z"
|
|
138
|
-
"\u0405": "Dz"
|
|
139
|
-
"\u0418": "I"
|
|
140
|
-
"\u0408": "J"
|
|
141
|
-
"\u041A": "K"
|
|
142
|
-
"\u041B": "L"
|
|
143
|
-
"\u0409": "Lj"
|
|
144
|
-
"\u041C": "M"
|
|
145
|
-
"\u041D": "N"
|
|
146
|
-
"\u040A": "Nj"
|
|
147
|
-
"\u041E": "O"
|
|
148
|
-
"\u041F": "P"
|
|
149
|
-
"\u0420": "R"
|
|
150
|
-
"\u0421": "S"
|
|
151
|
-
"\u0422": "T"
|
|
152
|
-
"\u040C": "\u004b\u0301" # Ḱ
|
|
153
|
-
"\u0423": "U"
|
|
154
|
-
"\u0424": "F"
|
|
155
|
-
"\u0425": "H"
|
|
156
|
-
"\u0426": "C"
|
|
157
|
-
"\u0427": "\u0043\u030c" # Č
|
|
158
|
-
"\u040F": "D\u007a\u030c" # Dž
|
|
159
|
-
"\u0428": "\u0053\u030c" # Š
|
|
160
|
-
"\u0430": "a"
|
|
161
|
-
"\u0431": "b"
|
|
162
|
-
"\u0432": "v"
|
|
163
|
-
"\u0433": "g"
|
|
164
|
-
"\u0434": "d"
|
|
165
|
-
"\u0453": "\u01F5" # ǵ
|
|
166
|
-
"\u0435": "e"
|
|
167
|
-
"\u0436": "\u007a\u030c" # ž
|
|
168
|
-
"\u0437": "z"
|
|
169
|
-
"\u0455": "dz"
|
|
170
|
-
"\u0438": "i"
|
|
171
|
-
"\u0458": "j"
|
|
172
|
-
"\u043A": "k"
|
|
173
|
-
"\u043B": "l"
|
|
174
|
-
"\u0459": "lj"
|
|
175
|
-
"\u043C": "m"
|
|
176
|
-
"\u043D": "n"
|
|
177
|
-
"\u045A": "nj"
|
|
178
|
-
"\u043E": "o"
|
|
179
|
-
"\u043F": "p"
|
|
180
|
-
"\u0440": "r"
|
|
181
|
-
"\u0441": "s"
|
|
182
|
-
"\u0442": "t"
|
|
183
|
-
"\u045C": "\u1E31" # ḱ
|
|
184
|
-
"\u0443": "u"
|
|
185
|
-
"\u0444": "f"
|
|
186
|
-
"\u0445": "h"
|
|
187
|
-
"\u0446": "c"
|
|
188
|
-
"\u0447": "\u0063\u030c" # č
|
|
189
|
-
"\u045F": "d\u007a\u030c" # dž
|
|
190
|
-
"\u0448": "\u0073\u030c" # š
|
|
@@ -1,223 +0,0 @@
|
|
|
1
|
-
---
|
|
2
|
-
authority_id: bgnpcgn
|
|
3
|
-
id: 1964
|
|
4
|
-
language: iso-639-2:mon
|
|
5
|
-
source_script: Cyrl
|
|
6
|
-
destination_script: Latn
|
|
7
|
-
name: BGN/PCGN 1964 System
|
|
8
|
-
alias:
|
|
9
|
-
ogc11122:
|
|
10
|
-
code: mon_Cyrl2Latn_BGN_1964
|
|
11
|
-
description: Mongolian US Board on Geographic Names(BGN)/Permanent Committee on Geographical Names for British Official Use(PCGN) 1964 System
|
|
12
|
-
url: https://github.com/interscript/interscript/files/5180767/BGN_Romanization_Guide_1964_mongolian_1964.pdf
|
|
13
|
-
creation_date:
|
|
14
|
-
confirmation_date:
|
|
15
|
-
description: |
|
|
16
|
-
This system was originated by the PCGN in 1957 and adopted as a
|
|
17
|
-
BGN/PCGN System in 1964. It is intended for use in the romanization of
|
|
18
|
-
geographic names in the "Mongolian People's Republic" but not to romanize
|
|
19
|
-
Mongolian names in adjacent parts of China and the U.S.S.R.
|
|
20
|
-
|
|
21
|
-
notes: |
|
|
22
|
-
- b occurs initially and after л, м, and б.
|
|
23
|
-
- v occurs medially in Mongolian words and initially in foreign words.
|
|
24
|
-
- y occurs only as the second element of diphthongs.
|
|
25
|
-
- k, p, f, and shch occur in foreign words only.
|
|
26
|
-
- "\u2019" occurs only in Russian words.
|
|
27
|
-
- ï occurs only in suffixes to words containing back vowels (a, o, and u).
|
|
28
|
-
- In monosyllables yu or yü depending on pronunciation; in polysyllables yu when followed by a, o, or u, but yü when followed by i, e, ö, or ü.
|
|
29
|
-
|
|
30
|
-
tests:
|
|
31
|
-
- source: Эрдэнэт Сум
|
|
32
|
-
expected: Erdenet Sum
|
|
33
|
-
- source: Эрдэнэт
|
|
34
|
-
expected: Erdenet
|
|
35
|
-
- source: Эрдэнэ
|
|
36
|
-
expected: Erdene
|
|
37
|
-
- source: Шивээговь Сум
|
|
38
|
-
expected: Shiveegovĭ Sum
|
|
39
|
-
- source: Шивээговь
|
|
40
|
-
expected: Shiveegovĭ
|
|
41
|
-
- source: Шарынгол Сум
|
|
42
|
-
expected: Sharïngol Sum
|
|
43
|
-
- source: Шарынгол
|
|
44
|
-
expected: Sharïngol
|
|
45
|
-
- source: Цагааннуур
|
|
46
|
-
expected: Tsagaannuur
|
|
47
|
-
- source: Хонгор Сум
|
|
48
|
-
expected: Hongor Sum
|
|
49
|
-
- source: Хонгор
|
|
50
|
-
expected: Hongor
|
|
51
|
-
- source: Хайлаастай
|
|
52
|
-
expected: Haylaastay
|
|
53
|
-
- source: Түнэл Сум
|
|
54
|
-
expected: Tünel Sum
|
|
55
|
-
- source: Түнэл
|
|
56
|
-
expected: Tünel
|
|
57
|
-
- source: Сүхбаатар
|
|
58
|
-
expected: Sühbaatar
|
|
59
|
-
- source: Сүмбэр Сум
|
|
60
|
-
expected: Sümber Sum
|
|
61
|
-
- source: Сүмбэр
|
|
62
|
-
expected: Sümber
|
|
63
|
-
- source: Сайншанд Сум
|
|
64
|
-
expected: Saynshand Sum
|
|
65
|
-
- source: Сайншанд
|
|
66
|
-
expected: Saynshand
|
|
67
|
-
- source: Орхон Сум
|
|
68
|
-
expected: Orhon Sum
|
|
69
|
-
- source: Орхон
|
|
70
|
-
expected: Orhon
|
|
71
|
-
- source: Нарст
|
|
72
|
-
expected: Narst
|
|
73
|
-
- source: Мөрөн Сум
|
|
74
|
-
expected: Mörön Sum
|
|
75
|
-
- source: Мөрөн
|
|
76
|
-
expected: Mörön
|
|
77
|
-
- source: Зүүнхөвөө
|
|
78
|
-
expected: Dzüünhövöö
|
|
79
|
-
- source: Жаргалант Сум
|
|
80
|
-
expected: Jargalant Sum
|
|
81
|
-
- source: Жаргалант
|
|
82
|
-
expected: Jargalant
|
|
83
|
-
- source: Дархан Сум
|
|
84
|
-
expected: Darhan Sum
|
|
85
|
-
- source: Даланзадгад Сум
|
|
86
|
-
expected: Dalandzadgad Sum
|
|
87
|
-
- source: Даланзадгад
|
|
88
|
-
expected: Dalandzadgad
|
|
89
|
-
- source: Давст Сум
|
|
90
|
-
expected: Davst Sum
|
|
91
|
-
- source: Давст
|
|
92
|
-
expected: Davst
|
|
93
|
-
- source: Говьсүмбэр Сум
|
|
94
|
-
expected: Govĭsümber Sum
|
|
95
|
-
- source: Говь
|
|
96
|
-
expected: Govĭ
|
|
97
|
-
- source: Буга
|
|
98
|
-
expected: Buga
|
|
99
|
-
- source: Бор-Өндөр Сум
|
|
100
|
-
expected: Bor-Öndör Sum
|
|
101
|
-
- source: Бор-Өндөр
|
|
102
|
-
expected: Bor-Öndör
|
|
103
|
-
- source: Баянхонгор
|
|
104
|
-
expected: Bayanhongor
|
|
105
|
-
- source: Баянтал
|
|
106
|
-
expected: Bayantal
|
|
107
|
-
- source: Баяндэлгэр Сум
|
|
108
|
-
expected: Bayandelger Sum
|
|
109
|
-
- source: Баяндэлгэр
|
|
110
|
-
expected: Bayandelger
|
|
111
|
-
- source: Баян-Өндөр Сум
|
|
112
|
-
expected: Bayan-Öndör Sum
|
|
113
|
-
- source: Баруун-Урт Сум
|
|
114
|
-
expected: Baruun-Urt Sum
|
|
115
|
-
- source: Баруун-Урт
|
|
116
|
-
expected: Baruun-Urt
|
|
117
|
-
- source: Архуст
|
|
118
|
-
expected: Arhust
|
|
119
|
-
- source: Арвайхээр Сум
|
|
120
|
-
expected: Arvayheer Sum
|
|
121
|
-
- source: Арвайхээр
|
|
122
|
-
expected: Arvayheer
|
|
123
|
-
- source: Есөнбулаг Сум
|
|
124
|
-
expected: Yösönbulag Sum
|
|
125
|
-
- source: Ерөө Сум
|
|
126
|
-
expected: Yöröö Sum
|
|
127
|
-
- source: Есөнзүйл Сум
|
|
128
|
-
expected: Yösöndzüyl Sum
|
|
129
|
-
- source: Ноён Сум
|
|
130
|
-
expected: Noyon Sum
|
|
131
|
-
- source: Родник Балянгийн-Булак
|
|
132
|
-
expected: Rodnik Balyangiyn-Bulak
|
|
133
|
-
- source: Замын-Үүд Сум
|
|
134
|
-
expected: Dzamïn-Üüd Sum
|
|
135
|
-
- source: Адаацаг Сум
|
|
136
|
-
expected: Adaatsag Sum
|
|
137
|
-
- source: Чандмань Сум
|
|
138
|
-
expected: Chandmanĭ Sum
|
|
139
|
-
- source: Хяргас Сум
|
|
140
|
-
expected: Hyargas Sum
|
|
141
|
-
|
|
142
|
-
map:
|
|
143
|
-
rules:
|
|
144
|
-
- pattern: \u042e(?=[АаОоУу]) # Ю before а, о, or у
|
|
145
|
-
result: "Yu"
|
|
146
|
-
- pattern: \u044e(?=[АаОоУу]) # ю before а, о, or у
|
|
147
|
-
result: "yu"
|
|
148
|
-
- pattern: \u042e(?=[ИиЭэӨөҮү]) # Ю before и, э, ө, or ү
|
|
149
|
-
result: "Yü"
|
|
150
|
-
- pattern: \u044e(?=[ИиЭэӨөҮү]) # ю before и, э, ө, or ү
|
|
151
|
-
result: "yü"
|
|
152
|
-
|
|
153
|
-
characters:
|
|
154
|
-
"А": "A" # \u0410
|
|
155
|
-
"Б": "B" # \u0411
|
|
156
|
-
"В": "V" # \u0412
|
|
157
|
-
"Г": "G" # \u0413
|
|
158
|
-
"Д": "D" # \u0414
|
|
159
|
-
"Е": "Yö" # \u0415
|
|
160
|
-
"Ё": "Yo" # \u0401
|
|
161
|
-
"Ж": "J" # \u0416
|
|
162
|
-
"З": "Dz" # \u0417
|
|
163
|
-
"И": "I" # \u0418
|
|
164
|
-
"Й": "Y" # \u0419
|
|
165
|
-
"К": "K" # \u041a
|
|
166
|
-
"Л": "L" # \u041b
|
|
167
|
-
"М": "M" # \u041c
|
|
168
|
-
"Н": "N" # \u041d
|
|
169
|
-
"О": "O" # \u041e
|
|
170
|
-
"Ө": "Ö" # \u04e8
|
|
171
|
-
"П": "P" # \u041f
|
|
172
|
-
"Р": "R" # \u0420
|
|
173
|
-
"С": "S" # \u0421
|
|
174
|
-
"Т": "T" # \u0422
|
|
175
|
-
"У": "U" # \u0423
|
|
176
|
-
"Ү": "Ü" # \u04ae
|
|
177
|
-
"Ф": "F" # \u0424
|
|
178
|
-
"Х": "H" # \u0425
|
|
179
|
-
"Ц": "Ts" # \u0426
|
|
180
|
-
"Ч": "Ch" # \u0427
|
|
181
|
-
"Ш": "Sh" # \u0428
|
|
182
|
-
"Щ": "Shch" # \u0429
|
|
183
|
-
"Ъ": "\u2019" # \u042a
|
|
184
|
-
"Ы": "Ï" # \u042b
|
|
185
|
-
"Ь": "Ĭ" # \u042c
|
|
186
|
-
"Э": "E" # \u042d
|
|
187
|
-
"Ю": "Yu" # \u042e
|
|
188
|
-
"Я": "Ya" # \u042f
|
|
189
|
-
"а": "a" # \u0430
|
|
190
|
-
"б": "b" # \u0431
|
|
191
|
-
"в": "v" # \u0432
|
|
192
|
-
"г": "g" # \u0433
|
|
193
|
-
"д": "d" # \u0434
|
|
194
|
-
"е": "yö" # \u0435
|
|
195
|
-
"ё": "yo" # \u0451
|
|
196
|
-
"ж": "j" # \u0436
|
|
197
|
-
"з": "dz" # \u0437
|
|
198
|
-
"и": "i" # \u0438
|
|
199
|
-
"й": "y" # \u0439
|
|
200
|
-
"к": "k" # \u043a
|
|
201
|
-
"л": "l" # \u043b
|
|
202
|
-
"м": "m" # \u043c
|
|
203
|
-
"н": "n" # \u043d
|
|
204
|
-
"о": "o" # \u043e
|
|
205
|
-
"ө": "ö" # \u04e9
|
|
206
|
-
"п": "p" # \u043f
|
|
207
|
-
"р": "r" # \u0440
|
|
208
|
-
"с": "s" # \u0441
|
|
209
|
-
"т": "t" # \u0442
|
|
210
|
-
"у": "u" # \u0443
|
|
211
|
-
"ү": "ü" # \u04af
|
|
212
|
-
"ф": "f" # \u0444
|
|
213
|
-
"х": "h" # \u0445
|
|
214
|
-
"ц": "ts" # \u0446
|
|
215
|
-
"ч": "ch" # \u0447
|
|
216
|
-
"ш": "sh" # \u0448
|
|
217
|
-
"щ": "shch" # \u0449
|
|
218
|
-
"ъ": "\u2019" # \u044a
|
|
219
|
-
"ы": "ï" # \u044b
|
|
220
|
-
"ь": "ĭ" # \u044c
|
|
221
|
-
"э": "e" # \u044d
|
|
222
|
-
"ю": "yu" # \u044e
|
|
223
|
-
"я": "ya" # \u044f
|
|
@@ -1,230 +0,0 @@
|
|
|
1
|
-
---
|
|
2
|
-
authority_id: bgnpcgn
|
|
3
|
-
id: 2020
|
|
4
|
-
language: iso-639-2:nep
|
|
5
|
-
source_script: Deva
|
|
6
|
-
destination_script: Latn
|
|
7
|
-
name: Nepali Romanization, 2020
|
|
8
|
-
url: https://geonames.nga.mil/gns/html/Romanization/ROMANIZATION%20OF%20NEPALI.pdf
|
|
9
|
-
creation_date: 1964
|
|
10
|
-
description: |
|
|
11
|
-
BGN/PCGN 2011 Agreement Romanization of Nepali
|
|
12
|
-
The BGN and the PCGN have adopted the Nepal Survey Department (NSD) system for the
|
|
13
|
-
romanization of Nepali names. This system, below, should be applied to Nepali names for which Roman‐
|
|
14
|
-
script spellings in materials produced by the government of Nepal are not available.
|
|
15
|
-
|
|
16
|
-
notes:
|
|
17
|
-
|
|
18
|
-
- Only the isolated forms of the characters are given in the consonant table. See any grammar of Nepali
|
|
19
|
-
(or other language using the Devanagari alphabet) for variant forms used in conjunct characters.
|
|
20
|
-
- The two consonant characters ड and ढ appear sometimes to represent ṛ (cerebral r), e.g., पहाड → pahāṛ
|
|
21
|
-
instead of pahāḍ. At one time they were written with dots below, i.e., as ड़ and ढ़, though this is no
|
|
22
|
-
longer normal practice in Nepali. The romanizations ṛ and ṛh, respectively, are optional for
|
|
23
|
-
documentary purposes if such dots appear in Nepali writing.
|
|
24
|
-
- व can be romanized as either v or w. This character is primarily
|
|
25
|
-
romanized as v in consonant initial, medial, and final position; however, initial, medial, and final w
|
|
26
|
-
romanizations can occur. The w romanization is a special case which is believed to be dependent on
|
|
27
|
-
dialect, pronunciation, or stress.
|
|
28
|
-
- |
|
|
29
|
-
An inventory of letter‐diacritic combinations, with their Unicode encoding, in addition to the unmodified letters of the basic Roman script is:
|
|
30
|
-
Ṅ (U+1E44) ṅ (U+1E45)
|
|
31
|
-
Ñ (U+00D1) ñ (U+00F1)
|
|
32
|
-
Ṭ (U+1E6C) ṭ (U+1E6D)
|
|
33
|
-
Ḍ (U+1E0C) ḍ (U+1E0D)
|
|
34
|
-
Ṇ (U+1E46) ṇ (U+1E47)
|
|
35
|
-
Ṣ (U+1E62) ṣ (U+1E63)
|
|
36
|
-
Ā (U+0100) ā (U+0101)
|
|
37
|
-
Ī (U+012A) ī (U+012B)
|
|
38
|
-
Ū (U+016A) ū (U+016B)
|
|
39
|
-
Ṛ (U+1E5A) ṛ (U+1E5B)
|
|
40
|
-
|
|
41
|
-
- The Romanization column shows only lowercase forms but, when romanizing, uppercase and lowercase
|
|
42
|
-
Roman letters as appropriate should be used.
|
|
43
|
-
|
|
44
|
-
- |
|
|
45
|
-
ं (anusvara) is rendered by
|
|
46
|
-
ṅ before क, ख, ग, and घ
|
|
47
|
-
ñ before च, छ, ज, and झ
|
|
48
|
-
ṇ before ट, ठ, ड, and ढ
|
|
49
|
-
n before त, थ, द, and ध
|
|
50
|
-
ṁ before य, र, ल, व, श, ष, स and ह
|
|
51
|
-
|
|
52
|
-
tests:
|
|
53
|
-
- source: "लेखन"
|
|
54
|
-
expected: "lekhn"
|
|
55
|
-
- source: "मुद्रा"
|
|
56
|
-
expected: "mudarā"
|
|
57
|
-
- source: "प्रशंसा"
|
|
58
|
-
expected: "parshṃsā" # note 5 rule checking
|
|
59
|
-
- source: "अंक"
|
|
60
|
-
expected: "aṅk" # note 5 rule checking
|
|
61
|
-
- source: "नेकपाले स्थगित स्थायी कमिटीको बैठक भदौ गते बोलाउने भएको"
|
|
62
|
-
expected: "nekpāle sathgit sathāyī kmiṭīko baiṭhk bhdau gte bolāune bheko"
|
|
63
|
-
- source: "न घर रह्यो, न परिवार"
|
|
64
|
-
expected: "n ghr rhayo, n privār"
|
|
65
|
-
- source: "ढोरपाटनमा भुजीखोला बाढीपहिरोले अभिभावक गुमाएका बालबालिकाको बिचल्ली"
|
|
66
|
-
expected: "ḍhorpāṭnmā bhujīkholā bāḍhīphirole abhibhāvk gumāekā bālbālikāko bichlalī"
|
|
67
|
-
- source: "सुस्मिताका काका हेमबहादुर र काकीलाई पनि पहिरोले बगायो"
|
|
68
|
-
expected: "susamitākā kākā hembhādur r kākīlāī pni phirole bgāyo"
|
|
69
|
-
- source: "संविधान जारी भएसँगै सार्वजनिक प्रशासनमा नयाँ उत्साह आउने अपेक्षा थियो"
|
|
70
|
-
expected: "sṃvidhān jārī bhes~gai sāravjnik parshāsnmā nyā~ utasāh āune apekṣā thiyo"
|
|
71
|
-
- source: "देशमा कोरोना संक्रमित र मृतकको संख्या हरेक दिन बढ्दो छ"
|
|
72
|
-
expected: "deshmā koronā sṅkarmit r mṛitkko sṅkhayā hrek din bḍhado chh"
|
|
73
|
-
- source: "गाउँपालिकाका अध्यक्ष टिका गुरुङका अनुसार विष्णुदासलाई राजुले सुत्नका लागि बेलुका साथी लगेका थिए"
|
|
74
|
-
expected: "gāu~pālikākā adhaykṣ ṭikā guruṅkā anusār viṣaṇudāslāī rājule sutankā lāgi belukā sāthī lgekā thie"
|
|
75
|
-
- source: "यो आयोजना गाउँपालिकाको केन्द्र तेल्लोकमा पर्छ"
|
|
76
|
-
expected: "yo āyojnā gāu~pālikāko kenadar telalokmā prachh"
|
|
77
|
-
- source: "सुस्मिताका काका हेमबहादुर र काकीलाई पनि पहिरोले बगायो"
|
|
78
|
-
expected: "susamitākā kākā hembhādur r kākīlāī pni phirole bgāyo"
|
|
79
|
-
- source: "चैत पहिलो साता घर आएका उनी लकडाउन भएपछि यतै रोकिए"
|
|
80
|
-
expected: "chait philo sātā ghr āekā unī lkḍāun bhepchhi ytai rokie"
|
|
81
|
-
- source: "काम गर्न जानेको हकमा रोजगारदाता कम्पनीको पत्रसँगै वडा र जिल्ला प्रशासनको सिफारिस अनिवार्य गरिएको छ"
|
|
82
|
-
expected: "kām gran jāneko hkmā rojgārdātā kmapnīko ptrs~gai vḍā r jilalā parshāsnko siphāris anivāray grieko chh"
|
|
83
|
-
- source: "दुःख"
|
|
84
|
-
expected: "duḥkh"
|
|
85
|
-
- source: "निकुञ्जको स्थानीय पोस्टका कर्मचारी पनि त्यहीँ थिए"
|
|
86
|
-
expected: "nikuñajko sathānīy posaṭkā kramchārī pni tayhī~ thie"
|
|
87
|
-
- source: "युद्धकालको मनोविज्ञान"
|
|
88
|
-
expected: "yudadhkālko mnovijñān"
|
|
89
|
-
- source: "जर्मन वायुसेवाको आक्रमणमा दुई लाख पचास हजार मानिसको ज्यान जानसक्ने र करिब ३० देखि ४० लाख मान्छे विस्थापित हुने अनुमान बेलायत सरकारको थियो"
|
|
90
|
-
expected: "jramn vāyusevāko ākarmṇmā duī lākh pchās hjār mānisko jayān jānskane r krib 30 dekhi 40 lākh mānachhe visathāpit hune anumān belāyt srkārko thiyo"
|
|
91
|
-
- source: "युद्ध"
|
|
92
|
-
expected: "yudadh"
|
|
93
|
-
- source: "कोरोनासँग जम्काभेट"
|
|
94
|
-
expected: "koronās~g jmakābheṭ"
|
|
95
|
-
- source: "संक्रमित"
|
|
96
|
-
expected: "sṅkarmit"
|
|
97
|
-
- source: "स्वयम्"
|
|
98
|
-
expected: "savyma"
|
|
99
|
-
- source: "संख्या"
|
|
100
|
-
expected: "sṅkhayā"
|
|
101
|
-
- source: "गौरीटारस्थित रंगशाला"
|
|
102
|
-
expected: "gaurīṭārsathit rṅgshālā"
|
|
103
|
-
|
|
104
|
-
map:
|
|
105
|
-
|
|
106
|
-
rules:
|
|
107
|
-
# note[5]
|
|
108
|
-
- pattern: \u0902(?=[कखगघ]) # ं before क, ख, ग, and घ
|
|
109
|
-
result: ṅ
|
|
110
|
-
- pattern: \u0902(?=[चछजझ]) # ं before च, छ, ज, and झ
|
|
111
|
-
result: ñ
|
|
112
|
-
- pattern: \u0902(?=[टठडढ]) # ं before ट, ठ, ड, and ढ
|
|
113
|
-
result: ṇ
|
|
114
|
-
- pattern: \u0902(?=[तथदध]) # ं before त, थ, द, and ध
|
|
115
|
-
result: n
|
|
116
|
-
|
|
117
|
-
characters:
|
|
118
|
-
|
|
119
|
-
# Vowels and Diphthongs
|
|
120
|
-
|
|
121
|
-
'अ': 'a'
|
|
122
|
-
'आ': 'ā'
|
|
123
|
-
'इ': 'i'
|
|
124
|
-
'ई': 'ī'
|
|
125
|
-
'उ': 'u'
|
|
126
|
-
'ऊ': 'ū'
|
|
127
|
-
'ऋ': 'ṛi'
|
|
128
|
-
'ॠ': 'rī'
|
|
129
|
-
'ए': 'e'
|
|
130
|
-
'ऐ': 'ai'
|
|
131
|
-
'ओ': 'o'
|
|
132
|
-
'औ': 'au'
|
|
133
|
-
|
|
134
|
-
# Medials # Needed for connecting consonants
|
|
135
|
-
|
|
136
|
-
'ा': "ā"
|
|
137
|
-
'ि': "i"
|
|
138
|
-
'ी': "ī"
|
|
139
|
-
'ु': "u"
|
|
140
|
-
'ू': "ū"
|
|
141
|
-
'ृ': "ṛi"
|
|
142
|
-
'ॄ': "rī"
|
|
143
|
-
'े': "e"
|
|
144
|
-
'ै': "ai"
|
|
145
|
-
'ो': "o"
|
|
146
|
-
'ौ': "au"
|
|
147
|
-
|
|
148
|
-
|
|
149
|
-
# Consonants (see Note 1)
|
|
150
|
-
|
|
151
|
-
# Gutturals
|
|
152
|
-
'क': 'k'
|
|
153
|
-
'ख': 'kh'
|
|
154
|
-
'ग': 'g'
|
|
155
|
-
'घ': 'gh'
|
|
156
|
-
'ङ': 'ṅ'
|
|
157
|
-
|
|
158
|
-
# Palatals
|
|
159
|
-
'च': 'ch'
|
|
160
|
-
'छ': 'chh'
|
|
161
|
-
'ज': 'j'
|
|
162
|
-
'झ': 'jh'
|
|
163
|
-
'ञ': 'ñ'
|
|
164
|
-
|
|
165
|
-
# Cerebrals
|
|
166
|
-
'ट': 'ṭ'
|
|
167
|
-
'ठ': 'ṭh'
|
|
168
|
-
'ड': 'ḍ'
|
|
169
|
-
'ढ': 'ḍh'
|
|
170
|
-
'ण': 'ṇ'
|
|
171
|
-
|
|
172
|
-
# Dentals
|
|
173
|
-
'त': 't'
|
|
174
|
-
'थ': 'th'
|
|
175
|
-
'द': 'd'
|
|
176
|
-
'ध': 'dh'
|
|
177
|
-
'न': 'n'
|
|
178
|
-
|
|
179
|
-
# Labials
|
|
180
|
-
'प': 'p'
|
|
181
|
-
'फ': 'ph'
|
|
182
|
-
'ब': 'b'
|
|
183
|
-
'भ': 'bh'
|
|
184
|
-
'म': 'm'
|
|
185
|
-
|
|
186
|
-
# Semivowels
|
|
187
|
-
'य': 'y'
|
|
188
|
-
'र': 'r'
|
|
189
|
-
'ल': 'l'
|
|
190
|
-
'व': 'v' # or w [Note#3]
|
|
191
|
-
|
|
192
|
-
# Sibilants
|
|
193
|
-
'श': 'sh'
|
|
194
|
-
'ष': 'ṣ'
|
|
195
|
-
'स': 's'
|
|
196
|
-
'क्ष': 'kṣ'
|
|
197
|
-
'त्र': 'tr'
|
|
198
|
-
'ज्ञ' : 'jñ'
|
|
199
|
-
|
|
200
|
-
# Aspirate
|
|
201
|
-
'ह': 'h'
|
|
202
|
-
|
|
203
|
-
# Anusvāra
|
|
204
|
-
'ं': 'ṃ'
|
|
205
|
-
|
|
206
|
-
# Bisarga
|
|
207
|
-
'ः': 'ḥ'
|
|
208
|
-
|
|
209
|
-
# Anunāsika
|
|
210
|
-
'ँ': '~'
|
|
211
|
-
|
|
212
|
-
'ॅ': 'r'
|
|
213
|
-
|
|
214
|
-
# halanta
|
|
215
|
-
'्': 'a'
|
|
216
|
-
|
|
217
|
-
# Abagraha
|
|
218
|
-
'ऽ': '’' # (apostrophe)
|
|
219
|
-
|
|
220
|
-
# Numerals / सङ्ख्या
|
|
221
|
-
'०': '0'
|
|
222
|
-
'१': '1'
|
|
223
|
-
'२': '2'
|
|
224
|
-
'३': '3'
|
|
225
|
-
'४': '4'
|
|
226
|
-
'५': '5'
|
|
227
|
-
'६': '6'
|
|
228
|
-
'७': '7'
|
|
229
|
-
'८': '8'
|
|
230
|
-
'९': '9'
|