interscript 0.1.7 → 2.1.0b1
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/.gitignore +11 -0
- data/.rspec +3 -0
- data/Gemfile +29 -0
- data/LICENSE.adoc +31 -0
- data/README.md +3 -0
- data/Rakefile +116 -0
- data/bin/console +14 -0
- data/bin/interscript +5 -0
- data/bin/maps_analyze_staging +168 -0
- data/bin/maps_debug_compilers +58 -0
- data/bin/maps_debug_ordering +88 -0
- data/bin/maps_debug_ruby_compile +24 -0
- data/bin/maps_debug_step_by_step +44 -0
- data/bin/maps_optimize_order +112 -0
- data/bin/maps_v1_analyze_regexps +45 -0
- data/bin/maps_v1_to_v2 +426 -0
- data/bin/setup +8 -0
- data/exe/interscript +6 -0
- data/interscript.gemspec +31 -0
- data/lib/interscript.rb +83 -133
- data/lib/interscript/command.rb +5 -5
- data/lib/interscript/compiler.rb +22 -0
- data/lib/interscript/compiler/javascript.rb +292 -0
- data/lib/interscript/compiler/ruby.rb +262 -0
- data/lib/interscript/dsl.rb +68 -0
- data/lib/interscript/dsl/aliases.rb +23 -0
- data/lib/interscript/dsl/document.rb +46 -0
- data/lib/interscript/dsl/group.rb +45 -0
- data/lib/interscript/dsl/group/parallel.rb +6 -0
- data/lib/interscript/dsl/items.rb +89 -0
- data/lib/interscript/dsl/metadata.rb +68 -0
- data/lib/interscript/dsl/stage.rb +6 -0
- data/lib/interscript/dsl/symbol_mm.rb +11 -0
- data/lib/interscript/dsl/tests.rb +12 -0
- data/lib/interscript/interpreter.rb +251 -0
- data/lib/interscript/node.rb +25 -0
- data/lib/interscript/node/alias_def.rb +15 -0
- data/lib/interscript/node/dependency.rb +13 -0
- data/lib/interscript/node/document.rb +45 -0
- data/lib/interscript/node/group.rb +34 -0
- data/lib/interscript/node/group/parallel.rb +9 -0
- data/lib/interscript/node/group/sequential.rb +2 -0
- data/lib/interscript/node/item.rb +52 -0
- data/lib/interscript/node/item/alias.rb +42 -0
- data/lib/interscript/node/item/any.rb +76 -0
- data/lib/interscript/node/item/capture.rb +50 -0
- data/lib/interscript/node/item/group.rb +51 -0
- data/lib/interscript/node/item/repeat.rb +40 -0
- data/lib/interscript/node/item/stage.rb +23 -0
- data/lib/interscript/node/item/string.rb +51 -0
- data/lib/interscript/node/metadata.rb +18 -0
- data/lib/interscript/node/rule.rb +6 -0
- data/lib/interscript/node/rule/funcall.rb +18 -0
- data/lib/interscript/node/rule/run.rb +15 -0
- data/lib/interscript/node/rule/sub.rb +68 -0
- data/lib/interscript/node/stage.rb +19 -0
- data/lib/interscript/node/tests.rb +15 -0
- data/lib/interscript/stdlib.rb +211 -0
- data/lib/interscript/utils/regexp_converter.rb +283 -0
- data/lib/interscript/version.rb +1 -1
- data/lib/interscript/visualize.rb +61 -0
- data/lib/interscript/visualize/group.html.erb +59 -0
- data/lib/interscript/visualize/json.rb +57 -0
- data/lib/interscript/visualize/map.html.erb +46 -0
- data/lib/interscript/visualize/nodes.rb +89 -0
- data/requirements.txt +1 -0
- metadata +78 -416
- data/README.adoc +0 -298
- data/lib/g2pwrapper.py +0 -34
- data/lib/interscript/fs.rb +0 -69
- data/lib/interscript/mapping.rb +0 -142
- data/lib/interscript/opal.rb +0 -57
- data/lib/interscript/opal/entrypoint.rb +0 -12
- data/lib/interscript/opal/map_translate.rb +0 -7
- data/lib/interscript/opal/maps.js.erb +0 -10
- data/lib/model-7 +0 -0
- data/lib/tha-pt-b-7 +0 -0
- data/maps/acadsin-zho-Hani-Latn-2002.yaml +0 -38916
- data/maps/alalc-amh-Ethi-Latn-1997.yaml +0 -513
- data/maps/alalc-amh-Ethi-Latn-2011.yaml +0 -138
- data/maps/alalc-ara-Arab-Latn-1997.yaml +0 -1287
- data/maps/alalc-asm-Deva-Latn-1997.yaml +0 -165
- data/maps/alalc-asm-Deva-Latn-2012.yaml +0 -40
- data/maps/alalc-aze-Cyrl-Latn-1997.yaml +0 -145
- data/maps/alalc-bel-Cyrl-Latn-1997.yaml +0 -129
- data/maps/alalc-ben-Beng-Latn-2017.yaml +0 -130
- data/maps/alalc-bul-Cyrl-Latn-1997.yaml +0 -98
- data/maps/alalc-ell-Grek-Latn-1997.yaml +0 -628
- data/maps/alalc-ell-Grek-Latn-2010.yaml +0 -626
- data/maps/alalc-guj-Gujr-Latn-1997.yaml +0 -266
- data/maps/alalc-guj-Gujr-Latn-2011.yaml +0 -64
- data/maps/alalc-hin-Deva-Latn-1997.yaml +0 -211
- data/maps/alalc-hin-Deva-Latn-2011.yaml +0 -47
- data/maps/alalc-kat-Geok-Latn-1997.yaml +0 -111
- data/maps/alalc-kat-Geor-Latn-1997.yaml +0 -150
- data/maps/alalc-kor-Hang-Latn-1997.yaml +0 -98
- data/maps/alalc-mal-Mlym-Latn-1997.yaml +0 -303
- data/maps/alalc-mal-Mlym-Latn-2012.yaml +0 -73
- data/maps/alalc-mar-Deva-Latn-1997.yaml +0 -189
- data/maps/alalc-mar-Deva-Latn-2011.yaml +0 -45
- data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +0 -114
- data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +0 -103
- data/maps/alalc-mon-Cyrl-Latn-1997.yaml +0 -220
- data/maps/alalc-pan-Guru-Latn-1997.yaml +0 -256
- data/maps/alalc-pan-Guru-Latn-2011.yaml +0 -78
- data/maps/alalc-per-Arab-Latn-1997.yaml +0 -375
- data/maps/alalc-pli-Deva-Latn-2012.yaml +0 -144
- data/maps/alalc-pra-Deva-Latn-2012.yaml +0 -47
- data/maps/alalc-rus-Cyrl-Latn-1997.yaml +0 -225
- data/maps/alalc-rus-Cyrl-Latn-2012.yaml +0 -162
- data/maps/alalc-san-Deva-Latn-2012.yaml +0 -172
- data/maps/alalc-sin-Sinh-Latn-1997.yaml +0 -292
- data/maps/alalc-sin-Sinh-Latn-2011.yaml +0 -71
- data/maps/alalc-srp-Cyrl-Latn-1997.yaml +0 -118
- data/maps/alalc-srp-Cyrl-Latn-2013.yaml +0 -135
- data/maps/alalc-tam-Taml-Latn-1997.yaml +0 -62
- data/maps/alalc-tam-Taml-Latn-2011.yaml +0 -58
- data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +0 -145
- data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +0 -16
- data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +0 -283
- data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +0 -174
- data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +0 -169
- data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +0 -292
- data/maps/bgn-kor-Hang-Latn-1943.yaml +0 -35
- data/maps/bgn-kor-Kore-Latn-1943.yaml +0 -31
- data/maps/bgna-bul-Cyrl-Latn-2006.yaml +0 -208
- data/maps/bgna-bul-Cyrl-Latn-2009.yaml +0 -208
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +0 -532
- data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +0 -596
- data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +0 -108
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +0 -104
- data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +0 -188
- data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +0 -289
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +0 -119
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +0 -42
- data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +0 -184
- data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +0 -705
- data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +0 -23
- data/maps/bgnpcgn-fas-Arab-Latn-1956.yaml +0 -96
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +0 -257
- data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +0 -131
- data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +0 -42
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +0 -253
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +0 -48
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +0 -48
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +0 -163
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +0 -190
- data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +0 -223
- data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +0 -230
- data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +0 -336
- data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +0 -639
- data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +0 -459
- data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +0 -168
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +0 -318
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +0 -170
- data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +0 -220
- data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +0 -240
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +0 -166
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +0 -119
- data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +0 -127
- data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +0 -82
- data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +0 -7456
- data/maps/bis-asm-Beng-Latn-13194-1991.yaml +0 -159
- data/maps/bis-ben-Beng-Latn-13194-1991.yaml +0 -156
- data/maps/bis-dev-Deva-Latn-13194-1991.yaml +0 -184
- data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +0 -181
- data/maps/bis-knd-Knda-Latn-13194-1991.yaml +0 -173
- data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +0 -176
- data/maps/bis-ori-Orya-Latn-13194-1991.yaml +0 -160
- data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +0 -175
- data/maps/bis-tel-Telu-Latn-13194-1991.yaml +0 -170
- data/maps/bis-tml-Taml-Latn-13194-1991.yaml +0 -155
- data/maps/by-bel-Cyrl-Latn-1998.yaml +0 -172
- data/maps/by-bel-Cyrl-Latn-2007.yaml +0 -115
- data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +0 -899
- data/maps/din-hin-Deva-Latn-33904-2018.yaml +0 -100
- data/maps/din-kat-Geor-Latn-32707-2010.yaml +0 -145
- data/maps/din-mar-Deva-Latn-33904-2018.yaml +0 -84
- data/maps/din-nep-Deva-Latn-33904-2018.yaml +0 -119
- data/maps/din-pli-Deva-Latn-33904-2018.yaml +0 -75
- data/maps/din-pra-Deva-Latn-33904-2018.yaml +0 -63
- data/maps/din-san-Deva-Latn-33904-2018.yaml +0 -338
- data/maps/din-tam-Taml-Latn-33903-2016.yaml +0 -213
- data/maps/dos-nep-Deva-Latn-1997.yaml +0 -47
- data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +0 -684
- data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +0 -680
- data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +0 -19
- data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +0 -31
- data/maps/ggg-kat-Geor-Latn-2002.yaml +0 -92
- data/maps/gki-bel-Cyrl-Latn-1992.yaml +0 -33
- data/maps/gki-bel-Cyrl-Latn-2000.yaml +0 -201
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +0 -190
- data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +0 -157
- data/maps/hk-yue-Hani-Latn-1888.yaml +0 -38497
- data/maps/icao-bel-Cyrl-Latn-9303.yaml +0 -136
- data/maps/icao-bul-Cyrl-Latn-9303.yaml +0 -118
- data/maps/icao-fas-Arab-Latn-9303.yaml +0 -103
- data/maps/icao-heb-Hebr-Latn-9303.yaml +0 -151
- data/maps/icao-mkd-Cyrl-Latn-9303.yaml +0 -117
- data/maps/icao-rus-Cyrl-Latn-9303.yaml +0 -117
- data/maps/icao-srp-Cyrl-Latn-9303.yaml +0 -117
- data/maps/icao-ukr-Cyrl-Latn-9303.yaml +0 -119
- data/maps/iso-ara-Arab-Latn-233-1984.yaml +0 -323
- data/maps/iso-asm-Beng-Latn-15919-2001.yaml +0 -75
- data/maps/iso-ben-Beng-Latn-15919-2001.yaml +0 -175
- data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +0 -613
- data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +0 -44
- data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +0 -220
- data/maps/iso-hin-Deva-Latn-15919-2001.yaml +0 -87
- data/maps/iso-inc-Deva-Latn-15919-2001.yaml +0 -61
- data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +0 -66
- data/maps/iso-kan-Knda-Latn-15919-2001.yaml +0 -220
- data/maps/iso-kat-Geor-Latn-9984-1996.yaml +0 -145
- data/maps/iso-kor-Hang-Latn-1996-method1.yaml +0 -240
- data/maps/iso-kor-Hang-Latn-1996-method2.yaml +0 -226
- data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +0 -281
- data/maps/iso-mar-Deva-Latn-15919-2001.yaml +0 -75
- data/maps/iso-nep-Deva-Latn-15919-2001.yaml +0 -87
- data/maps/iso-ori-Orya-Latn-15919-2001.yaml +0 -193
- data/maps/iso-pan-Guru-Latn-15919-2001.yaml +0 -222
- data/maps/iso-pli-Beng-Latn-15919-2001.yaml +0 -73
- data/maps/iso-pli-Deva-Latn-15919-2001.yaml +0 -74
- data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +0 -219
- data/maps/iso-pli-Thai-Latn-15919-2001.yaml +0 -55
- data/maps/iso-pra-Deva-Latn-15919-2001.yaml +0 -59
- data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +0 -366
- data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +0 -271
- data/maps/iso-san-Deva-Latn-15919-2001.yaml +0 -220
- data/maps/iso-tam-Taml-Latn-15919-2001.yaml +0 -159
- data/maps/iso-tel-Telu-Latn-15919-2001.yaml +0 -220
- data/maps/iso-tha-Thai-Latn-11940-1998.yaml +0 -109
- data/maps/kp-kor-Hang-Latn-2002.yaml +0 -909
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +0 -44820
- data/maps/mext-jpn-Hrkt-Latn-1954.yaml +0 -411
- data/maps/mns-mon-Cyrl-Latn-5217-2012.yaml +0 -163
- data/maps/mns-mon-Latn-Cyrl-5217-2012.yaml +0 -200
- data/maps/moct-kor-Hang-Latn-2000.yaml +0 -807
- data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +0 -541
- data/maps/mvd-bel-Cyrl-Latn-2008.yaml +0 -225
- data/maps/mvd-bel-Cyrl-Latn-2010.yaml +0 -63
- data/maps/mvd-rus-Cyrl-Latn-2008.yaml +0 -109
- data/maps/mvd-rus-Cyrl-Latn-2010.yaml +0 -37
- data/maps/odni-ara-Arab-Latn-2015.yaml +0 -425
- data/maps/odni-aze-Cyrl-Latn-2015.yaml +0 -144
- data/maps/odni-bel-Cyrl-Latn-2015.yaml +0 -148
- data/maps/odni-bul-Cyrl-Latn-2015.yaml +0 -96
- data/maps/odni-che-Cyrl-Latn-2015.yaml +0 -169
- data/maps/odni-fas-Arab-Latn-2015.yaml +0 -406
- data/maps/odni-hin-Deva-Latn-2015.yaml +0 -258
- data/maps/odni-kat-Geor-Latn-2015.yaml +0 -87
- data/maps/odni-kaz-Cyrl-Latn-2015.yaml +0 -148
- data/maps/odni-kir-Cyrl-Latn-2015.yaml +0 -136
- data/maps/odni-kor-Hang-Latn-2015.yaml +0 -375
- data/maps/odni-mkd-Cyrl-Latn-2015.yaml +0 -122
- data/maps/odni-per-Arab-Latn-2015.yaml +0 -228
- data/maps/odni-rus-Cyrl-Latn-2015.yaml +0 -77
- data/maps/odni-srp-Cyrl-Latn-2015.yaml +0 -129
- data/maps/odni-tat-Cyrl-Latn-2015.yaml +0 -142
- data/maps/odni-tgk-Cyrl-Latn-2015.yaml +0 -148
- data/maps/odni-uig-Cyrl-Latn-2015.yaml +0 -138
- data/maps/odni-ukr-Cyrl-Latn-2015.yaml +0 -157
- data/maps/odni-urd-Arab-Latn-2015.yaml +0 -221
- data/maps/odni-uzb-Cyrl-Latn-2015.yaml +0 -166
- data/maps/royin-tha-Thai-Latn-1939-generic.yaml +0 -90
- data/maps/royin-tha-Thai-Latn-1968.yaml +0 -183
- data/maps/royin-tha-Thai-Latn-1999-chained.yaml +0 -180
- data/maps/royin-tha-Thai-Latn-1999.yaml +0 -80
- data/maps/sac-zho-Hans-Latn-1979.yaml +0 -24763
- data/maps/sasm-mon-Mong-Latn-general-1978.yaml +0 -389
- data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +0 -354
- data/maps/ses-ara-Arab-Latn-1930.yaml +0 -283
- data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +0 -222
- data/maps/ua-ukr-Cyrl-Latn-1996.yaml +0 -197
- data/maps/ua-ukr-Cyrl-Latn-2007.yaml +0 -75
- data/maps/ua-ukr-Cyrl-Latn-2010.yaml +0 -192
- data/maps/un-amh-Ethi-Latn-2016.yaml +0 -602
- data/maps/un-ara-Arab-Latn-1971.yaml +0 -139
- data/maps/un-ara-Arab-Latn-1972.yaml +0 -159
- data/maps/un-ara-Arab-Latn-2017.yaml +0 -420
- data/maps/un-bel-Cyrl-Latn-2007.yaml +0 -114
- data/maps/un-ben-Beng-Latn-2016.yaml +0 -534
- data/maps/un-ell-Grek-Latn-1987-phonetic.yaml +0 -780
- data/maps/un-ell-Grek-Latn-1987-tl.yaml +0 -31
- data/maps/un-ell-Grek-Latn-1987-ts.yaml +0 -19
- data/maps/un-hin-Deva-Latn-2016.yaml +0 -222
- data/maps/un-mar-Deva-Latn-2016.yaml +0 -91
- data/maps/un-mon-Mong-Latn-general-2013.yaml +0 -264
- data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +0 -264
- data/maps/un-nep-Deva-Latn-1972.yaml +0 -350
- data/maps/un-nep-Deva-Latn-2013.yaml +0 -74
- data/maps/un-rus-Cyrl-Latn-1987.yaml +0 -166
- data/maps/un-ukr-Cyrl-Latn-1998.yaml +0 -53
- data/maps/un-ukr-Cyrl-Latn-2012.yaml +0 -162
- data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +0 -221
- data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +0 -406
- data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +0 -386
- data/maps/var-kor-Hang-Hang-jamo.yaml +0 -11193
- data/maps/var-kor-Hang-Latn-mr-1939.yaml +0 -1054
- data/maps/var-kor-Kore-Hang-2013.yaml +0 -59754
- data/maps/var-kor-Kore-Latn-mr-1939.yaml +0 -36
- data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +0 -43
- data/maps/var-mon-Mong-Latn-1930.yaml +0 -102
- data/maps/var-mon-Mong-Latn-lessing.yaml +0 -272
- data/maps/var-mon-Mong-Latn-vpmc.yaml +0 -274
- data/maps/var-pra-Deva-Latn-iast-1912.yaml +0 -30
- data/maps/var-san-Deva-Latn-iast-1912.yaml +0 -149
- data/maps/var-tha-Thai-Thai-phonemic.yaml +0 -59
- data/maps/var-tha-Thai-Zsym-ipa.yaml +0 -301
- data/maps/var-zho-Hani-Latn-wd-1979.yaml +0 -38912
- data/spec/interscript/filenames_spec.rb +0 -384
- data/spec/interscript/mapping_spec.rb +0 -42
- data/spec/interscript_spec.rb +0 -29
- data/spec/spec_helper.rb +0 -3
@@ -1,31 +0,0 @@
|
|
1
|
-
---
|
2
|
-
authority_id: un
|
3
|
-
id: 1987-tl
|
4
|
-
language: iso-639-2:ell
|
5
|
-
source_script: Grek
|
6
|
-
destination_script: Latn
|
7
|
-
name: UNGEGN Greek v4.0
|
8
|
-
url: http://www.eki.ee/wgrs/rom1_el.htm
|
9
|
-
creation_date: 1987
|
10
|
-
description: |
|
11
|
-
UNGEGN Romanization table for Greek
|
12
|
-
|
13
|
-
note:
|
14
|
-
- Transliteration version (reversible). Also appears in annex B of ISO 843:1997. Originates in v1.0 of UNGEGN transliteration, 1987. This likely was the intended system in ELOT 743:1982 for transliteration, but the reversible character diacritics are missing from the document, and the document does not indicate what there was supposed to be.
|
15
|
-
|
16
|
-
tests:
|
17
|
-
|
18
|
-
- source: |
|
19
|
-
Ένα πράμα μόνον με παρακίνησε κι εμένα να γράψω ότι τούτην την πατρίδα την έχομεν όλοι μαζί, και σοφοί κι αμαθείς και πλούσιοι και φτωχοί και πολιτικοί και στρατιωτικοί και οι πλέον μικρότεροι άνθρωποι· όσοι αγωνιστήκαμεν, αναλόγως ο καθείς, έχομεν να ζήσομεν εδώ. Το λοιπόν δουλέψαμεν όλοι μαζί, να την φυλάμεν κι όλοι μαζί και να μην λέγει ούτε ο δυνατός «εγώ» ούτε ο αδύνατος. Ξέρετε πότε να λέγει ο καθείς «εγώ»; Όταν αγωνιστεί μόνος του και φκιάσει ή χαλάσει, να λέγει «εγώ»· όταν όμως αγωνίζονται πολλοί και φκιάνουν, τότε να λένε «εμείς». Είμαστε εις το «εμείς» κι όχι εις το «εγώ». Και εις το εξής να μάθομεν γνώση, αν θέλομεν να φκιάσομεν χωριόν, να ζήσομεν όλοι μαζί.
|
20
|
-
|
21
|
-
Γιάννης Μακρυγιάννης.
|
22
|
-
|
23
|
-
expected: |
|
24
|
-
Éna práma mónon me parakíni̱se ki eména na grápso̱ óti toúti̱n ti̱n patrída ti̱n échomen óloi mazí, kai sofoí ki amatheís kai ploúsioi kai fto̱choí kai politikoí kai stratio̱tikoí kai oi pléon mikróteroi ánthro̱poi; ósoi ago̱nistí̱kamen, analógo̱s o katheís, échomen na zí̱somen edó̱. To loipón doulépsamen óloi mazí, na ti̱n fylámen ki óloi mazí kai na mi̱n légei oúte o dynatós «egó̱» oúte o adýnatos. Xérete póte na légei o katheís «egó̱»? Ótan ago̱nisteí mónos tou kai fkiásei í̱ chalásei, na légei «egó̱»; ótan ómo̱s ago̱nízontai polloí kai fkiánoun, tóte na léne «emeís». Eímaste eis to «emeís» ki óchi eis to «egó̱». Kai eis to exí̱s na máthomen gnó̱si̱, an thélomen na fkiásomen cho̱rión, na zí̱somen óloi mazí.
|
25
|
-
|
26
|
-
Giánni̱s Makrygiánni̱s.
|
27
|
-
|
28
|
-
map:
|
29
|
-
character_separator: ""
|
30
|
-
word_separator: " "
|
31
|
-
inherit: "elot-ell-Grek-Latn-743-1982-tl"
|
@@ -1,19 +0,0 @@
|
|
1
|
-
---
|
2
|
-
authority_id: un
|
3
|
-
id: 1987-tl
|
4
|
-
language: iso-639-2:ell
|
5
|
-
source_script: Grek
|
6
|
-
destination_script: Latn
|
7
|
-
name: UNGEGN Greek v4.0
|
8
|
-
url: http://www.eki.ee/wgrs/rom1_el.htm
|
9
|
-
creation_date: 1987
|
10
|
-
description: |
|
11
|
-
UNGEGN Romanization table for Greek
|
12
|
-
|
13
|
-
note:
|
14
|
-
- Transcription version
|
15
|
-
|
16
|
-
map:
|
17
|
-
character_separator: ""
|
18
|
-
word_separator: " "
|
19
|
-
inherit: "elot-ell-Grek-Latn-743-1982-ts"
|
@@ -1,222 +0,0 @@
|
|
1
|
-
---
|
2
|
-
authority_id: ungegn
|
3
|
-
id: 2016
|
4
|
-
language: iso-639-2:hin
|
5
|
-
source_script: Deva
|
6
|
-
destination_script: Latn
|
7
|
-
name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Hindi Romanization, 1972
|
8
|
-
url: https://www.eki.ee/wgrs/rom1_hi.pdf
|
9
|
-
creation_date: 1972
|
10
|
-
confirmation_date: 2016
|
11
|
-
description: |
|
12
|
-
The United Nations recommended system was approved in 1972 (II/11) and amended in 1977
|
13
|
-
(III/12), based on a report prepared by D. N. Sharma. The tables and their corrections were
|
14
|
-
published in volume II of the conference reports.
|
15
|
-
|
16
|
-
There is no evidence of the use of the system either in India or in international cartographic
|
17
|
-
products. It was stated in 1987 that the appropriate resolution had not been implemented in
|
18
|
-
India and the Hunterian system was still in use in large-scale mapping
|
19
|
-
|
20
|
-
Hindi uses the alphasyllabic script Devanāgarī whereby each character represents a syllable
|
21
|
-
rather than one sound. Vowels and diphthongs are marked in two ways: as independent
|
22
|
-
characters (used syllable-initially) and in an abbreviated form, to denote vowels after
|
23
|
-
consonants. The romanization table is unambiguous but the user would have to recognize
|
24
|
-
many ligatures not given in the original table (only three are given). The system is mostly
|
25
|
-
reversible but there may exist some ambiguities in the romanization of vowels (independent
|
26
|
-
vs. abbreviated characters) and consonants
|
27
|
-
|
28
|
-
notes:
|
29
|
-
- |
|
30
|
-
It is recommended that the vowel अ (a) should always be romanized except when it ends a
|
31
|
-
name. If a name ends with a consonant, the consonant should carry a sub-macron. Such
|
32
|
-
cases, however, will be very rare. For example, कानपुर Kānapur (not Kānapura), जगत्
|
33
|
-
Jagaṯ.
|
34
|
-
- |
|
35
|
-
If each letter of a digraph or any two parts of a trigraph has a distinct independent sound
|
36
|
-
then it should be indicated by a hyphen, thus d-h.
|
37
|
-
|
38
|
-
tests:
|
39
|
-
- source: "परिपक्क"
|
40
|
-
expected: "paraipakka"
|
41
|
-
- source: "जगत्"
|
42
|
-
expected: "jagat"
|
43
|
-
- source: "संख्या"
|
44
|
-
expected: "saṁkhyaā"
|
45
|
-
- source: "गंभीर मरीजों के मामले में भारत दूसरे नंबर पर"
|
46
|
-
expected: "gaṁbhaīra maraījaoṁ kae maāmalae maeṁ bhaārata daūsarae naṁbara para"
|
47
|
-
- source: "कोरोना अपडेट्स"
|
48
|
-
expected: "kaoraonaā apaḍaeṭsa"
|
49
|
-
- source: "सीडीसी चीफ का बयान अहम"
|
50
|
-
expected: "saīḍaīsaī chaīpha kaā bayaāna ahama"
|
51
|
-
- source: "गूगल प्ले स्टोर पर पेटीएम की वापसी"
|
52
|
-
expected: "gaūgala plae sṭaora para paeṭaīema kaī vaāpasaī"
|
53
|
-
- source: "भारत में गैंबलिंग की इजाजत नहीं"
|
54
|
-
expected: "bhaārata maeṁ gaaiṁbalaiṁga kaī ijaājata nahaīṁ"
|
55
|
-
- source: "कोरोना वैक्सीन मुद्दे पर घिरे राष्ट्रपति; जो बाइडेन बोले- मुझे और देश को वैज्ञानिकों पर भरोसा है, डोनाल्ड ट्रम्प पर नहीं"
|
56
|
-
expected: "kaoraonaā vaaiksaīna mauddae para ghairae raāṣhṭrapatai; jao baāiḍaena baolae- maujhae aura daesha kao vaaijñaānaikaoṁ para bharaosaā haai, ḍaonaālḍa ṭrampa para nahaīṁ"
|
57
|
-
- source: "गूगल की कार्रवाई पर पेटीएम ने कहा था कि ऐप को अस्थायी तौर पर प्ले-स्टोर से हटाया गया है, आपके पैसे सुरक्षित हैं"
|
58
|
-
expected: "gaūgala kaī kaārravaāī para paeṭaīema nae kahaā thaā kai aipa kao asthaāyaī taaura para plae-sṭaora sae haṭaāyaā gayaā haai, āpakae paaisae saurakṣhaita haaiṁ"
|
59
|
-
map:
|
60
|
-
|
61
|
-
characters:
|
62
|
-
|
63
|
-
# I. Independent vowel characters
|
64
|
-
'अ': 'a'
|
65
|
-
'आ': 'ā'
|
66
|
-
'इ': 'i'
|
67
|
-
'ई': 'ī'
|
68
|
-
'उ': 'u'
|
69
|
-
'ऊ': 'ū'
|
70
|
-
'ऋ': 'ṛ'
|
71
|
-
'ॠ': 'ṝ'
|
72
|
-
'ऌ': 'l̤'
|
73
|
-
'ए': 'e'
|
74
|
-
'ऐ': 'ai'
|
75
|
-
'ओ': 'o'
|
76
|
-
'औ': 'au'
|
77
|
-
|
78
|
-
# II. Abbreviated vowel characters
|
79
|
-
|
80
|
-
'ा': "ā" # का
|
81
|
-
'ॉ': "ā̆ " # additional mark: कॉ
|
82
|
-
'ि': "i" # कि i
|
83
|
-
'ी': "ī" # की
|
84
|
-
'ु': "u" # कु
|
85
|
-
'ू': "ū" # कू
|
86
|
-
'ृ': "ṛ" # कृ
|
87
|
-
'े': "e" # के
|
88
|
-
'ै': "ai" # कै
|
89
|
-
'ो': "o" # को
|
90
|
-
'ौ': "au" # कौ
|
91
|
-
|
92
|
-
|
93
|
-
# Consonants (see Note 1)
|
94
|
-
|
95
|
-
# Gutturals
|
96
|
-
'क': 'ka'
|
97
|
-
'ख': 'kha'
|
98
|
-
'ग': 'ga'
|
99
|
-
'घ': 'gha'
|
100
|
-
'ङ': 'ṅa'
|
101
|
-
|
102
|
-
# Palatals
|
103
|
-
'च': 'cha'
|
104
|
-
'छ': 'chha'
|
105
|
-
'ज': 'ja'
|
106
|
-
'झ': 'jha'
|
107
|
-
'ञ': 'ña'
|
108
|
-
|
109
|
-
# Cerebrals
|
110
|
-
'ट': 'ṭa'
|
111
|
-
'ठ': 'ṭha'
|
112
|
-
'ड': 'ḍa'
|
113
|
-
'ढ': 'ḍha'
|
114
|
-
'ण': 'ṇa'
|
115
|
-
|
116
|
-
# Dentals
|
117
|
-
'त': 'ta'
|
118
|
-
'थ': 'tha'
|
119
|
-
'द': 'da'
|
120
|
-
'ध': 'dha'
|
121
|
-
'न': 'na'
|
122
|
-
|
123
|
-
# Labials
|
124
|
-
'प': 'pa'
|
125
|
-
'फ': 'pha'
|
126
|
-
'ब': 'ba'
|
127
|
-
'भ': 'bha'
|
128
|
-
'म': 'ma'
|
129
|
-
|
130
|
-
# Semivowels
|
131
|
-
'य': 'ya'
|
132
|
-
'र': 'ra'
|
133
|
-
'ल': 'la'
|
134
|
-
'व': 'va'
|
135
|
-
|
136
|
-
# Sibilants
|
137
|
-
'श': 'sha'
|
138
|
-
'ष': 'ṣha'
|
139
|
-
'स': 'sa'
|
140
|
-
|
141
|
-
# Dotted variants
|
142
|
-
'क़': 'qa'
|
143
|
-
'ख़': 'ḳha'
|
144
|
-
'ग़': 'ġa'
|
145
|
-
'ज़': 'za'
|
146
|
-
'ड़': 'ṙa'
|
147
|
-
'ढ़': 'ṙha'
|
148
|
-
'फ़': 'fa'
|
149
|
-
|
150
|
-
|
151
|
-
# Aspirate
|
152
|
-
'ह': 'ha'
|
153
|
-
|
154
|
-
# Anusvāra
|
155
|
-
'ं': 'ṁ'
|
156
|
-
|
157
|
-
# Anunāsika
|
158
|
-
'ँ': 'm̐'
|
159
|
-
|
160
|
-
# halanta
|
161
|
-
'्': ''
|
162
|
-
|
163
|
-
# bisharga
|
164
|
-
'ः' : 'ḥ'
|
165
|
-
|
166
|
-
#V. Ligatures(To cover all Ligatures at unicode)
|
167
|
-
# Implemnting Pronunciation without a vowel: क् k.
|
168
|
-
|
169
|
-
# Gutturals
|
170
|
-
'क्': 'k'
|
171
|
-
'ख्': 'kh'
|
172
|
-
'ग्': 'g'
|
173
|
-
'घ्': 'gh'
|
174
|
-
'ङ्': 'ṅ'
|
175
|
-
|
176
|
-
# Palatals
|
177
|
-
'च्': 'ch'
|
178
|
-
'छ्': 'chh'
|
179
|
-
'ज्': 'j'
|
180
|
-
'झ्': 'jh'
|
181
|
-
'ञ्': 'ñ'
|
182
|
-
|
183
|
-
# Cerebrals
|
184
|
-
'ट्': 'ṭ'
|
185
|
-
'ठ्': 'ṭh'
|
186
|
-
'ड्': 'ḍ'
|
187
|
-
'ढ्': 'ḍh'
|
188
|
-
'ण्': 'ṇ'
|
189
|
-
|
190
|
-
# Dentals
|
191
|
-
'त्': 't'
|
192
|
-
'थ्': 'th'
|
193
|
-
'द्': 'd'
|
194
|
-
'ध्': 'dh'
|
195
|
-
'न्': 'n'
|
196
|
-
|
197
|
-
# Labials
|
198
|
-
'प्': 'p'
|
199
|
-
'फ्': 'ph'
|
200
|
-
'ब्': 'b'
|
201
|
-
'भ्': 'bh'
|
202
|
-
'म्': 'm'
|
203
|
-
|
204
|
-
# Semivowels
|
205
|
-
'य्': 'y'
|
206
|
-
'र्': 'r'
|
207
|
-
'ल्': 'l'
|
208
|
-
'व्': 'v'
|
209
|
-
|
210
|
-
# Sibilants
|
211
|
-
'श्': 'sh'
|
212
|
-
'ष्': 'ṣh'
|
213
|
-
'स्': 's'
|
214
|
-
|
215
|
-
# Dotted variants
|
216
|
-
'क़्': 'q'
|
217
|
-
'ख़्': 'ḳh'
|
218
|
-
'ग़्': 'ġ'
|
219
|
-
'ज़्': 'z'
|
220
|
-
'ड़्': 'ṙ'
|
221
|
-
'ढ़्': 'ṙh'
|
222
|
-
'फ़्': 'f'
|
@@ -1,91 +0,0 @@
|
|
1
|
-
---
|
2
|
-
authority_id: ungegn
|
3
|
-
id: 2016
|
4
|
-
language: iso-639-2:hin
|
5
|
-
source_script: Deva
|
6
|
-
destination_script: Latn
|
7
|
-
name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Marathi Romanization, 1972
|
8
|
-
url: https://www.eki.ee/wgrs/rom1_mr.pdf
|
9
|
-
creation_date: 1972
|
10
|
-
confirmation_date: 2016
|
11
|
-
description: |
|
12
|
-
The United Nations recommended system was approved in 1972 (II/11) and amended in 1977
|
13
|
-
(III/12), based on a report prepared by D. N. Sharma. The tables and their corrections were
|
14
|
-
published in volume II of the conference reports
|
15
|
-
|
16
|
-
There is no evidence of the use of the system either in India or in international cartographic
|
17
|
-
products.
|
18
|
-
|
19
|
-
Marathi (Marāṭhī) uses the alphasyllabic script Devanāgarī.
|
20
|
-
|
21
|
-
notes:
|
22
|
-
- |
|
23
|
-
Additional characters (absent in Hindi):
|
24
|
-
ळ ḷa
|
25
|
-
ऍ ă (abbreviated: कॅ kă)
|
26
|
-
|
27
|
-
- |
|
28
|
-
Ligatures may be formed with r as the first component: 'ऱ्य': 'rya' 'ऱ्ह': 'rha'
|
29
|
-
- |
|
30
|
-
Typical are ligatures ending in h: न्ह nh, म्ह mh, ल्ह lh, व्ह vh.
|
31
|
-
- |
|
32
|
-
The following independent characters are sometimes used: अि i, अी ī, अु u, अू ū, अे e, अै ai.
|
33
|
-
|
34
|
-
tests:
|
35
|
-
- source: "परिपक्क"
|
36
|
-
expected: "paraipakka"
|
37
|
-
- source: "ठाणे - जिल्ह्यात बुधवारी एक हजार रुग्णांची वाढ, तर जणांच्या मृत्यूची नोंद"
|
38
|
-
expected: "ṭhaāṇae - jailhayaāta baudhavaāraī eka hajaāra raugṇaāṁchaī vaāḍha, tara jaṇaāṁchyaā maṛtyaūchaī naoṁda"
|
39
|
-
- source: "एकता कपूर पुन्हा अडकली वादात, वेबसीरिजमधल्या 'त्या' सीनमुळे जमावाची घरावर दगडफेक"
|
40
|
-
expected: "ekataā kapaūra paunhaā aḍakalaī vaādaāta, vaebasaīraijamadhalyaā 'tyaā' saīnamauḷae jamaāvaāchaī gharaāvara dagaḍaphaeka"
|
41
|
-
- source: "जाणून घ्या, बीएमसीच्या अधिकाऱ्यांनी कंगना राणौतच्या ऑफिसमधले नक्की काय- काय तोडलं"
|
42
|
-
expected: "jaāṇaūna ghyaā, baīemasaīchyaā adhaikaāryaāṁnaī kaṁganaā raāṇaautachyaā ôphaisamadhalae nakkaī kaāya- kaāya taoḍalaṁ"
|
43
|
-
- source: "कंगना मुंबईत दाखल होण्यापूर्वी 'मातोश्री'वरून फर्मान सुटले; प्रवक्त्यांना सक्त आदेश"
|
44
|
-
expected: "kaṁganaā mauṁbaīta daākhala haoṇyaāpaūrvaī 'maātaoshraī'varaūna pharmaāna sauṭalae; pravaktyaāṁnaā sakta ādaesha"
|
45
|
-
- source: "मराठा आरक्षणास तात्पुरती स्थगिती; सर्वोच्च न्यायालयाचा निर्णय"
|
46
|
-
expected: "maraāṭhaā ārakṣhaṇaāsa taātpaurataī sthagaitaī; sarvaochcha nyaāyaālayaāchaā nairṇaya"
|
47
|
-
- source: "भारताच्या तिन्ही लशींचा पहिला टप्पा यशस्वी, वाचा कधी येणार बाजारात"
|
48
|
-
expected: "bhaārataāchyaā tainhaī lashaīṁchaā pahailaā ṭappaā yashasvaī, vaāchaā kadhaī yaeṇaāra baājaāraāta"
|
49
|
-
- source: "रुग्णवाढीमुळे खाटांची चणचण"
|
50
|
-
expected: "raugṇavaāḍhaīmauḷae khaāṭaāṁchaī chaṇachaṇa"
|
51
|
-
- source: "पीएम स्वनिधी कर्ज योजनेला मुंबईतून अल्प प्रतिसाद"
|
52
|
-
expected: "paīema svanaidhaī karja yaojanaelaā mauṁbaītaūna alpa prataisaāda"
|
53
|
-
- source: "सांताक्रूझ-चेंबूर लिंक रोडवरील उन्नत मार्गाला स्थगिती"
|
54
|
-
expected: "saāṁtaākraūjha-chaeṁbaūra laiṁka raoḍavaraīla unnata maārgaālaā sthagaitaī"
|
55
|
-
- source: "संपादक अर्णब गोस्वामी यांच्याविरूद्ध खडक पोलिस ठाण्यात तक्रार"
|
56
|
-
expected: "saṁpaādaka arṇaba gaosvaāmaī yaāṁchyaāvairaūddha khaḍaka paolaisa ṭhaāṇyaāta takraāra"
|
57
|
-
- source: "करणाऱ्या मुलांना अनुक्रमे प्ले ग्रूप"
|
58
|
-
expected: "karaṇaāryaā maulaāṁnaā anaukramae plae graūpa"
|
59
|
-
- source: "राज्यातील शाळा दिवाळीपर्यंत बंद, मंत्र्यांच्या बैठकीत निर्णय, शिक्षकांची जबाबदारी वाढली"
|
60
|
-
expected: "raājyaātaīla shaāḷaā daivaāḷaīparyaṁta baṁda, maṁtryaāṁchyaā baaiṭhakaīta nairṇaya, shaikṣhakaāṁchaī jabaābadaāraī vaāḍhalaī"
|
61
|
-
|
62
|
-
map:
|
63
|
-
inherit: "un-hin-Deva-Latn-2016"
|
64
|
-
|
65
|
-
rules:
|
66
|
-
# note[3]
|
67
|
-
- pattern: (?<=)\U+0939(?=\b)
|
68
|
-
result: "h"
|
69
|
-
|
70
|
-
characters:
|
71
|
-
|
72
|
-
# Note 1
|
73
|
-
'ळ': 'ḷa'
|
74
|
-
'ऍ': 'ă'
|
75
|
-
|
76
|
-
# Note 2
|
77
|
-
'ऱ': 'r' # used for making Ligatures 'ऱ्य': 'rya' 'ऱ्ह': 'rha'
|
78
|
-
|
79
|
-
# Note 4
|
80
|
-
'अि': 'i'
|
81
|
-
'अी': 'ī'
|
82
|
-
'अु': 'u'
|
83
|
-
'अू': 'ū'
|
84
|
-
'अे': 'e'
|
85
|
-
'अै': 'ai'
|
86
|
-
|
87
|
-
'ॲ': 'ê'
|
88
|
-
'ऑ': 'ô'
|
89
|
-
|
90
|
-
|
91
|
-
|
@@ -1,264 +0,0 @@
|
|
1
|
-
---
|
2
|
-
authority_id: un
|
3
|
-
id: general-2013
|
4
|
-
language: iso-639-2:mon
|
5
|
-
source_script: Mong
|
6
|
-
destination_script: Latn
|
7
|
-
name: Mongolian Romanization in China, Version 4.0 (general)
|
8
|
-
url: http://www.eki.ee/wgrs/rom1_mnc.htm
|
9
|
-
creation_date: 2013-09
|
10
|
-
description: |
|
11
|
-
The United Nations resolution III/8 in 1977 recognized the Scheme for
|
12
|
-
a Chinese Phonetic Alphabet (Pinyin) as China’s official Roman alphabet
|
13
|
-
scheme and recommended the alphabet as the international system for the
|
14
|
-
romanization of Chinese geographical names. In China Mongolian
|
15
|
-
geographical names are transcribed directly from the Mongolian script
|
16
|
-
into Pinyin. The scheme was published in Toponymic Guidelines for Map
|
17
|
-
and Other Editors: China, 1982.
|
18
|
-
|
19
|
-
The system is used in China and in international cartographic
|
20
|
-
products.
|
21
|
-
|
22
|
-
Mongolian uses a vertical script. Transcription of Mongolian names is
|
23
|
-
made from their proper pronunciation based on the written form of the
|
24
|
-
Mongolian language and Qahar vernacular, with Zhenglan as its
|
25
|
-
representative pronunciation. Due to the complex nature of the script
|
26
|
-
the romanization scheme is not reversible, e.g. the name of the city
|
27
|
-
Hohhot is written ᠬᠥᠬᠡᠬᠣᠲᠠ but may be transliterated as kökeqota.
|
28
|
-
|
29
|
-
notes:
|
30
|
-
- The long and short Mongolian vowels are not distinguished in the
|
31
|
-
spelling for general use, but in recording the pronunciation of
|
32
|
-
place-names, the long vowel is represented by duplication.
|
33
|
-
- Where two Roman equivalents are given, the second (in brackets) is
|
34
|
-
used for recording the pronunciation of place-names while the first
|
35
|
-
form is for general use.
|
36
|
-
- In the table only word-initial character variants are shown.
|
37
|
-
Depending on the position in the word many variants of the characters
|
38
|
-
are used as well as some ligatures. These features are not covered here.
|
39
|
-
- For technical reasons the characters of the Mongolian script are
|
40
|
-
turned 90˚ anti-clockwise.
|
41
|
-
|
42
|
-
implementation_notes:
|
43
|
-
- A separated final form of vowels a or e is common, and can appear at the end
|
44
|
-
of a word, word stem, or suffix. This form requires a final-shaped preceding
|
45
|
-
consonant and an inter-word gap in between. The vowels themselves appear as ᠠ,
|
46
|
-
and with consonants as ᠬᠠ q‑a, ᠷᠠ r‑a/r‑e, etc. This gap can be transliterated
|
47
|
-
with a hyphen. In digital typesetting, these forms are triggered by inserting
|
48
|
-
a U+180E MONGOLIAN VOWEL SEPARATOR (HTML ᠎ · MVS) between the consonant
|
49
|
-
and vowel.
|
50
|
-
- All case suffixes, as well as any plural suffixes consisting of one or two
|
51
|
-
syllables are likewise separated by a preceding and hyphen-transliterated gap.
|
52
|
-
In digital typesetting, this gap is represented by a U+202F NARROW NO-BREAK SPACE
|
53
|
-
(HTML   · NNBSP). A maximum of two case suffixes can be added to a stem.
|
54
|
-
Single-letter vowel suffixes appear with the final-shaped forms of a/e, i, or u/ü,
|
55
|
-
as in ᠭᠠᠵᠠᠷ ᠠ γaǰar‑a 'to the country' and ᠡᠳᠦᠷ ᠡ edür‑e 'on the day', or ᠤᠯᠤᠰ ᠢ ulus‑i
|
56
|
-
'the state' etc. Multi-letter suffixes most often start with an initial- (consonants),
|
57
|
-
medial- (vowels), or variant-shaped form.
|
58
|
-
|
59
|
-
tests:
|
60
|
-
- source: ᠣᠷᠳᠣᠰ ᠬᠣᠲᠠ # Ордос хот
|
61
|
-
expected: ordos hota
|
62
|
-
- source: ᠪᠠᠶᠠᠨᠨᠠᠭᠤᠷ ᠬᠣᠲᠠ # Баяннуур хот
|
63
|
-
expected: bayannagur hota
|
64
|
-
- source: ᠤᠯᠠᠭᠠᠨᠬᠣᠲᠠ # Улаан хот
|
65
|
-
expected: ulaganhota
|
66
|
-
- source: ᠬᠣᠣᠯᠢᠠ ᠭᠣᠤᠯ ᠬᠣᠲᠠ # Хоолингол хот
|
67
|
-
expected: hoolia goul hota
|
68
|
-
- source: ᠡᠷᠢᠶᠡᠨ ᠬᠣᠲᠠ # Эрээн хот
|
69
|
-
expected: eriyen hota
|
70
|
-
- source: ᠷᠠᠰᠢᠶᠠᠨ ᠬᠣᠲᠠ # Рашаан хот
|
71
|
-
expected: rasiyan hota
|
72
|
-
- source: ᠪᠠᠭᠠᠷᠢᠨ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # Баарин баруун хошуу
|
73
|
-
expected: bagarin baragun hosigu
|
74
|
-
- source: ᠪᠠᠭᠠᠷᠢᠨ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # Баарин зүүн хошуу
|
75
|
-
expected: bagarin jegun hosigu
|
76
|
-
- source: ᠲᠦᠩᠯᠢᠶᠣᠤ ᠬᠣᠲᠠ # Байшинт хот
|
77
|
-
expected: tungliyou hota
|
78
|
-
- source: ᠰᠢᠯᠢ ᠶᠢᠨ ᠬᠣᠲᠠ # Шилийн хот
|
79
|
-
expected: sili-yin hota
|
80
|
-
- source: ᠬᠣᠷᠢᠨ ᠭᠡᠷ ᠰᠢᠶᠠᠨ # Horinger County
|
81
|
-
expected: horin ger siyan
|
82
|
-
- source: ᠤᠳᠠ ᠲᠣᠭᠣᠷᠢᠭ # Уда тойрог
|
83
|
-
expected: uda togorig
|
84
|
-
- source: ᠦᠬᠠᠢ ᠬᠣᠲᠠ # Үхай хот
|
85
|
-
expected: uhai hota
|
86
|
-
- source: ᠬᠠᠶᠢᠨᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Hainan District
|
87
|
-
expected: hayinan togorig
|
88
|
-
- source: ᠬᠠᠶᠢᠷᠤᠪ ᠤᠨ ᠲᠣᠬᠣᠢ ᠲᠣᠭᠣᠷᠢᠭ # Haibowan District
|
89
|
-
expected: hayirub-un tohoi togorig
|
90
|
-
- source: ᠤᠯᠠᠭᠠᠨᠴᠠᠪ ᠬᠣᠲᠠ # Улаанцав хот
|
91
|
-
expected: ulaganqab hota
|
92
|
-
- source: ᠵᠢᠨᠢᠩ ᠲᠣᠭᠣᠷᠢᠭ # Жинин тойрог
|
93
|
-
expected: jining togorig
|
94
|
-
- source: ᠹᠸᠩᠵᠸᠡ ᠬᠣᠲᠠ # Фенжень хот
|
95
|
-
expected: fwngjwe hota
|
96
|
-
- source: ᠵᠦᠸᠧᠽᠢ ᠰᠢᠶᠠᠨ # Zhuozi County
|
97
|
-
expected: juwezi siyan
|
98
|
-
- source: ᠬᠤᠸᠠᠳᠧ ᠰᠢᠶᠠᠨ # Huade County
|
99
|
-
expected: huwade siyan
|
100
|
-
- source: ᠱᠠᠩᠳᠤ ᠰᠢᠶᠠᠨ # Шанду шянь
|
101
|
-
expected: xangdu siyan
|
102
|
-
- source: ᠰᠢᠩᠾᠧ ᠰᠢᠶᠠᠨ # Шинхэ шянь
|
103
|
-
expected: singhe siyan
|
104
|
-
- source: ᠯᠢᠶᠠᠩᠴᠠᠩ ᠰᠢᠶᠠᠨ # Liangcheng County
|
105
|
-
expected: liyangqang siyan
|
106
|
-
- source: ᠴᠠᠬᠠᠷ ᠪᠠᠷᠠᠭᠤᠨ ᠭᠠᠷᠤᠨ ᠡᠮᠦᠨᠡᠳᠦ ᠬᠣᠰᠢᠭᠤ # Цахар баруун гарын өмнөд хошуу
|
107
|
-
expected: qahar baragun garun emunedu hosigu
|
108
|
-
- source: ᠴᠠᠬᠠᠷ ᠪᠠᠷᠠᠭᠤᠨ ᠭᠠᠷᠤᠨ ᠳᠤᠮᠳᠠᠳᠤ ᠬᠣᠰᠢᠭᠤ # Цахар баруун гарын дундад хошуу
|
109
|
-
expected: qahar baragun garun dumdadu hosigu
|
110
|
-
- source: ᠴᠠᠬᠠᠷ ᠪᠠᠷᠠᠭᠤᠨ ᠭᠠᠷᠤᠨ ᠬᠣᠶᠢᠲᠤ ᠬᠣᠰᠢᠭᠤ # Цахар баруун гарын хойд хошуу
|
111
|
-
expected: qahar baragun garun hoyitu hosigu
|
112
|
-
- source: ᠳᠥᠷᠪᠡᠳ ᠬᠣᠰᠢᠭᠤ # Дөрвөд хошуу
|
113
|
-
expected: dorbed hosigu
|
114
|
-
- source: ᠪᠤᠭᠤᠲᠤ ᠬᠣᠲᠠ # Бугaт хот
|
115
|
-
expected: bugutu hota
|
116
|
-
- source: ᠬᠥᠨᠳᠡᠯᠡᠨ ᠲᠣᠭᠣᠷᠢᠭ # Hondlon District
|
117
|
-
expected: hondelen togorig
|
118
|
-
- source: ᠳᠦᠩᠾᠧ ᠲᠣᠭᠣᠷᠢᠭ # Donghe District
|
119
|
-
expected: dunghe togorig
|
120
|
-
- source: ᠴᠢᠩᠱᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Qingshan District
|
121
|
-
expected: qingxan togorig
|
122
|
-
- source: ᠰᠢᠭᠤᠶᠢᠲᠤ ᠲᠣᠭᠣᠷᠢᠭ # Шигуай тойрог
|
123
|
-
expected: siguyitu togorig
|
124
|
-
- source: ᠵᠢᠦ ᠶᠤᠸᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Jiuyuan District
|
125
|
-
expected: jiu yuwan togorig
|
126
|
-
- source: ᠭᠦᠶᠠᠩ ᠰᠢᠶᠠᠨ # Guyang County
|
127
|
-
expected: guyang siyan
|
128
|
-
- source: ᠲᠦᠮᠡᠳ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # Түмэд Зүүн хошуу
|
129
|
-
expected: tumed jegun hosigu
|
130
|
-
- source: ᠲᠦᠮᠡᠳ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # Түмэд Баруун хошуу
|
131
|
-
expected: tumed baragun hosigu
|
132
|
-
- source: ᠳᠠᠷᠬᠠᠨ ᠮᠤᠤᠮᠢᠩᠭ᠋ᠠᠨ ᠬᠣᠯᠪᠣᠭᠠᠲᠤ ᠬᠣᠰᠢᠭᠤ # Darhan Muminggan United Banner
|
133
|
-
expected: darhan muumingg᠋an holbogatu hosigu
|
134
|
-
- source: ᠬᠡᠰᠢᠭᠲᠡᠨ ᠬᠣᠰᠢᠭᠤ # Hexigten Banner
|
135
|
-
expected: hesigten hosigu
|
136
|
-
- source: ᠰᠢᠨᠡ ᠪᠠᠷᠭᠤ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # New Barag Left Banner
|
137
|
-
expected: sin-e bargu jegun hosigu
|
138
|
-
- source: ᠰᠢᠨᠡ ᠪᠠᠷᠭᠤ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # New Barag Right Banner
|
139
|
-
expected: sin-e bargu baragun hosigu
|
140
|
-
- source: ᠣᠲᠣᠭ ᠬᠣᠰᠢᠭᠤ # Otog Banner
|
141
|
-
expected: otog hosigu
|
142
|
-
- source: ᠳ᠋ᠦᠩᠱᠧᠩ ᠲᠣᠭᠣᠷᠢᠭ # Dongsheng District
|
143
|
-
expected: d᠋ungxeng togorig
|
144
|
-
- source: ᠳᠠᠯᠠᠳ ᠬᠣᠰᠢᠭᠤ # Dalad Banner
|
145
|
-
expected: dalad hosigu
|
146
|
-
- source: ᠵᠡᠭᠦᠨᠭᠠᠷ ᠬᠣᠰᠢᠭᠤ # Jungar Banner
|
147
|
-
expected: jegungar hosigu
|
148
|
-
- source: ᠣᠲᠣᠭ ᠤᠨ ᠡᠮᠦᠨᠡᠳᠦ ᠬᠣᠰᠢᠭᠤ # Otog Front Banner
|
149
|
-
expected: otog-un emunedu hosigu
|
150
|
-
- source: ᠬᠠᠩᠭᠢᠨ ᠬᠣᠰᠢᠭᠤ # Hanggin Banner
|
151
|
-
expected: hanggin hosigu
|
152
|
-
- source: ᠦᠦᠰᠢᠨ ᠬᠣᠰᠢᠭᠤ # Uxin Banner
|
153
|
-
expected: uusin hosigu
|
154
|
-
- source: ᠡᠵᠢᠨ ᠬᠣᠷᠣᠭᠠ ᠬᠣᠰᠢᠭᠤ # Эзэн Хороо хошуу
|
155
|
-
expected: ejin horog-a hosigu
|
156
|
-
- source: ᠵᠠᠯᠠᠨ ᠠᠢ᠌ᠯ ᠬᠣᠲᠠ # Жалан-Айл хот
|
157
|
-
expected: jalan ai᠌l hota
|
158
|
-
- source: ᠶᠠᠭᠰᠢ ᠬᠣᠲᠠ # Ягши хот
|
159
|
-
expected: yagsi hota
|
160
|
-
- source: ᠮᠠᠨᠵᠤᠤᠷ ᠬᠣᠲᠠ # Манжуур хот
|
161
|
-
expected: manjuur hota
|
162
|
-
- source: ᠬᠠᠶᠢᠯᠠᠷ ᠲᠣᠭᠣᠷᠢᠭ # Хайлаар тойрог
|
163
|
-
expected: hayilar togorig
|
164
|
-
- source: ᠬᠣᠷᠴᠢᠨ ᠲᠣᠭᠣᠷᠢᠭ # Horqin District
|
165
|
-
expected: horqin togorig
|
166
|
-
- source: ᠺᠠᠶᠢᠯᠦ ᠰᠢᠶᠠᠨ # Kailu County
|
167
|
-
expected: kayilu siyan
|
168
|
-
- source: ᠬᠦᠷᠢᠶᠡ ᠬᠣᠰᠢᠭᠤ # Hure Banner
|
169
|
-
expected: huriy-e hosigu
|
170
|
-
- source: ᠨᠠᠢᠮᠠᠨ ᠬᠣᠰᠢᠭᠤ # Naiman Banner
|
171
|
-
expected: naiman hosigu
|
172
|
-
- source: ᠵᠠᠷᠤᠳ ᠬᠣᠰᠢᠭᠤ # Jarud Banner
|
173
|
-
expected: jarud hosigu
|
174
|
-
- source: ᠬᠣᠷᠴᠢᠨ ᠪᠠᠷᠠᠭᠤᠨ ᠭᠠᠷᠤᠨ ᠳᠤᠮᠳᠠᠳᠤ ᠬᠣᠰᠢᠭᠤ # Хорчин Баруун Гарын Дундад Хошуу
|
175
|
-
expected: horqin baragun garun dumdadu hosigu
|
176
|
-
- source: ᠬᠣᠷᠴᠢᠨ ᠵᠡᠭᠦᠨ ᠭᠠᠷᠤᠨ ᠳᠤᠮᠳᠠᠳᠤ ᠬᠣᠰᠢᠭᠤ # Horqin Left Middle Banner
|
177
|
-
expected: horqin jegun garun dumdadu hosigu
|
178
|
-
- source: ᠬᠣᠷᠴᠢᠨ ᠵᠡᠭᠦᠨ ᠭᠠᠷᠤᠨ ᠬᠣᠶᠢᠲᠤ ᠬᠣᠰᠢᠭᠤ # Horqin Left Rear Banner
|
179
|
-
expected: horqin jegun garun hoyitu hosigu
|
180
|
-
- source: ᠤᠯᠠᠭᠠᠨᠬᠠᠳᠠ ᠬᠣᠲᠠ # Улаанхад хот
|
181
|
-
expected: ulaganhada hota
|
182
|
-
- source: ᠰᠡᠷᠡᠴᠢ # Salaqi
|
183
|
-
expected: sereqi
|
184
|
-
- source: ᠭᠡᠭᠡᠨ ᠭᠣᠤᠯ ᠬᠣᠲᠠ # Гэгээнгол хот
|
185
|
-
expected: gegen goul hota
|
186
|
-
- source: ᠠᠯᠠᠱᠠ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # Alxa Left Banner
|
187
|
-
expected: alaxa jegun hosigu
|
188
|
-
- source: ᠠᠯᠠᠱᠠ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # Alxa Right Banner
|
189
|
-
expected: alaxa baragun hosigu
|
190
|
-
- source: ᠡᠵᠡᠨᠡ ᠬᠣᠰᠢᠭᠤ # Ejin Banner
|
191
|
-
expected: ejen-e hosigu
|
192
|
-
- source: ᠬᠥᠪᠡᠭᠡᠲᠦ ᠰᠢᠷᠠ ᠬᠣᠰᠢᠭᠤ # Хөвөөт Шар хошуу
|
193
|
-
expected: hobegetu sir-a hosigu
|
194
|
-
- source: ᠦᠶᠤᠸᠠᠨ ᠰᠢᠶᠠᠨ # Үюань шянь
|
195
|
-
expected: uyuwan siyan
|
196
|
-
- source: ᠦᠴᠤᠸᠠᠨ ᠰᠢᠶᠠᠨ # Wuchuan County
|
197
|
-
expected: uquwan siyan
|
198
|
-
- source: ᠲᠦᠴᠢᠤᠸᠠᠨ ᠰᠢᠶᠠᠨ # Тучуань шянь
|
199
|
-
expected: tuqiuwan siyan
|
200
|
-
- source: ᠨᠢᠩᠴᠧᠩ ᠰᠢᠶᠠᠨ # Ningcheng County
|
201
|
-
expected: ningqeng siyan
|
202
|
-
- source: ᠯᠢᠨᠰᠢ ᠰᠢᠶᠠᠨ # Linxi County
|
203
|
-
expected: linsi siyan
|
204
|
-
- source: ᠯᠢᠨᠾᠧ ᠲᠣᠭᠣᠷᠢᠭ # Linhe
|
205
|
-
expected: linhe togorig
|
206
|
-
- source: ᠬᠠᠷᠠᠴᠢᠨ ᠬᠣᠰᠢᠭᠤ # Harqin Banner
|
207
|
-
expected: haraqin hosigu
|
208
|
-
- source: ᠳ᠋ᠧᠩᠺᠧᠦ ᠰᠢᠶᠠᠨ # Dengkou County
|
209
|
-
expected: d᠋engkeu siyan
|
210
|
-
- source: ᠠᠤᠬᠠᠨ ᠬᠣᠰᠢᠭᠤ # Aohan Banner
|
211
|
-
expected: auhan hosigu
|
212
|
-
- source: ᠴᠢᠩ ᠱᠦᠢ ᠾᠧ ᠰᠢᠶᠠᠨ # Qingshuihe County
|
213
|
-
expected: qing xui he siyan
|
214
|
-
- source: ᠬᠣᠳᠣᠩ ᠠᠷᠠᠳ ᠤᠨ ᠲᠣᠭᠣᠷᠢᠭ # Huimin District
|
215
|
-
expected: hodong arad-un togorig
|
216
|
-
- source: ᠰᠠᠶᠢᠬᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Saihan District
|
217
|
-
expected: sayihan togorig
|
218
|
-
- source: ᠰᠢᠨᠡ ᠬᠣᠲᠠ ᠲᠣᠭᠣᠷᠢᠭ # Xincheng District
|
219
|
-
expected: sin-e hota togorig
|
220
|
-
- source: ᠬᠠᠶᠢᠷᠤᠪ ᠤᠨ ᠲᠣᠬᠣᠢ ᠲᠣᠭᠣᠷᠢᠭ # Haibowan (Hairibin Tohoi) District
|
221
|
-
expected: hayirub-un tohoi togorig
|
222
|
-
- source: ᠰᠦᠩ ᠱᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Songshan District
|
223
|
-
expected: sung xan togorig
|
224
|
-
- source: ᠬᠦᠩ ᠱᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Hongshan District
|
225
|
-
expected: hung xan togorig
|
226
|
-
- source: ᠠᠷᠤᠨ ᠬᠣᠰᠢᠭᠤ # Арун хошуу
|
227
|
-
expected: arun hosigu
|
228
|
-
- source: ᠶᠤᠸᠠᠨ ᠪᠣᠣ ᠱᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Юаньбаошань тойрог
|
229
|
-
expected: yuwan boo xan togorig
|
230
|
-
- source: ᠰᠢᠯᠤᠭᠤᠨ ᠬᠥᠪᠡᠭᠡᠲᠦ ᠴᠠᠭᠠᠨ ᠬᠣᠰᠢᠭᠤ # Шулуун Хөвөөт Цагаан хошуу
|
231
|
-
expected: silugun hobegetu qagan hosigu
|
232
|
-
- source: ᠰᠢᠯᠤᠭᠤᠨ ᠬᠥᠬᠡ ᠬᠣᠰᠢᠭᠤ # Шулуун хөх хошуу
|
233
|
-
expected: silugun hohe hosigu
|
234
|
-
- source: ᠤᠷᠠᠳ ᠤᠨ ᠳᠤᠮᠳᠠᠳᠤ ᠬᠣᠰᠢᠭᠤ # Урадын Дундад Хошуу
|
235
|
-
expected: urad-un dumdadu hosigu
|
236
|
-
- source: ᠤᠷᠠᠳ ᠤᠨ ᠡᠮᠦᠨᠡᠳᠦ ᠬᠣᠰᠢᠭᠤ # Урадын Өмнөд Хошуу
|
237
|
-
expected: urad-un emunedu hosigu
|
238
|
-
- source: ᠲᠣᠭᠲᠠᠬᠤ ᠰᠢᠶᠠᠨ # Тогтох шянь
|
239
|
-
expected: togtahu siyan
|
240
|
-
- source: ᠲᠠᠶᠢᠫᠤᠰᠧ ᠬᠣᠰᠢᠭᠤ # Тайвас хошуу
|
241
|
-
expected: tayipuse hosigu
|
242
|
-
- source: ᠰᠥᠨᠡᠳ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # Sonid Left Banner
|
243
|
-
expected: soned jegun hosigu
|
244
|
-
- source: ᠰᠥᠨᠡᠳ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # Sonid Right Banner
|
245
|
-
expected: soned baragun hosigu
|
246
|
-
- source: ᠣᠩᠨᠢᠭᠤᠳ ᠬᠣᠰᠢᠭᠤ # Ongniud Banner
|
247
|
-
expected: ongnigud hosigu
|
248
|
-
- source: ᠵᠠᠯᠠᠢᠳ ᠬᠣᠰᠢᠭᠤ # Jalaid Banner
|
249
|
-
expected: jalaid hosigu
|
250
|
-
- source: ᠬᠠᠩᠭᠢᠨ ᠬᠣᠶᠢᠲᠤ ᠬᠣᠰᠢᠭᠤ # Hanggin Rear Banner
|
251
|
-
expected: hanggin hoyitu hosigu
|
252
|
-
- source: ᠵᠡᠭᠦᠨ ᠤᠵᠤᠮᠤᠴᠢᠨ ᠬᠣᠰᠢᠭᠤ # East Ujimqin Banner
|
253
|
-
expected: jegun ujumuqin hosigu
|
254
|
-
- source: ᠠᠷᠤ ᠬᠣᠷᠴᠢᠨ ᠬᠣᠰᠢᠭᠤ # Ar Horqin Banner
|
255
|
-
expected: aru horqin hosigu
|
256
|
-
- source: ᠠᠪᠠᠭᠠ ᠬᠣᠰᠢᠭᠤ # Abag Banner
|
257
|
-
expected: abag-a hosigu
|
258
|
-
- source: ᠪᠤᠷᠢᠶᠠᠳ # Буриад
|
259
|
-
expected: buriyad
|
260
|
-
- source: ᠤᠯᠠᠭᠠᠨᠪᠠᠭᠠᠲᠤᠷ # Улаанбаатар
|
261
|
-
expected: ulaganbagatur
|
262
|
-
|
263
|
-
map:
|
264
|
-
inherit: sasm-mon-Mong-Latn-general-1978
|