interscript 0.1.2 → 0.1.7
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/README.adoc +250 -17
- data/lib/g2pwrapper.py +34 -0
- data/lib/interscript.rb +142 -20
- data/lib/interscript/command.rb +28 -0
- data/lib/interscript/fs.rb +69 -0
- data/lib/interscript/mapping.rb +142 -0
- data/lib/interscript/opal.rb +57 -0
- data/lib/interscript/opal/entrypoint.rb +12 -0
- data/lib/interscript/opal/map_translate.rb +7 -0
- data/lib/interscript/opal/maps.js.erb +10 -0
- data/lib/interscript/version.rb +1 -1
- data/lib/model-7 +0 -0
- data/lib/tha-pt-b-7 +0 -0
- data/maps/acadsin-zho-Hani-Latn-2002.yaml +38916 -0
- data/maps/alalc-amh-Ethi-Latn-1997.yaml +513 -0
- data/maps/alalc-amh-Ethi-Latn-2011.yaml +138 -0
- data/maps/alalc-ara-Arab-Latn-1997.yaml +1287 -0
- data/maps/alalc-asm-Deva-Latn-1997.yaml +165 -0
- data/maps/alalc-asm-Deva-Latn-2012.yaml +40 -0
- data/maps/alalc-aze-Cyrl-Latn-1997.yaml +145 -0
- data/maps/alalc-bel-Cyrl-Latn-1997.yaml +129 -0
- data/maps/alalc-ben-Beng-Latn-2017.yaml +130 -0
- data/maps/alalc-bul-Cyrl-Latn-1997.yaml +98 -0
- data/maps/alalc-ell-Grek-Latn-1997.yaml +628 -0
- data/maps/alalc-ell-Grek-Latn-2010.yaml +626 -0
- data/maps/alalc-guj-Gujr-Latn-1997.yaml +266 -0
- data/maps/alalc-guj-Gujr-Latn-2011.yaml +64 -0
- data/maps/alalc-hin-Deva-Latn-1997.yaml +211 -0
- data/maps/alalc-hin-Deva-Latn-2011.yaml +47 -0
- data/maps/alalc-kat-Geok-Latn-1997.yaml +111 -0
- data/maps/alalc-kat-Geor-Latn-1997.yaml +150 -0
- data/maps/alalc-kor-Hang-Latn-1997.yaml +98 -0
- data/maps/alalc-mal-Mlym-Latn-1997.yaml +303 -0
- data/maps/alalc-mal-Mlym-Latn-2012.yaml +73 -0
- data/maps/alalc-mar-Deva-Latn-1997.yaml +189 -0
- data/maps/alalc-mar-Deva-Latn-2011.yaml +45 -0
- data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +114 -0
- data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +103 -0
- data/maps/alalc-mon-Cyrl-Latn-1997.yaml +220 -0
- data/maps/alalc-pan-Guru-Latn-1997.yaml +256 -0
- data/maps/alalc-pan-Guru-Latn-2011.yaml +78 -0
- data/maps/alalc-per-Arab-Latn-1997.yaml +375 -0
- data/maps/alalc-pli-Deva-Latn-2012.yaml +144 -0
- data/maps/alalc-pra-Deva-Latn-2012.yaml +47 -0
- data/maps/alalc-rus-Cyrl-Latn-1997.yaml +225 -0
- data/maps/alalc-rus-Cyrl-Latn-2012.yaml +162 -0
- data/maps/alalc-san-Deva-Latn-2012.yaml +172 -0
- data/maps/alalc-sin-Sinh-Latn-1997.yaml +292 -0
- data/maps/alalc-sin-Sinh-Latn-2011.yaml +71 -0
- data/maps/alalc-srp-Cyrl-Latn-1997.yaml +118 -0
- data/maps/alalc-srp-Cyrl-Latn-2013.yaml +135 -0
- data/maps/alalc-tam-Taml-Latn-1997.yaml +62 -0
- data/maps/alalc-tam-Taml-Latn-2011.yaml +58 -0
- data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +145 -0
- data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +16 -0
- data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +283 -0
- data/maps/{bas-rus-Cyrl-Latn-bss.yaml → bas-rus-Cyrl-Latn-2017-bss.yaml} +58 -33
- data/maps/{bas-rus-Cyrl-Latn-oss.yaml → bas-rus-Cyrl-Latn-2017-oss.yaml} +55 -35
- data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +292 -0
- data/maps/bgn-kor-Hang-Latn-1943.yaml +35 -0
- data/maps/bgn-kor-Kore-Latn-1943.yaml +31 -0
- data/maps/bgna-bul-Cyrl-Latn-2006.yaml +208 -0
- data/maps/bgna-bul-Cyrl-Latn-2009.yaml +208 -0
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +532 -0
- data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +596 -0
- data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +2 -3
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +104 -0
- data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +188 -0
- data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +289 -0
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +119 -0
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +15 -65
- data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +184 -0
- data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +705 -0
- data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +23 -0
- data/maps/{bgnpcgn-per-Arab-Latn-1956.yaml → bgnpcgn-fas-Arab-Latn-1956.yaml} +5 -2
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +257 -0
- data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +131 -0
- data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +42 -0
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +253 -0
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +48 -0
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +48 -0
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +163 -0
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +190 -0
- data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +223 -0
- data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +230 -0
- data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +336 -0
- data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +639 -0
- data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +459 -0
- data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +168 -0
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +150 -65
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +170 -0
- data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +220 -0
- data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +240 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +80 -4
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +119 -0
- data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +127 -0
- data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +82 -0
- data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +7456 -0
- data/maps/bis-asm-Beng-Latn-13194-1991.yaml +159 -0
- data/maps/bis-ben-Beng-Latn-13194-1991.yaml +156 -0
- data/maps/bis-dev-Deva-Latn-13194-1991.yaml +184 -0
- data/maps/bis-guj-Gujr-Latn-13194-1991.yaml +181 -0
- data/maps/bis-knd-Knda-Latn-13194-1991.yaml +173 -0
- data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +176 -0
- data/maps/bis-ori-Orya-Latn-13194-1991.yaml +160 -0
- data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +175 -0
- data/maps/bis-tel-Telu-Latn-13194-1991.yaml +170 -0
- data/maps/bis-tml-Taml-Latn-13194-1991.yaml +155 -0
- data/maps/by-bel-Cyrl-Latn-1998.yaml +172 -0
- data/maps/by-bel-Cyrl-Latn-2007.yaml +115 -0
- data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +899 -0
- data/maps/din-hin-Deva-Latn-33904-2018.yaml +100 -0
- data/maps/din-kat-Geor-Latn-32707-2010.yaml +145 -0
- data/maps/din-mar-Deva-Latn-33904-2018.yaml +84 -0
- data/maps/din-nep-Deva-Latn-33904-2018.yaml +119 -0
- data/maps/din-pli-Deva-Latn-33904-2018.yaml +75 -0
- data/maps/din-pra-Deva-Latn-33904-2018.yaml +63 -0
- data/maps/din-san-Deva-Latn-33904-2018.yaml +338 -0
- data/maps/din-tam-Taml-Latn-33903-2016.yaml +213 -0
- data/maps/dos-nep-Deva-Latn-1997.yaml +47 -0
- data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +684 -0
- data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +680 -0
- data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +19 -0
- data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +31 -0
- data/maps/ggg-kat-Geor-Latn-2002.yaml +92 -0
- data/maps/gki-bel-Cyrl-Latn-1992.yaml +33 -0
- data/maps/gki-bel-Cyrl-Latn-2000.yaml +201 -0
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +190 -0
- data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +157 -0
- data/maps/hk-yue-Hani-Latn-1888.yaml +38497 -0
- data/maps/icao-bel-Cyrl-Latn-9303.yaml +109 -98
- data/maps/icao-bul-Cyrl-Latn-9303.yaml +2 -7
- data/maps/{icao-per-Arab-Latn-9303.yaml → icao-fas-Arab-Latn-9303.yaml} +6 -8
- data/maps/icao-heb-Hebr-Latn-9303.yaml +119 -125
- data/maps/icao-mkd-Cyrl-Latn-9303.yaml +2 -3
- data/maps/icao-rus-Cyrl-Latn-9303.yaml +2 -4
- data/maps/icao-srp-Cyrl-Latn-9303.yaml +2 -3
- data/maps/icao-ukr-Cyrl-Latn-9303.yaml +2 -4
- data/maps/iso-ara-Arab-Latn-233-1984.yaml +323 -0
- data/maps/iso-asm-Beng-Latn-15919-2001.yaml +75 -0
- data/maps/iso-ben-Beng-Latn-15919-2001.yaml +175 -0
- data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +613 -0
- data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +44 -0
- data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +220 -0
- data/maps/iso-hin-Deva-Latn-15919-2001.yaml +87 -0
- data/maps/iso-inc-Deva-Latn-15919-2001.yaml +61 -0
- data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +66 -0
- data/maps/iso-kan-Knda-Latn-15919-2001.yaml +220 -0
- data/maps/iso-kat-Geor-Latn-9984-1996.yaml +145 -0
- data/maps/iso-kor-Hang-Latn-1996-method1.yaml +240 -0
- data/maps/iso-kor-Hang-Latn-1996-method2.yaml +226 -0
- data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +281 -0
- data/maps/iso-mar-Deva-Latn-15919-2001.yaml +75 -0
- data/maps/iso-nep-Deva-Latn-15919-2001.yaml +87 -0
- data/maps/iso-ori-Orya-Latn-15919-2001.yaml +193 -0
- data/maps/iso-pan-Guru-Latn-15919-2001.yaml +222 -0
- data/maps/iso-pli-Beng-Latn-15919-2001.yaml +73 -0
- data/maps/iso-pli-Deva-Latn-15919-2001.yaml +74 -0
- data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +219 -0
- data/maps/iso-pli-Thai-Latn-15919-2001.yaml +55 -0
- data/maps/iso-pra-Deva-Latn-15919-2001.yaml +59 -0
- data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +366 -0
- data/maps/{iso-rus-Cyrl-Latn-iso9.yaml → iso-rus-Cyrl-Latn-9-1995.yaml} +4 -6
- data/maps/iso-san-Deva-Latn-15919-2001.yaml +220 -0
- data/maps/iso-tam-Taml-Latn-15919-2001.yaml +159 -0
- data/maps/iso-tel-Telu-Latn-15919-2001.yaml +220 -0
- data/maps/iso-tha-Thai-Latn-11940-1998.yaml +109 -0
- data/maps/kp-kor-Hang-Latn-2002.yaml +909 -0
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +44820 -0
- data/maps/mext-jpn-Hrkt-Latn-1954.yaml +411 -0
- data/maps/mns-mon-Cyrl-Latn-5217-2012.yaml +163 -0
- data/maps/mns-mon-Latn-Cyrl-5217-2012.yaml +200 -0
- data/maps/moct-kor-Hang-Latn-2000.yaml +807 -0
- data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +541 -0
- data/maps/mvd-bel-Cyrl-Latn-2008.yaml +225 -0
- data/maps/mvd-bel-Cyrl-Latn-2010.yaml +63 -0
- data/maps/mvd-rus-Cyrl-Latn-2008.yaml +109 -0
- data/maps/mvd-rus-Cyrl-Latn-2010.yaml +37 -0
- data/maps/odni-ara-Arab-Latn-2015.yaml +425 -0
- data/maps/odni-aze-Cyrl-Latn-2015.yaml +144 -0
- data/maps/odni-bel-Cyrl-Latn-2015.yaml +148 -0
- data/maps/odni-bul-Cyrl-Latn-2015.yaml +96 -0
- data/maps/odni-che-Cyrl-Latn-2015.yaml +169 -0
- data/maps/odni-fas-Arab-Latn-2015.yaml +406 -0
- data/maps/odni-hin-Deva-Latn-2015.yaml +258 -0
- data/maps/odni-kat-Geor-Latn-2015.yaml +87 -0
- data/maps/odni-kaz-Cyrl-Latn-2015.yaml +148 -0
- data/maps/odni-kir-Cyrl-Latn-2015.yaml +136 -0
- data/maps/odni-kor-Hang-Latn-2015.yaml +375 -0
- data/maps/odni-mkd-Cyrl-Latn-2015.yaml +122 -0
- data/maps/odni-per-Arab-Latn-2015.yaml +228 -0
- data/maps/odni-rus-Cyrl-Latn-2015.yaml +77 -0
- data/maps/odni-srp-Cyrl-Latn-2015.yaml +129 -0
- data/maps/odni-tat-Cyrl-Latn-2015.yaml +142 -0
- data/maps/odni-tgk-Cyrl-Latn-2015.yaml +148 -0
- data/maps/odni-uig-Cyrl-Latn-2015.yaml +138 -0
- data/maps/odni-ukr-Cyrl-Latn-2015.yaml +157 -0
- data/maps/odni-urd-Arab-Latn-2015.yaml +221 -0
- data/maps/odni-uzb-Cyrl-Latn-2015.yaml +166 -0
- data/maps/royin-tha-Thai-Latn-1939-generic.yaml +90 -0
- data/maps/royin-tha-Thai-Latn-1968.yaml +183 -0
- data/maps/royin-tha-Thai-Latn-1999-chained.yaml +180 -0
- data/maps/royin-tha-Thai-Latn-1999.yaml +80 -0
- data/maps/{cn-chn-Hans-Latn-pinyin.yaml → sac-zho-Hans-Latn-1979.yaml} +11 -8
- data/maps/sasm-mon-Mong-Latn-general-1978.yaml +389 -0
- data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +354 -0
- data/maps/ses-ara-Arab-Latn-1930.yaml +283 -0
- data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +222 -0
- data/maps/ua-ukr-Cyrl-Latn-1996.yaml +197 -0
- data/maps/ua-ukr-Cyrl-Latn-2007.yaml +75 -0
- data/maps/ua-ukr-Cyrl-Latn-2010.yaml +192 -0
- data/maps/un-amh-Ethi-Latn-2016.yaml +602 -0
- data/maps/un-ara-Arab-Latn-1971.yaml +139 -0
- data/maps/un-ara-Arab-Latn-1972.yaml +159 -0
- data/maps/un-ara-Arab-Latn-2017.yaml +420 -0
- data/maps/un-bel-Cyrl-Latn-2007.yaml +114 -0
- data/maps/un-ben-Beng-Latn-2016.yaml +534 -0
- data/maps/un-ell-Grek-Latn-1987-phonetic.yaml +780 -0
- data/maps/un-ell-Grek-Latn-1987-tl.yaml +31 -0
- data/maps/un-ell-Grek-Latn-1987-ts.yaml +19 -0
- data/maps/un-hin-Deva-Latn-2016.yaml +222 -0
- data/maps/un-mar-Deva-Latn-2016.yaml +91 -0
- data/maps/un-mon-Mong-Latn-general-2013.yaml +264 -0
- data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +264 -0
- data/maps/un-nep-Deva-Latn-1972.yaml +350 -0
- data/maps/un-nep-Deva-Latn-2013.yaml +74 -0
- data/maps/un-rus-Cyrl-Latn-1987.yaml +166 -0
- data/maps/un-ukr-Cyrl-Latn-1998.yaml +53 -0
- data/maps/un-ukr-Cyrl-Latn-2012.yaml +162 -0
- data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +221 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +406 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +386 -0
- data/maps/var-kor-Hang-Hang-jamo.yaml +11193 -0
- data/maps/var-kor-Hang-Latn-mr-1939.yaml +1054 -0
- data/maps/var-kor-Kore-Hang-2013.yaml +59754 -0
- data/maps/var-kor-Kore-Latn-mr-1939.yaml +36 -0
- data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +43 -0
- data/maps/var-mon-Mong-Latn-1930.yaml +102 -0
- data/maps/var-mon-Mong-Latn-lessing.yaml +272 -0
- data/maps/var-mon-Mong-Latn-vpmc.yaml +274 -0
- data/maps/var-pra-Deva-Latn-iast-1912.yaml +30 -0
- data/maps/var-san-Deva-Latn-iast-1912.yaml +149 -0
- data/maps/var-tha-Thai-Thai-phonemic.yaml +59 -0
- data/maps/var-tha-Thai-Zsym-ipa.yaml +301 -0
- data/maps/var-zho-Hani-Latn-wd-1979.yaml +38912 -0
- data/spec/interscript/filenames_spec.rb +384 -0
- data/spec/interscript/mapping_spec.rb +42 -0
- data/spec/interscript_spec.rb +23 -5
- data/spec/spec_helper.rb +3 -1
- metadata +364 -34
- data/bin/interscript +0 -20
- data/bin/rspec +0 -29
- data/maps/bgnpcgn-chn-Hans-Latn-pinyin.yaml +0 -7503
- data/maps/historic-jpn-Hrkt-Latn-hepburn.yaml +0 -336
- data/maps/icao-gre-Grek-Latn-9303.yaml +0 -101
- data/maps/mext-jpn-Hrkt-Latn-hepburn.yaml +0 -330
- data/maps/mext-jpn-Hrkt-Latn-kunrei.yaml +0 -308
- data/maps/un-jpn-Hrkt-Latn-hepburn.yaml +0 -313
- data/maps/un-jpn-Hrkt-Latn-kunrei.yaml +0 -354
- data/maps/un-mon-Mong-Latn-2013.yaml +0 -80
@@ -0,0 +1,264 @@
|
|
1
|
+
---
|
2
|
+
authority_id: un
|
3
|
+
id: phonetic-2013
|
4
|
+
language: iso-639-2:mon
|
5
|
+
source_script: Mong
|
6
|
+
destination_script: Latn
|
7
|
+
name: Mongolian Romanization in China, Version 4.0 (phonetic)
|
8
|
+
url: http://www.eki.ee/wgrs/rom1_mnc.htm
|
9
|
+
creation_date: 2013-09
|
10
|
+
description: |
|
11
|
+
The United Nations resolution III/8 in 1977 recognized the Scheme for
|
12
|
+
a Chinese Phonetic Alphabet (Pinyin) as China’s official Roman alphabet
|
13
|
+
scheme and recommended the alphabet as the international system for the
|
14
|
+
romanization of Chinese geographical names. In China, Mongolian
|
15
|
+
geographical names are transcribed directly from the Mongolian script
|
16
|
+
into Pinyin. The scheme was published in Toponymic Guidelines for Map
|
17
|
+
and Other Editors: China, 1982.
|
18
|
+
|
19
|
+
The system is used in China and in international cartographic
|
20
|
+
products.
|
21
|
+
|
22
|
+
Mongolian uses a vertical script. Transcription of Mongolian names is
|
23
|
+
made from their proper pronunciation based on the written form of the
|
24
|
+
Mongolian language and Qahar vernacular, with Zhenglan as its
|
25
|
+
representative pronunciation. Due to the complex nature of the script
|
26
|
+
the romanization scheme is not reversible, e.g. the name of the city
|
27
|
+
Hohhot is written ᠬᠥᠬᠡᠬᠣᠲᠠ but may be transliterated as kökeqota.
|
28
|
+
|
29
|
+
notes:
|
30
|
+
- The long and short Mongolian vowels are not distinguished in the
|
31
|
+
spelling for general use, but in recording the pronunciation of
|
32
|
+
place-names, the long vowel is represented by duplication.
|
33
|
+
- Where two Roman equivalents are given, the second (in brackets) is
|
34
|
+
used for recording the pronunciation of place-names while the first
|
35
|
+
form is for general use.
|
36
|
+
- In the table only word-initial character variants are shown.
|
37
|
+
Depending on the position in the word many variants of the characters
|
38
|
+
are used as well as some ligatures. These features are not covered here.
|
39
|
+
- For technical reasons the characters of the Mongolian script are
|
40
|
+
turned 90° anti-clockwise.
|
41
|
+
|
42
|
+
implementation_notes:
|
43
|
+
- A separated final form of vowels a or e is common, and can appear at the end
|
44
|
+
of a word, word stem, or suffix. This form requires a final-shaped preceding
|
45
|
+
consonant and an inter-word gap in between. The vowels themselves appear as ᠠ,
|
46
|
+
and with consonants as ᠬᠠ q‑a, ᠷᠠ r‑a/r‑e, etc. This gap can be transliterated
|
47
|
+
with a hyphen. In digital typesetting, these forms are triggered by inserting
|
48
|
+
a U+180E MONGOLIAN VOWEL SEPARATOR (HTML &#x180E; · MVS) between the consonant
|
49
|
+
and vowel.
|
50
|
+
- All case suffixes, as well as any plural suffixes consisting of one or two
|
51
|
+
syllables are likewise separated by a preceding and hyphen-transliterated gap.
|
52
|
+
In digital typesetting, this gap is represented by a U+202F NARROW NO-BREAK SPACE
|
53
|
+
(HTML &#x202F; · NNBSP). A maximum of two case suffixes can be added to a stem.
|
54
|
+
Single-letter vowel suffixes appear with the final-shaped forms of a/e, i, or u/ü,
|
55
|
+
as in ᠭᠠᠵᠠᠷ ᠠ γaǰar‑a 'to the country' and ᠡᠳᠦᠷ ᠡ edür‑e 'on the day', or ᠤᠯᠤᠰ ᠢ ulus‑i
|
56
|
+
'the state' etc. Multi-letter suffixes most often start with an initial- (consonants),
|
57
|
+
medial- (vowels), or variant-shaped form.
|
58
|
+
|
59
|
+
tests:
|
60
|
+
- source: ᠣᠷᠳᠣᠰ ᠬᠣᠲᠠ # Ордос хот
|
61
|
+
expected: ôrdôs hôta
|
62
|
+
- source: ᠪᠠᠶᠠᠨᠨᠠᠭᠤᠷ ᠬᠣᠲᠠ # Баяннуур хот
|
63
|
+
expected: bayannagûr hôta
|
64
|
+
- source: ᠤᠯᠠᠭᠠᠨᠬᠣᠲᠠ # Улаан хот
|
65
|
+
expected: ûlaganhôta
|
66
|
+
- source: ᠬᠣᠣᠯᠢᠠ ᠭᠣᠤᠯ ᠬᠣᠲᠠ # Хоолингол хот
|
67
|
+
expected: hôôlia gôûl hôta
|
68
|
+
- source: ᠡᠷᠢᠶᠡᠨ ᠬᠣᠲᠠ # Эрээн хот
|
69
|
+
expected: eriyen hôta
|
70
|
+
- source: ᠷᠠᠰᠢᠶᠠᠨ ᠬᠣᠲᠠ # Рашаан хот
|
71
|
+
expected: rasiyan hôta
|
72
|
+
- source: ᠪᠠᠭᠠᠷᠢᠨ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # Баарин баруун хошуу
|
73
|
+
expected: bagarin baragûn hôsigû
|
74
|
+
- source: ᠪᠠᠭᠠᠷᠢᠨ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # Баарин зүүн хошуу
|
75
|
+
expected: bagarin jegun hôsigû
|
76
|
+
- source: ᠲᠦᠩᠯᠢᠶᠣᠤ ᠬᠣᠲᠠ # Байшинт хот
|
77
|
+
expected: tungliyôû hôta
|
78
|
+
- source: ᠰᠢᠯᠢ ᠶᠢᠨ ᠬᠣᠲᠠ # Шилийн хот
|
79
|
+
expected: sili-yin hôta
|
80
|
+
- source: ᠬᠣᠷᠢᠨ ᠭᠡᠷ ᠰᠢᠶᠠᠨ # Horinger County
|
81
|
+
expected: hôrin ger siyan
|
82
|
+
- source: ᠤᠳᠠ ᠲᠣᠭᠣᠷᠢᠭ # Уда тойрог
|
83
|
+
expected: ûda tôgôrig
|
84
|
+
- source: ᠦᠬᠠᠢ ᠬᠣᠲᠠ # Үхай хот
|
85
|
+
expected: uhai hôta
|
86
|
+
- source: ᠬᠠᠶᠢᠨᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Hainan District
|
87
|
+
expected: hayinan tôgôrig
|
88
|
+
- source: ᠬᠠᠶᠢᠷᠤᠪ ᠤᠨ ᠲᠣᠬᠣᠢ ᠲᠣᠭᠣᠷᠢᠭ # Haibowan District
|
89
|
+
expected: hayirûb-ûn tôhôi tôgôrig
|
90
|
+
- source: ᠤᠯᠠᠭᠠᠨᠴᠠᠪ ᠬᠣᠲᠠ # Улаанцав хот
|
91
|
+
expected: ûlaganqab hôta
|
92
|
+
- source: ᠵᠢᠨᠢᠩ ᠲᠣᠭᠣᠷᠢᠭ # Жинин тойрог
|
93
|
+
expected: jining tôgôrig
|
94
|
+
- source: ᠹᠸᠩᠵᠸᠡ ᠬᠣᠲᠠ # Фенжень хот
|
95
|
+
expected: fwngjwe hôta
|
96
|
+
- source: ᠵᠦᠸᠧᠽᠢ ᠰᠢᠶᠠᠨ # Zhuozi County
|
97
|
+
expected: juwezi siyan
|
98
|
+
- source: ᠬᠤᠸᠠᠳᠧ ᠰᠢᠶᠠᠨ # Huade County
|
99
|
+
expected: hûwade siyan
|
100
|
+
- source: ᠱᠠᠩᠳᠤ ᠰᠢᠶᠠᠨ # Шанду шянь
|
101
|
+
expected: xangdû siyan
|
102
|
+
- source: ᠰᠢᠩᠾᠧ ᠰᠢᠶᠠᠨ # Шинхэ шянь
|
103
|
+
expected: singhe siyan
|
104
|
+
- source: ᠯᠢᠶᠠᠩᠴᠠᠩ ᠰᠢᠶᠠᠨ # Liangcheng County
|
105
|
+
expected: liyangqang siyan
|
106
|
+
- source: ᠴᠠᠬᠠᠷ ᠪᠠᠷᠠᠭᠤᠨ ᠭᠠᠷᠤᠨ ᠡᠮᠦᠨᠡᠳᠦ ᠬᠣᠰᠢᠭᠤ # Цахар баруун гарын өмнөд хошуу
|
107
|
+
expected: qahar baragûn garûn emunedu hôsigû
|
108
|
+
- source: ᠴᠠᠬᠠᠷ ᠪᠠᠷᠠᠭᠤᠨ ᠭᠠᠷᠤᠨ ᠳᠤᠮᠳᠠᠳᠤ ᠬᠣᠰᠢᠭᠤ # Цахар баруун гарын дундад хошуу
|
109
|
+
expected: qahar baragûn garûn dûmdadû hôsigû
|
110
|
+
- source: ᠴᠠᠬᠠᠷ ᠪᠠᠷᠠᠭᠤᠨ ᠭᠠᠷᠤᠨ ᠬᠣᠶᠢᠲᠤ ᠬᠣᠰᠢᠭᠤ # Цахар баруун гарын хойд хошуу
|
111
|
+
expected: qahar baragûn garûn hôyitû hôsigû
|
112
|
+
- source: ᠳᠥᠷᠪᠡᠳ ᠬᠣᠰᠢᠭᠤ # Дөрвөд хошуу
|
113
|
+
expected: dorbed hôsigû
|
114
|
+
- source: ᠪᠤᠭᠤᠲᠤ ᠬᠣᠲᠠ # Бугaт хот
|
115
|
+
expected: bûgûtû hôta
|
116
|
+
- source: ᠬᠥᠨᠳᠡᠯᠡᠨ ᠲᠣᠭᠣᠷᠢᠭ # Hondlon District
|
117
|
+
expected: hondelen tôgôrig
|
118
|
+
- source: ᠳᠦᠩᠾᠧ ᠲᠣᠭᠣᠷᠢᠭ # Donghe District
|
119
|
+
expected: dunghe tôgôrig
|
120
|
+
- source: ᠴᠢᠩᠱᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Qingshan District
|
121
|
+
expected: qingxan tôgôrig
|
122
|
+
- source: ᠰᠢᠭᠤᠶᠢᠲᠤ ᠲᠣᠭᠣᠷᠢᠭ # Шигуай тойрог
|
123
|
+
expected: sigûyitû tôgôrig
|
124
|
+
- source: ᠵᠢᠦ ᠶᠤᠸᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Jiuyuan District
|
125
|
+
expected: jiu yûwan tôgôrig
|
126
|
+
- source: ᠭᠦᠶᠠᠩ ᠰᠢᠶᠠᠨ # Guyang County
|
127
|
+
expected: guyang siyan
|
128
|
+
- source: ᠲᠦᠮᠡᠳ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # Түмэд Зүүн хошуу
|
129
|
+
expected: tumed jegun hôsigû
|
130
|
+
- source: ᠲᠦᠮᠡᠳ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # Түмэд Баруун хошуу
|
131
|
+
expected: tumed baragûn hôsigû
|
132
|
+
- source: ᠳᠠᠷᠬᠠᠨ ᠮᠤᠤᠮᠢᠩᠭ᠋ᠠᠨ ᠬᠣᠯᠪᠣᠭᠠᠲᠤ ᠬᠣᠰᠢᠭᠤ # Darhan Muminggan United Banner
|
133
|
+
expected: darhan mûûmingg᠋an hôlbôgatû hôsigû
|
134
|
+
- source: ᠬᠡᠰᠢᠭᠲᠡᠨ ᠬᠣᠰᠢᠭᠤ # Hexigten Banner
|
135
|
+
expected: hesigten hôsigû
|
136
|
+
- source: ᠰᠢᠨᠡ ᠪᠠᠷᠭᠤ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # New Barag Left Banner
|
137
|
+
expected: sin-e bargû jegun hôsigû
|
138
|
+
- source: ᠰᠢᠨᠡ ᠪᠠᠷᠭᠤ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # New Barag Right Banner
|
139
|
+
expected: sin-e bargû baragûn hôsigû
|
140
|
+
- source: ᠣᠲᠣᠭ ᠬᠣᠰᠢᠭᠤ # Otog Banner
|
141
|
+
expected: ôtôg hôsigû
|
142
|
+
- source: ᠳ᠋ᠦᠩᠱᠧᠩ ᠲᠣᠭᠣᠷᠢᠭ # Dongsheng District
|
143
|
+
expected: d᠋ungxeng tôgôrig
|
144
|
+
- source: ᠳᠠᠯᠠᠳ ᠬᠣᠰᠢᠭᠤ # Dalad Banner
|
145
|
+
expected: dalad hôsigû
|
146
|
+
- source: ᠵᠡᠭᠦᠨᠭᠠᠷ ᠬᠣᠰᠢᠭᠤ # Jungar Banner
|
147
|
+
expected: jegungar hôsigû
|
148
|
+
- source: ᠣᠲᠣᠭ ᠤᠨ ᠡᠮᠦᠨᠡᠳᠦ ᠬᠣᠰᠢᠭᠤ # Otog Front Banner
|
149
|
+
expected: ôtôg-ûn emunedu hôsigû
|
150
|
+
- source: ᠬᠠᠩᠭᠢᠨ ᠬᠣᠰᠢᠭᠤ # Hanggin Banner
|
151
|
+
expected: hanggin hôsigû
|
152
|
+
- source: ᠦᠦᠰᠢᠨ ᠬᠣᠰᠢᠭᠤ # Uxin Banner
|
153
|
+
expected: uusin hôsigû
|
154
|
+
- source: ᠡᠵᠢᠨ ᠬᠣᠷᠣᠭᠠ ᠬᠣᠰᠢᠭᠤ # Эзэн Хороо хошуу
|
155
|
+
expected: ejin hôrôg-a hôsigû
|
156
|
+
- source: ᠵᠠᠯᠠᠨ ᠠᠢ᠌ᠯ ᠬᠣᠲᠠ # Жалан-Айл хот
|
157
|
+
expected: jalan ai᠌l hôta
|
158
|
+
- source: ᠶᠠᠭᠰᠢ ᠬᠣᠲᠠ # Ягши хот
|
159
|
+
expected: yagsi hôta
|
160
|
+
- source: ᠮᠠᠨᠵᠤᠤᠷ ᠬᠣᠲᠠ # Манжуур хот
|
161
|
+
expected: manjûûr hôta
|
162
|
+
- source: ᠬᠠᠶᠢᠯᠠᠷ ᠲᠣᠭᠣᠷᠢᠭ # Хайлаар тойрог
|
163
|
+
expected: hayilar tôgôrig
|
164
|
+
- source: ᠬᠣᠷᠴᠢᠨ ᠲᠣᠭᠣᠷᠢᠭ # Horqin District
|
165
|
+
expected: hôrqin tôgôrig
|
166
|
+
- source: ᠺᠠᠶᠢᠯᠦ ᠰᠢᠶᠠᠨ # Kailu County
|
167
|
+
expected: kayilu siyan
|
168
|
+
- source: ᠬᠦᠷᠢᠶᠡ ᠬᠣᠰᠢᠭᠤ # Hure Banner
|
169
|
+
expected: huriy-e hôsigû
|
170
|
+
- source: ᠨᠠᠢᠮᠠᠨ ᠬᠣᠰᠢᠭᠤ # Naiman Banner
|
171
|
+
expected: naiman hôsigû
|
172
|
+
- source: ᠵᠠᠷᠤᠳ ᠬᠣᠰᠢᠭᠤ # Jarud Banner
|
173
|
+
expected: jarûd hôsigû
|
174
|
+
- source: ᠬᠣᠷᠴᠢᠨ ᠪᠠᠷᠠᠭᠤᠨ ᠭᠠᠷᠤᠨ ᠳᠤᠮᠳᠠᠳᠤ ᠬᠣᠰᠢᠭᠤ # Хорчин Баруун Гарын Дундад Хошуу
|
175
|
+
expected: hôrqin baragûn garûn dûmdadû hôsigû
|
176
|
+
- source: ᠬᠣᠷᠴᠢᠨ ᠵᠡᠭᠦᠨ ᠭᠠᠷᠤᠨ ᠳᠤᠮᠳᠠᠳᠤ ᠬᠣᠰᠢᠭᠤ # Horqin Left Middle Banner
|
177
|
+
expected: hôrqin jegun garûn dûmdadû hôsigû
|
178
|
+
- source: ᠬᠣᠷᠴᠢᠨ ᠵᠡᠭᠦᠨ ᠭᠠᠷᠤᠨ ᠬᠣᠶᠢᠲᠤ ᠬᠣᠰᠢᠭᠤ # Horqin Left Rear Banner
|
179
|
+
expected: hôrqin jegun garûn hôyitû hôsigû
|
180
|
+
- source: ᠤᠯᠠᠭᠠᠨᠬᠠᠳᠠ ᠬᠣᠲᠠ # Улаанхад хот
|
181
|
+
expected: ûlaganhada hôta
|
182
|
+
- source: ᠰᠡᠷᠡᠴᠢ # Salaqi
|
183
|
+
expected: sereqi
|
184
|
+
- source: ᠭᠡᠭᠡᠨ ᠭᠣᠤᠯ ᠬᠣᠲᠠ # Гэгээнгол хот
|
185
|
+
expected: gegen gôûl hôta
|
186
|
+
- source: ᠠᠯᠠᠱᠠ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # Alxa Left Banner
|
187
|
+
expected: alaxa jegun hôsigû
|
188
|
+
- source: ᠠᠯᠠᠱᠠ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # Alxa Right Banner
|
189
|
+
expected: alaxa baragûn hôsigû
|
190
|
+
- source: ᠡᠵᠡᠨᠡ ᠬᠣᠰᠢᠭᠤ # Ejin Banner
|
191
|
+
expected: ejen-e hôsigû
|
192
|
+
- source: ᠬᠥᠪᠡᠭᠡᠲᠦ ᠰᠢᠷᠠ ᠬᠣᠰᠢᠭᠤ # Хөвөөт Шар хошуу
|
193
|
+
expected: hobegetu sir-a hôsigû
|
194
|
+
- source: ᠦᠶᠤᠸᠠᠨ ᠰᠢᠶᠠᠨ # Үюань шянь
|
195
|
+
expected: uyûwan siyan
|
196
|
+
- source: ᠦᠴᠤᠸᠠᠨ ᠰᠢᠶᠠᠨ # Wuchuan County
|
197
|
+
expected: uqûwan siyan
|
198
|
+
- source: ᠲᠦᠴᠢᠤᠸᠠᠨ ᠰᠢᠶᠠᠨ # Тучуань шянь
|
199
|
+
expected: tuqiûwan siyan
|
200
|
+
- source: ᠨᠢᠩᠴᠧᠩ ᠰᠢᠶᠠᠨ # Ningcheng County
|
201
|
+
expected: ningqeng siyan
|
202
|
+
- source: ᠯᠢᠨᠰᠢ ᠰᠢᠶᠠᠨ # Linxi County
|
203
|
+
expected: linsi siyan
|
204
|
+
- source: ᠯᠢᠨᠾᠧ ᠲᠣᠭᠣᠷᠢᠭ # Linhe
|
205
|
+
expected: linhe tôgôrig
|
206
|
+
- source: ᠬᠠᠷᠠᠴᠢᠨ ᠬᠣᠰᠢᠭᠤ # Harqin Banner
|
207
|
+
expected: haraqin hôsigû
|
208
|
+
- source: ᠳ᠋ᠧᠩᠺᠧᠦ ᠰᠢᠶᠠᠨ # Dengkou County
|
209
|
+
expected: d᠋engkeu siyan
|
210
|
+
- source: ᠠᠤᠬᠠᠨ ᠬᠣᠰᠢᠭᠤ # Aohan Banner
|
211
|
+
expected: aûhan hôsigû
|
212
|
+
- source: ᠴᠢᠩ ᠱᠦᠢ ᠾᠧ ᠰᠢᠶᠠᠨ # Qingshuihe County
|
213
|
+
expected: qing xui he siyan
|
214
|
+
- source: ᠬᠣᠳᠣᠩ ᠠᠷᠠᠳ ᠤᠨ ᠲᠣᠭᠣᠷᠢᠭ # Huimin District
|
215
|
+
expected: hôdông arad-ûn tôgôrig
|
216
|
+
- source: ᠰᠠᠶᠢᠬᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Saihan District
|
217
|
+
expected: sayihan tôgôrig
|
218
|
+
- source: ᠰᠢᠨᠡ ᠬᠣᠲᠠ ᠲᠣᠭᠣᠷᠢᠭ # Xincheng District
|
219
|
+
expected: sin-e hôta tôgôrig
|
220
|
+
- source: ᠬᠠᠶᠢᠷᠤᠪ ᠤᠨ ᠲᠣᠬᠣᠢ ᠲᠣᠭᠣᠷᠢᠭ # Haibowan (Hairibin Tohoi) District
|
221
|
+
expected: hayirûb-ûn tôhôi tôgôrig
|
222
|
+
- source: ᠰᠦᠩ ᠱᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Songshan District
|
223
|
+
expected: sung xan tôgôrig
|
224
|
+
- source: ᠬᠦᠩ ᠱᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Hongshan District
|
225
|
+
expected: hung xan tôgôrig
|
226
|
+
- source: ᠠᠷᠤᠨ ᠬᠣᠰᠢᠭᠤ # Арун хошуу
|
227
|
+
expected: arûn hôsigû
|
228
|
+
- source: ᠶᠤᠸᠠᠨ ᠪᠣᠣ ᠱᠠᠨ ᠲᠣᠭᠣᠷᠢᠭ # Юаньбаошань тойрог
|
229
|
+
expected: yûwan bôô xan tôgôrig
|
230
|
+
- source: ᠰᠢᠯᠤᠭᠤᠨ ᠬᠥᠪᠡᠭᠡᠲᠦ ᠴᠠᠭᠠᠨ ᠬᠣᠰᠢᠭᠤ # Шулуун Хөвөөт Цагаан хошуу
|
231
|
+
expected: silûgûn hobegetu qagan hôsigû
|
232
|
+
- source: ᠰᠢᠯᠤᠭᠤᠨ ᠬᠥᠬᠡ ᠬᠣᠰᠢᠭᠤ # Шулуун хөх хошуу
|
233
|
+
expected: silûgûn hohe hôsigû
|
234
|
+
- source: ᠤᠷᠠᠳ ᠤᠨ ᠳᠤᠮᠳᠠᠳᠤ ᠬᠣᠰᠢᠭᠤ # Урадын Дундад Хошуу
|
235
|
+
expected: ûrad-ûn dûmdadû hôsigû
|
236
|
+
- source: ᠤᠷᠠᠳ ᠤᠨ ᠡᠮᠦᠨᠡᠳᠦ ᠬᠣᠰᠢᠭᠤ # Урадын Өмнөд Хошуу
|
237
|
+
expected: ûrad-ûn emunedu hôsigû
|
238
|
+
- source: ᠲᠣᠭᠲᠠᠬᠤ ᠰᠢᠶᠠᠨ # Тогтох шянь
|
239
|
+
expected: tôgtahû siyan
|
240
|
+
- source: ᠲᠠᠶᠢᠫᠤᠰᠧ ᠬᠣᠰᠢᠭᠤ # Тайвас хошуу
|
241
|
+
expected: tayipûse hôsigû
|
242
|
+
- source: ᠰᠥᠨᠡᠳ ᠵᠡᠭᠦᠨ ᠬᠣᠰᠢᠭᠤ # Sonid Left Banner
|
243
|
+
expected: soned jegun hôsigû
|
244
|
+
- source: ᠰᠥᠨᠡᠳ ᠪᠠᠷᠠᠭᠤᠨ ᠬᠣᠰᠢᠭᠤ # Sonid Right Banner
|
245
|
+
expected: soned baragûn hôsigû
|
246
|
+
- source: ᠣᠩᠨᠢᠭᠤᠳ ᠬᠣᠰᠢᠭᠤ # Ongniud Banner
|
247
|
+
expected: ôngnigûd hôsigû
|
248
|
+
- source: ᠵᠠᠯᠠᠢᠳ ᠬᠣᠰᠢᠭᠤ # Jalaid Banner
|
249
|
+
expected: jalaid hôsigû
|
250
|
+
- source: ᠬᠠᠩᠭᠢᠨ ᠬᠣᠶᠢᠲᠤ ᠬᠣᠰᠢᠭᠤ # Hanggin Rear Banner
|
251
|
+
expected: hanggin hôyitû hôsigû
|
252
|
+
- source: ᠵᠡᠭᠦᠨ ᠤᠵᠤᠮᠤᠴᠢᠨ ᠬᠣᠰᠢᠭᠤ # East Ujimqin Banner
|
253
|
+
expected: jegun ûjûmûqin hôsigû
|
254
|
+
- source: ᠠᠷᠤ ᠬᠣᠷᠴᠢᠨ ᠬᠣᠰᠢᠭᠤ # Ar Horqin Banner
|
255
|
+
expected: arû hôrqin hôsigû
|
256
|
+
- source: ᠠᠪᠠᠭᠠ ᠬᠣᠰᠢᠭᠤ # Abag Banner
|
257
|
+
expected: abag-a hôsigû
|
258
|
+
- source: ᠪᠤᠷᠢᠶᠠᠳ # Буриад
|
259
|
+
expected: bûriyad
|
260
|
+
- source: ᠤᠯᠠᠭᠠᠨᠪᠠᠭᠠᠲᠤᠷ # Улаанбаатар
|
261
|
+
expected: ûlaganbagatûr
|
262
|
+
|
263
|
+
map:
|
264
|
+
inherit: sasm-mon-Mong-Latn-phonetic-1978
|
@@ -0,0 +1,350 @@
|
|
1
|
+
---
|
2
|
+
authority_id: ungegn
|
3
|
+
id: 1972
|
4
|
+
language: iso-639-2:nep
|
5
|
+
source_script: Deva
|
6
|
+
destination_script: Latn
|
7
|
+
name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Nepali Romanization, 1972
|
8
|
+
url: https://www.eki.ee/wgrs/v3_0/rom1_ne.pdf
|
9
|
+
creation_date: 1972
|
10
|
+
confirmation_date: 2010
|
11
|
+
description: |
|
12
|
+
The United Nations recommended system was approved in 1972 (II/11), based on a report
|
13
|
+
prepared by D. N. Sharma. The note on the system was published in volume II of the
|
14
|
+
conference report.
|
15
|
+
|
16
|
+
There is no evidence of the use of the system either in Nepal or in international cartographic
|
17
|
+
products. The resolution IV/17 (1982) recommended association, inter alia, with Nepal in
|
18
|
+
carrying out further studies on the system. In Nepal a system of romanization is employed by
|
19
|
+
the Nepal Survey Department (NSD). This system has been applied to names appearing on
|
20
|
+
national mapping, and it is also used in the National Geographic Information Infrastructure Programme
|
21
|
+
(NGIIP).
|
22
|
+
|
23
|
+
Nepali (Nepālī) uses the alphasyllabic script Devanāgarī.
|
24
|
+
|
25
|
+
notes:
|
26
|
+
|
27
|
+
- In normal spelling ṙ and ṙh are not marked, instead dotless ड ḍa, ढ ḍha are used to denote these sounds.
|
28
|
+
- |
|
29
|
+
Ligatures may be formed with r as the first component: ~ह rha.
|
30
|
+
|
31
|
+
######################################## Additional Note ############################################################
|
32
|
+
# It is recommended that the vowel अ (a) should always be romanized except when it ends a #
|
33
|
+
# name. In the scheme we are not yet able to detect a name. Analysing the language pattern and the examples, #
|
34
|
+
# we found that actually when a word ends with a consonant it should be transliterated without the vowel in it. #
|
35
|
+
# So we apply this rule: if a word ends with a consonant, the inherent ending 'a' is removed. #
|
36
|
+
#####################################################################################################################
|
37
|
+
|
38
|
+
|
39
|
+
tests:
|
40
|
+
- source: "नेपाल"
|
41
|
+
expected: "nepāl"
|
42
|
+
- source: "नेपाल काठ्माडौं"
|
43
|
+
expected: "nepāl kāṭhmāḍauṁ"
|
44
|
+
- source: "लेखन"
|
45
|
+
expected: "lekhan"
|
46
|
+
- source: "मुद्रा"
|
47
|
+
expected: "mudrā"
|
48
|
+
- source: "प्रशंसा"
|
49
|
+
expected: "prashaṁsā"
|
50
|
+
- source: "अंक"
|
51
|
+
expected: "aṁk"
|
52
|
+
- source: "नेकपाले स्थगित स्थायी कमिटीको बैठक भदौ गते बोलाउने भएको"
|
53
|
+
expected: "nekapāle sthagit sthāyī kamiṭīko baiṭhak bhadau gate bolāune bhaeko"
|
54
|
+
- source: "न घर रह्यो, न परिवार"
|
55
|
+
expected: "n ghar rahyo, n parivār"
|
56
|
+
- source: "ढोरपाटनमा भुजीखोला बाढीपहिरोले अभिभावक गुमाएका बालबालिकाको बिचल्ली"
|
57
|
+
expected: "ḍhorapāṭanamā bhujīkholā bāḍhīpahirole abhibhāvak gumāekā bālabālikāko bichallī"
|
58
|
+
- source: "सुस्मिताका काका हेमबहादुर र काकीलाई पनि पहिरोले बगायो"
|
59
|
+
expected: "susmitākā kākā hemabahādur r kākīlāī pani pahirole bagāyo"
|
60
|
+
- source: "संविधान जारी भएसँगै सार्वजनिक प्रशासनमा नयाँ उत्साह आउने अपेक्षा थियो"
|
61
|
+
expected: "saṁvidhān jārī bhaesam̐gai sārvajanik prashāsanamā nayām̐ utsāh āune apekṣhā thiyo"
|
62
|
+
- source: "देशमा कोरोना संक्रमित र मृतकको संख्या हरेक दिन बढ्दो छ"
|
63
|
+
expected: "deshamā koronā saṁkramit r mṛtakako saṁkhyā harek din baḍhdo chh"
|
64
|
+
- source: "गाउँपालिकाका अध्यक्ष टिका गुरुङका अनुसार विष्णुदासलाई राजुले सुत्नका लागि बेलुका साथी लगेका थिए"
|
65
|
+
expected: "gāum̐pālikākā adhyakṣh ṭikā guruṅakā anusār viṣhṇudāsalāī rājule sutnakā lāgi belukā sāthī lagekā thie"
|
66
|
+
- source: "यो आयोजना गाउँपालिकाको केन्द्र तेल्लोकमा पर्छ"
|
67
|
+
expected: "yo āyojanā gāum̐pālikāko kendr tellokamā parchh"
|
68
|
+
- source: "सुस्मिताका काका हेमबहादुर र काकीलाई पनि पहिरोले बगायो"
|
69
|
+
expected: "susmitākā kākā hemabahādur r kākīlāī pani pahirole bagāyo"
|
70
|
+
- source: "चैत पहिलो साता घर आएका उनी लकडाउन भएपछि यतै रोकिए"
|
71
|
+
expected: "chait pahilo sātā ghar āekā unī lakaḍāun bhaepachhi yatai rokie"
|
72
|
+
- source: "काम गर्न जानेको हकमा रोजगारदाता कम्पनीको पत्रसँगै वडा र जिल्ला प्रशासनको सिफारिस अनिवार्य गरिएको छ"
|
73
|
+
expected: "kām garn jāneko hakamā rojagāradātā kampanīko patrasam̐gai vaḍā r jillā prashāsanako siphāris anivāry garieko chh"
|
74
|
+
- source: "ऋण"
|
75
|
+
expected: "ṛṇ"
|
76
|
+
- source: "अर्पित"
|
77
|
+
expected: "arpit"
|
78
|
+
- source: "अरार्यते"
|
79
|
+
expected: "arāryate"
|
80
|
+
- source: "श्रीमान्"
|
81
|
+
expected: "shrīmān"
|
82
|
+
- source: "खाँचो बिरुवा बैंकको"
|
83
|
+
expected: "khām̐cho biruvā baiṁkako"
|
84
|
+
|
85
|
+
|
86
|
+
map:
|
87
|
+
|
88
|
+
rules:
|
89
|
+
- pattern: ([क]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
90
|
+
result: 'k'
|
91
|
+
- pattern: ([ख]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
92
|
+
result: 'kh'
|
93
|
+
- pattern: ([ग]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
94
|
+
result: 'g'
|
95
|
+
- pattern: ([घ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
96
|
+
result: 'gh'
|
97
|
+
- pattern: ([ङ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
98
|
+
result: 'ṅ'
|
99
|
+
- pattern: ([च]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
100
|
+
result: 'ch'
|
101
|
+
- pattern: ([छ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
102
|
+
result: 'chh'
|
103
|
+
- pattern: ([ज]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
104
|
+
result: 'j'
|
105
|
+
- pattern: ([झ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
106
|
+
result: 'jh'
|
107
|
+
- pattern: ([ञ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
108
|
+
result: 'ñ'
|
109
|
+
- pattern: ([ट]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
110
|
+
result: 'ṭ'
|
111
|
+
- pattern: ([ठ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
112
|
+
result: 'ṭh'
|
113
|
+
- pattern: ([ड]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
114
|
+
result: 'ḍ'
|
115
|
+
- pattern: ([ढ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
116
|
+
result: 'ḍh'
|
117
|
+
- pattern: ([ण]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
118
|
+
result: 'ṇ'
|
119
|
+
- pattern: ([त]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
120
|
+
result: 't'
|
121
|
+
- pattern: ([थ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
122
|
+
result: 'th'
|
123
|
+
- pattern: ([द]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
124
|
+
result: 'd'
|
125
|
+
- pattern: ([ध]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
126
|
+
result: 'dh'
|
127
|
+
- pattern: ([न]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
128
|
+
result: 'n'
|
129
|
+
- pattern: ([प]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
130
|
+
result: 'p'
|
131
|
+
- pattern: ([फ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
132
|
+
result: 'ph'
|
133
|
+
- pattern: ([ब]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
134
|
+
result: 'b'
|
135
|
+
- pattern: ([भ]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
136
|
+
result: 'bh'
|
137
|
+
- pattern: ([म]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
138
|
+
result: 'm'
|
139
|
+
- pattern: ([य]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
140
|
+
result: 'y'
|
141
|
+
- pattern: ([र]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
142
|
+
result: 'r'
|
143
|
+
- pattern: ([ल]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
144
|
+
result: 'l'
|
145
|
+
- pattern: ([व]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
146
|
+
result: 'v'
|
147
|
+
- pattern: ([श]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
148
|
+
result: 'sh'
|
149
|
+
- pattern: ([ष]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
150
|
+
result: 'ṣh'
|
151
|
+
- pattern: ([स]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
152
|
+
result: 's'
|
153
|
+
- pattern: ([क़]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
154
|
+
result: 'q'
|
155
|
+
- pattern: ([ख़]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
156
|
+
result: 'ḳh'
|
157
|
+
- pattern: ([ग़]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
158
|
+
result: 'g'
|
159
|
+
- pattern: ([ज़]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
160
|
+
result: 'z'
|
161
|
+
- pattern: ([ड़]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
162
|
+
result: 'ṙ'
|
163
|
+
- pattern: ([ढ़]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
164
|
+
result: 'ṙh'
|
165
|
+
- pattern: ([फ़]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
166
|
+
result: 'f'
|
167
|
+
- pattern: ([ह]=?)(?=[\u093E\u093F\u0940\u0941\u0942\u0943\u0944\u0945\u0947\u0948\u0949\u094B\u094C\u0020\u094d])
|
168
|
+
result: 'h'
|
169
|
+
|
170
|
+
|
171
|
+
- pattern: ([क])(?=\b)
|
172
|
+
result: 'k'
|
173
|
+
- pattern: ([ख])(?=\b)
|
174
|
+
result: 'kh'
|
175
|
+
- pattern: ([ग])(?=\b)
|
176
|
+
result: 'g'
|
177
|
+
- pattern: ([घ])(?=\b)
|
178
|
+
result: 'gh'
|
179
|
+
- pattern: ([ङ])(?=\b)
|
180
|
+
result: 'ṅ'
|
181
|
+
- pattern: ([च])(?=\b)
|
182
|
+
result: 'ch'
|
183
|
+
- pattern: ([छ])(?=\b)
|
184
|
+
result: 'chh'
|
185
|
+
- pattern: ([ज])(?=\b)
|
186
|
+
result: 'j'
|
187
|
+
- pattern: ([झ])(?=\b)
|
188
|
+
result: 'jh'
|
189
|
+
- pattern: ([ञ])(?=\b)
|
190
|
+
result: 'ñ'
|
191
|
+
- pattern: ([ट])(?=\b)
|
192
|
+
result: 'ṭ'
|
193
|
+
- pattern: ([ठ])(?=\b)
|
194
|
+
result: 'ṭh'
|
195
|
+
- pattern: ([ड])(?=\b)
|
196
|
+
result: 'ḍ'
|
197
|
+
- pattern: ([ढ])(?=\b)
|
198
|
+
result: 'ḍh'
|
199
|
+
- pattern: ([ण])(?=\b)
|
200
|
+
result: 'ṇ'
|
201
|
+
- pattern: ([त])(?=\b)
|
202
|
+
result: 't'
|
203
|
+
- pattern: ([थ])(?=\b)
|
204
|
+
result: 'th'
|
205
|
+
- pattern: ([द])(?=\b)
|
206
|
+
result: 'd'
|
207
|
+
- pattern: ([ध])(?=\b)
|
208
|
+
result: 'dh'
|
209
|
+
- pattern: ([न])(?=\b)
|
210
|
+
result: 'n'
|
211
|
+
- pattern: ([प])(?=\b)
|
212
|
+
result: 'p'
|
213
|
+
- pattern: ([फ])(?=\b)
|
214
|
+
result: 'ph'
|
215
|
+
- pattern: ([ब])(?=\b)
|
216
|
+
result: 'b'
|
217
|
+
- pattern: ([भ])(?=\b)
|
218
|
+
result: 'bh'
|
219
|
+
- pattern: ([म])(?=\b)
|
220
|
+
result: 'm'
|
221
|
+
- pattern: ([य])(?=\b)
|
222
|
+
result: 'y'
|
223
|
+
- pattern: ([र])(?=\b)
|
224
|
+
result: 'r'
|
225
|
+
- pattern: ([ल])(?=\b)
|
226
|
+
result: 'l'
|
227
|
+
- pattern: ([व])(?=\b)
|
228
|
+
result: 'v'
|
229
|
+
- pattern: ([श])(?=\b)
|
230
|
+
result: 'sh'
|
231
|
+
- pattern: ([ष])(?=\b)
|
232
|
+
result: 'ṣh'
|
233
|
+
- pattern: ([स])(?=\b)
|
234
|
+
result: 's'
|
235
|
+
- pattern: ([क़])(?=\b)
|
236
|
+
result: 'q'
|
237
|
+
- pattern: ([ख़])(?=\b)
|
238
|
+
result: 'ḳh'
|
239
|
+
- pattern: ([ग़])(?=\b)
|
240
|
+
result: 'g'
|
241
|
+
- pattern: ([ज़])(?=\b)
|
242
|
+
result: 'z'
|
243
|
+
- pattern: ([ड़])(?=\b)
|
244
|
+
result: 'ṙ'
|
245
|
+
- pattern: ([ढ़])(?=\b)
|
246
|
+
result: 'ṙh'
|
247
|
+
- pattern: ([फ़])(?=\b)
|
248
|
+
result: 'f'
|
249
|
+
- pattern: ([ह])(?=\b)
|
250
|
+
result: 'h'
|
251
|
+
|
252
|
+
characters:
|
253
|
+
|
254
|
+
# Vowels and Diphthongs
|
255
|
+
'अ': 'a'
|
256
|
+
'आ': 'ā'
|
257
|
+
'इ': 'i'
|
258
|
+
'ई': 'ī'
|
259
|
+
'उ': 'u'
|
260
|
+
'ऊ': 'ū'
|
261
|
+
'ऋ': 'ṛ'
|
262
|
+
'ॠ': 'ṝ'
|
263
|
+
'ऌ': 'l̤'
|
264
|
+
'ए': 'e'
|
265
|
+
'ऐ': 'ai'
|
266
|
+
'ओ': 'o'
|
267
|
+
'औ': 'au'
|
268
|
+
|
269
|
+
# Medials # Needed for connecting consonants
|
270
|
+
|
271
|
+
'ा': "ā"
|
272
|
+
'ि': "i"
|
273
|
+
'ी': "ī"
|
274
|
+
'ु': "u"
|
275
|
+
'ू': "ū"
|
276
|
+
'ृ': "ṛ"
|
277
|
+
'े': "e"
|
278
|
+
'ै': "ai"
|
279
|
+
'ो': "o"
|
280
|
+
'ौ': "au"
|
281
|
+
|
282
|
+
# Consonants (see Note 1)
|
283
|
+
|
284
|
+
# Gutturals
|
285
|
+
'क': 'ka'
|
286
|
+
'ख': 'kha'
|
287
|
+
'ग': 'ga'
|
288
|
+
'घ': 'gha'
|
289
|
+
'ङ': 'ṅa'
|
290
|
+
|
291
|
+
# Palatals
|
292
|
+
'च': 'cha'
|
293
|
+
'छ': 'chha'
|
294
|
+
'ज': 'ja'
|
295
|
+
'झ': 'jha'
|
296
|
+
'ञ': 'ña'
|
297
|
+
|
298
|
+
# Cerebrals
|
299
|
+
'ट': 'ṭa'
|
300
|
+
'ठ': 'ṭha'
|
301
|
+
'ड': 'ḍa'
|
302
|
+
'ढ': 'ḍha'
|
303
|
+
'ण': 'ṇa'
|
304
|
+
|
305
|
+
# Dentals
|
306
|
+
'त': 'ta'
|
307
|
+
'थ': 'tha'
|
308
|
+
'द': 'da'
|
309
|
+
'ध': 'dha'
|
310
|
+
'न': 'na'
|
311
|
+
|
312
|
+
# Labials
|
313
|
+
'प': 'pa'
|
314
|
+
'फ': 'pha'
|
315
|
+
'ब': 'ba'
|
316
|
+
'भ': 'bha'
|
317
|
+
'म': 'ma'
|
318
|
+
|
319
|
+
# Semivowels
|
320
|
+
'य': 'ya'
|
321
|
+
'र': 'ra'
|
322
|
+
'ल': 'la'
|
323
|
+
'व': 'va' # or wa [Note#3]
|
324
|
+
|
325
|
+
# Sibilants
|
326
|
+
'श': 'sha'
|
327
|
+
'ष': 'ṣha'
|
328
|
+
'स': 'sa'
|
329
|
+
|
330
|
+
# Dotted variants
|
331
|
+
'क़': qa
|
332
|
+
'ख़': ḳha
|
333
|
+
'ग़': ga
|
334
|
+
'ज़': za
|
335
|
+
'ड़': ṙa
|
336
|
+
'ढ़': ṙha
|
337
|
+
'फ़': fa
|
338
|
+
|
339
|
+
|
340
|
+
# Aspirate
|
341
|
+
'ह': 'ha'
|
342
|
+
|
343
|
+
# Anusvāra
|
344
|
+
'ं': 'ṁ'
|
345
|
+
|
346
|
+
# Anunāsika
|
347
|
+
'ँ': 'm̐'
|
348
|
+
|
349
|
+
# halanta
|
350
|
+
'्': ''
|