interscript 0.1.6 → 2.1.0a9
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/.gitignore +11 -0
- data/.rspec +3 -0
- data/Gemfile +29 -0
- data/LICENSE.adoc +31 -0
- data/README.md +3 -0
- data/Rakefile +53 -0
- data/bin/console +14 -0
- data/bin/interscript +3 -39
- data/bin/maps_analyze_staging +168 -0
- data/bin/maps_debug_compilers +58 -0
- data/bin/maps_debug_ordering +88 -0
- data/bin/maps_debug_ruby_compile +24 -0
- data/bin/maps_debug_step_by_step +44 -0
- data/bin/maps_optimize_order +112 -0
- data/bin/maps_v1_analyze_regexps +45 -0
- data/bin/maps_v1_to_v2 +426 -0
- data/exe/interscript +6 -0
- data/interscript.gemspec +31 -0
- data/lib/interscript.rb +81 -127
- data/lib/interscript/command.rb +5 -5
- data/lib/interscript/compiler.rb +22 -0
- data/lib/interscript/compiler/javascript.rb +292 -0
- data/lib/interscript/compiler/ruby.rb +262 -0
- data/lib/interscript/dsl.rb +67 -0
- data/lib/interscript/dsl/aliases.rb +23 -0
- data/lib/interscript/dsl/document.rb +46 -0
- data/lib/interscript/dsl/group.rb +45 -0
- data/lib/interscript/dsl/group/parallel.rb +6 -0
- data/lib/interscript/dsl/items.rb +89 -0
- data/lib/interscript/dsl/metadata.rb +26 -0
- data/lib/interscript/dsl/stage.rb +6 -0
- data/lib/interscript/dsl/symbol_mm.rb +11 -0
- data/lib/interscript/dsl/tests.rb +12 -0
- data/lib/interscript/interpreter.rb +251 -0
- data/lib/interscript/node.rb +25 -0
- data/lib/interscript/node/alias_def.rb +15 -0
- data/lib/interscript/node/dependency.rb +13 -0
- data/lib/interscript/node/document.rb +45 -0
- data/lib/interscript/node/group.rb +34 -0
- data/lib/interscript/node/group/parallel.rb +9 -0
- data/lib/interscript/node/group/sequential.rb +2 -0
- data/lib/interscript/node/item.rb +52 -0
- data/lib/interscript/node/item/alias.rb +42 -0
- data/lib/interscript/node/item/any.rb +61 -0
- data/lib/interscript/node/item/capture.rb +50 -0
- data/lib/interscript/node/item/group.rb +51 -0
- data/lib/interscript/node/item/repeat.rb +40 -0
- data/lib/interscript/node/item/stage.rb +23 -0
- data/lib/interscript/node/item/string.rb +51 -0
- data/lib/interscript/node/metadata.rb +18 -0
- data/lib/interscript/node/rule.rb +6 -0
- data/lib/interscript/node/rule/funcall.rb +18 -0
- data/lib/interscript/node/rule/run.rb +15 -0
- data/lib/interscript/node/rule/sub.rb +65 -0
- data/lib/interscript/node/stage.rb +19 -0
- data/lib/interscript/node/tests.rb +15 -0
- data/lib/interscript/stdlib.rb +211 -0
- data/lib/interscript/utils/regexp_converter.rb +283 -0
- data/lib/interscript/version.rb +1 -1
- data/requirements.txt +1 -0
- metadata +75 -339
- data/README.adoc +0 -298
- data/bin/rspec +0 -29
- data/lib/__pycache__/g2pwrapper.cpython-38.pyc +0 -0
- data/lib/g2pwrapper.py +0 -34
- data/lib/interscript-opal.rb +0 -2
- data/lib/interscript/fs.rb +0 -71
- data/lib/interscript/mapping.rb +0 -142
- data/lib/interscript/opal.rb +0 -27
- data/lib/interscript/opal/maps.js.erb +0 -10
- data/lib/interscript/opal_map_translate.rb +0 -12
- data/lib/model-7 +0 -0
- data/lib/tha-pt-b-7 +0 -0
- data/maps/acadsin-zho-Hani-Latn-2002.yaml +0 -38912
- data/maps/alalc-amh-Ethi-Latn-1997.yaml +0 -509
- data/maps/alalc-amh-Ethi-Latn-2011.yaml +0 -138
- data/maps/alalc-ara-Arab-Latn-1997.yaml +0 -1283
- data/maps/alalc-asm-Deva-Latn-1997.yaml +0 -159
- data/maps/alalc-aze-Cyrl-Latn-1997.yaml +0 -141
- data/maps/alalc-bel-Cyrl-Latn-1997.yaml +0 -125
- data/maps/alalc-ben-Beng-Latn-2017.yaml +0 -130
- data/maps/alalc-bul-Cyrl-Latn-1997.yaml +0 -94
- data/maps/alalc-ell-Grek-Latn-1997.yaml +0 -624
- data/maps/alalc-ell-Grek-Latn-2010.yaml +0 -627
- data/maps/alalc-hin-Deva-Latn-2020.yaml +0 -159
- data/maps/alalc-kat-Geok-Latn-1997.yaml +0 -111
- data/maps/alalc-kat-Geor-Latn-1997.yaml +0 -146
- data/maps/alalc-kor-Hang-Latn-1997.yaml +0 -94
- data/maps/alalc-mar-Deva-Latn-1997.yaml +0 -170
- data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +0 -114
- data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +0 -103
- data/maps/alalc-pan-Deva-Latn-1997.yaml +0 -237
- data/maps/alalc-rus-Cyrl-Latn-1997.yaml +0 -221
- data/maps/alalc-rus-Cyrl-Latn-2012.yaml +0 -162
- data/maps/alalc-srp-Cyrl-Latn-1997.yaml +0 -114
- data/maps/alalc-srp-Cyrl-Latn-2013.yaml +0 -135
- data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +0 -141
- data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +0 -16
- data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +0 -283
- data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +0 -174
- data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +0 -169
- data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +0 -292
- data/maps/bgn-kor-Hang-Latn-1943.yaml +0 -31
- data/maps/bgn-kor-Kore-Latn-1943.yaml +0 -31
- data/maps/bgna-bul-Cyrl-Latn-2006.yaml +0 -208
- data/maps/bgna-bul-Cyrl-Latn-2009.yaml +0 -208
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +0 -528
- data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +0 -592
- data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +0 -108
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +0 -104
- data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +0 -184
- data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +0 -285
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +0 -115
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +0 -38
- data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +0 -701
- data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +0 -19
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +0 -257
- data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +0 -127
- data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +0 -42
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +0 -253
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +0 -48
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +0 -48
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +0 -159
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +0 -190
- data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +0 -200
- data/maps/bgnpcgn-per-Arab-Latn-1956.yaml +0 -92
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +0 -314
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +0 -166
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +0 -162
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +0 -208
- data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +0 -7456
- data/maps/bis-asm-Beng-Latn-13194-1991.yaml +0 -159
- data/maps/bis-ben-Beng-Latn-13194-1991.yaml +0 -156
- data/maps/bis-dev-Deva-Latn-13194-1991.yaml +0 -184
- data/maps/bis-gjr-Gujr-Latn-13194-1991.yaml +0 -166
- data/maps/bis-knd-Knda-Latn-13194-1991.yaml +0 -173
- data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +0 -176
- data/maps/bis-ori-Orya-Latn-13194-1991.yaml +0 -160
- data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +0 -175
- data/maps/bis-tel-Telu-Latn-13194-1991.yaml +0 -170
- data/maps/bis-tml-Taml-Latn-13194-1991.yaml +0 -155
- data/maps/by-bel-Cyrl-Latn-1998.yaml +0 -168
- data/maps/by-bel-Cyrl-Latn-2007.yaml +0 -115
- data/maps/dos-nep-Deva-Latn-1997.yaml +0 -33
- data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +0 -684
- data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +0 -680
- data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +0 -19
- data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +0 -31
- data/maps/ggg-kat-Geor-Latn-2002.yaml +0 -88
- data/maps/gki-bel-Cyrl-Latn-1992.yaml +0 -33
- data/maps/gki-bel-Cyrl-Latn-2000.yaml +0 -201
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +0 -186
- data/maps/hk-yue-Hani-Latn-1888.yaml +0 -38497
- data/maps/icao-bel-Cyrl-Latn-9303.yaml +0 -136
- data/maps/icao-bul-Cyrl-Latn-9303.yaml +0 -118
- data/maps/icao-heb-Hebr-Latn-9303.yaml +0 -151
- data/maps/icao-mkd-Cyrl-Latn-9303.yaml +0 -117
- data/maps/icao-per-Arab-Latn-9303.yaml +0 -103
- data/maps/icao-rus-Cyrl-Latn-9303.yaml +0 -117
- data/maps/icao-srp-Cyrl-Latn-9303.yaml +0 -117
- data/maps/icao-ukr-Cyrl-Latn-9303.yaml +0 -119
- data/maps/iso-ara-Arab-Latn-233-1984.yaml +0 -323
- data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +0 -609
- data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +0 -40
- data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +0 -62
- data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +0 -271
- data/maps/iso-tha-Thai-Latn-11940-1998.yaml +0 -109
- data/maps/kp-kor-Hang-Latn-2002.yaml +0 -901
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +0 -44820
- data/maps/mext-jpn-Hrkt-Latn-1954.yaml +0 -411
- data/maps/moct-kor-Hang-Latn-2000.yaml +0 -803
- data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +0 -541
- data/maps/mvd-bel-Cyrl-Latn-2008.yaml +0 -225
- data/maps/mvd-bel-Cyrl-Latn-2010.yaml +0 -63
- data/maps/mvd-rus-Cyrl-Latn-2008.yaml +0 -109
- data/maps/mvd-rus-Cyrl-Latn-2010.yaml +0 -37
- data/maps/nil-kor-Hang-Hang-jamo.yaml +0 -11193
- data/maps/odni-aze-Cyrl-Latn-2015.yaml +0 -144
- data/maps/odni-bel-Cyrl-Latn-2015.yaml +0 -148
- data/maps/odni-bul-Cyrl-Latn-2015.yaml +0 -96
- data/maps/odni-hin-Deva-Latn-2015.yaml +0 -258
- data/maps/odni-kat-Geor-Latn-2015.yaml +0 -87
- data/maps/odni-kaz-Cyrl-Latn-2015.yaml +0 -148
- data/maps/odni-kir-Cyrl-Latn-2015.yaml +0 -136
- data/maps/odni-mkd-Cyrl-Latn-2015.yaml +0 -122
- data/maps/odni-rus-Cyrl-Latn-2015.yaml +0 -77
- data/maps/odni-srp-Cyrl-Latn-2015.yaml +0 -129
- data/maps/odni-tat-Cyrl-Latn-2015.yaml +0 -142
- data/maps/odni-tgk-Cyrl-Latn-2015.yaml +0 -148
- data/maps/odni-uig-Cyrl-Latn-2015.yaml +0 -138
- data/maps/odni-ukr-Cyrl-Latn-2015.yaml +0 -157
- data/maps/odni-urd-Arab-Latn-2015.yaml +0 -221
- data/maps/odni-uzb-Cyrl-Latn-2015.yaml +0 -166
- data/maps/royin-tha-Thai-Latn-1939-generic.yaml +0 -90
- data/maps/royin-tha-Thai-Latn-1968.yaml +0 -179
- data/maps/royin-tha-Thai-Latn-1999-chained.yaml +0 -180
- data/maps/royin-tha-Thai-Latn-1999.yaml +0 -76
- data/maps/sac-zho-Hans-Latn-1979.yaml +0 -24759
- data/maps/ses-ara-Arab-Latn-1930.yaml +0 -279
- data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +0 -222
- data/maps/ua-ukr-Cyrl-Latn-1996.yaml +0 -193
- data/maps/un-ara-Arab-Latn-1971.yaml +0 -139
- data/maps/un-ara-Arab-Latn-1972.yaml +0 -159
- data/maps/un-ara-Arab-Latn-2017.yaml +0 -420
- data/maps/un-bel-Cyrl-Latn-2007.yaml +0 -114
- data/maps/un-ben-Beng-Latn-2016.yaml +0 -534
- data/maps/un-ell-Grek-Latn-1987-tl.yaml +0 -31
- data/maps/un-ell-Grek-Latn-1987-ts.yaml +0 -19
- data/maps/un-ell-Grek-Latn-phonetic-1987.yaml +0 -780
- data/maps/un-mon-Mong-Latn-2013.yaml +0 -99
- data/maps/un-nep-Deva-Latn-1972.yaml +0 -163
- data/maps/un-rus-Cyrl-Latn-1987.yaml +0 -166
- data/maps/un-ukr-Cyrl-Latn-1998.yaml +0 -30
- data/maps/ungegn-amh-Ethi-Latn-2016.yaml +0 -575
- data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +0 -406
- data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +0 -386
- data/maps/var-kor-Hang-Latn-mr-1939.yaml +0 -1054
- data/maps/var-kor-Kore-Hang-2013.yaml +0 -59754
- data/maps/var-kor-Kore-Latn-mr-1939.yaml +0 -36
- data/maps/var-tha-Thai-Thai-phonemic.yaml +0 -59
- data/maps/var-tha-Thai-Zsym-ipa.yaml +0 -301
- data/maps/var-zho-Hani-Latn-1979.yaml +0 -38908
- data/spec/interscript/mapping_spec.rb +0 -42
- data/spec/interscript_spec.rb +0 -26
- data/spec/spec_helper.rb +0 -3
|
@@ -1,99 +0,0 @@
|
|
|
1
|
-
---
|
|
2
|
-
authority_id: un
|
|
3
|
-
id: 2013
|
|
4
|
-
language: mon
|
|
5
|
-
source_script: Mong
|
|
6
|
-
destination_script: Latn
|
|
7
|
-
name: Mongolian Romanization in China, Version 4.0
|
|
8
|
-
url: http://www.eki.ee/wgrs/rom1_mnc.htm
|
|
9
|
-
creation_date: 2013-09
|
|
10
|
-
description: |
|
|
11
|
-
The United Nations resolution III/8 in 1977 recognized the Scheme for
|
|
12
|
-
a Chinese Phonetic Alphabet (Pinyin) as China’s official Roman alphabet
|
|
13
|
-
scheme and recommended the alphabet as the international system for the
|
|
14
|
-
romanization of Chinese geographical names. In China Mongolian
|
|
15
|
-
geographical names are transcribed directly from the Mongolian script
|
|
16
|
-
into Pinyin. The scheme was published in Toponymic Guidelines for Map
|
|
17
|
-
and Other Editors: China, 1982.
|
|
18
|
-
|
|
19
|
-
The system is used in China and in international cartographic
|
|
20
|
-
products.
|
|
21
|
-
|
|
22
|
-
Mongolian uses a vertical script. Transcription of Mongolian names is
|
|
23
|
-
made from their proper pronunciation based on the written form of the
|
|
24
|
-
Mongolian language and Qahar vernacular, with Zhenglan as its
|
|
25
|
-
representative pronunciation. Due to the complex nature of the script
|
|
26
|
-
the romanization scheme is not reversible, e.g. the name of the city
|
|
27
|
-
Hohhot is written ᠬᠥᠬᠡᠬᠣᠲᠠ but may be transliterated as kökeqota.
|
|
28
|
-
|
|
29
|
-
notes:
|
|
30
|
-
- The long and short Mongolian vowels are not distinguished in the
|
|
31
|
-
spelling for general use, but in recording the pronunciation of
|
|
32
|
-
place-names, the long vowel is represented by duplication.
|
|
33
|
-
- Where two Roman equivalents are given, the second (in brackets) is
|
|
34
|
-
used for recording the pronunciation of place-names while the first
|
|
35
|
-
form is for general use.
|
|
36
|
-
- In the table only word-initial character variants are shown.
|
|
37
|
-
Depending on the position in the word many variants of the characters
|
|
38
|
-
are used as well as some ligatures. These features are not covered here.
|
|
39
|
-
- For technical reasons the characters of the Mongolian script are
|
|
40
|
-
turned 90˚ anti-clockwise.
|
|
41
|
-
|
|
42
|
-
tests:
|
|
43
|
-
- source: "ᠬᠥᠬᠡᠬᠣᠲᠠ"
|
|
44
|
-
expected: "kökeqota"
|
|
45
|
-
map:
|
|
46
|
-
rules:
|
|
47
|
-
- pattern: \u182c(\u1821|\u1825|\u1826)
|
|
48
|
-
result: "k\\1"
|
|
49
|
-
- pattern: \u182d(\u1821|\u1825|\u1826)
|
|
50
|
-
result: "g\\1"
|
|
51
|
-
|
|
52
|
-
characters:
|
|
53
|
-
"ᠠ": "a"
|
|
54
|
-
"ᠪ": "b"
|
|
55
|
-
"ᠼ": "c"
|
|
56
|
-
"ᠲ": "d"
|
|
57
|
-
"ᠳ": "d"
|
|
58
|
-
"ᠡ": "e"
|
|
59
|
-
"ᠹ": "f"
|
|
60
|
-
"ᠭ": "ġ"
|
|
61
|
-
"ᠺ": "g"
|
|
62
|
-
"ᠬ": "q"
|
|
63
|
-
"ᠾ": "h"
|
|
64
|
-
"ᠢ": "i"
|
|
65
|
-
"ᠵ": "j"
|
|
66
|
-
"ᠺ": "k"
|
|
67
|
-
"ᠯ": "l"
|
|
68
|
-
"ᠮ": "m"
|
|
69
|
-
"ᠨ": "n"
|
|
70
|
-
"ᠥ": "ö"
|
|
71
|
-
"ᠫ": "p"
|
|
72
|
-
"ᠴ": "q"
|
|
73
|
-
"ᠷ": "r"
|
|
74
|
-
"ᠰ": "s"
|
|
75
|
-
"ᠲ": "t"
|
|
76
|
-
"ᠦ": "u"
|
|
77
|
-
"ᠸ": "w"
|
|
78
|
-
"ᠱ": "x"
|
|
79
|
-
"ᠶ": "y"
|
|
80
|
-
"ᠽ": "z"
|
|
81
|
-
"ᠣ": "o"
|
|
82
|
-
# - "o" # General use
|
|
83
|
-
# - "ô" # For place names
|
|
84
|
-
"ᠤ": "u"
|
|
85
|
-
# - "u" # General use
|
|
86
|
-
# - "û" # For place names
|
|
87
|
-
|
|
88
|
-
|
|
89
|
-
# @TODO Exceptional
|
|
90
|
-
#
|
|
91
|
-
# This is failing the whole test suite, but as far as I understood
|
|
92
|
-
# from the comment, this city name is exceptional, so we are temporarily
|
|
93
|
-
# adding it as an exceptional rule for now.
|
|
94
|
-
#
|
|
95
|
-
# But we will need a native speaker's attention to help us out here, and maybe
|
|
96
|
-
# come up with some basic rules for this exceptional pattern.
|
|
97
|
-
#
|
|
98
|
-
|
|
99
|
-
"ᠬᠥᠬᠡᠬᠣᠲᠠ": "kökeqota"
|
|
@@ -1,163 +0,0 @@
|
|
|
1
|
-
---
|
|
2
|
-
authority_id: ungegn
|
|
3
|
-
id: 1972
|
|
4
|
-
language: nep
|
|
5
|
-
source_script: Deva
|
|
6
|
-
destination_script: Latn
|
|
7
|
-
name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Nepali Romanization, 1972
|
|
8
|
-
url: https://www.eki.ee/wgrs/v3_0/rom1_ne.pdf
|
|
9
|
-
creation_date: 1972
|
|
10
|
-
confirmation_date: 2010
|
|
11
|
-
description: |
|
|
12
|
-
The United Nations recommended system was approved in 1972 (II/11), based on a report
|
|
13
|
-
prepared by D. N. Sharma. The note on the system was published in volume II of the
|
|
14
|
-
conference report.
|
|
15
|
-
|
|
16
|
-
There is no evidence of the use of the system either in Nepal or in international cartographic
|
|
17
|
-
products. The resolution IV/17 (1982) recommended association, inter alia, with Nepal in
|
|
18
|
-
carrying out further studies on the system. In Nepal a system of romanization is employed by
|
|
19
|
-
the Nepal Survey Department (NSD). This system has been applied to names appearing on
|
|
20
|
-
national mapping, and it is also used in the Geographic Information Infrastructure Programme
|
|
21
|
-
(NGIIP).
|
|
22
|
-
|
|
23
|
-
Nepali (Nepālī) uses the alphasyllabic script Devanāgarī.
|
|
24
|
-
|
|
25
|
-
notes:
|
|
26
|
-
|
|
27
|
-
- In normal spelling ṙ and ṙh are not marked, instead dotless ड ḍa, ढ ḍha are used to denote these sounds.
|
|
28
|
-
- |
|
|
29
|
-
Ligatures may be formed with r as the first component: ~ह rha.
|
|
30
|
-
|
|
31
|
-
tests:
|
|
32
|
-
- source: "लेखन"
|
|
33
|
-
expected: "laekhana"
|
|
34
|
-
- source: "मुद्रा"
|
|
35
|
-
expected: "maudaaraā"
|
|
36
|
-
- source: "प्रशंसा"
|
|
37
|
-
expected: "paarashaṁsaā"
|
|
38
|
-
- source: "अंक"
|
|
39
|
-
expected: "aṁka"
|
|
40
|
-
- source: "नेकपाले स्थगित स्थायी कमिटीको बैठक भदौ गते बोलाउने भएको"
|
|
41
|
-
expected: "naekapaālae saathagaita saathaāyaī kamaiṭaīkao baaiṭhaka bhadaau gatae baolaāunae bhaekao"
|
|
42
|
-
- source: "न घर रह्यो, न परिवार"
|
|
43
|
-
expected: "na ghara rahaayao, na paraivaāra"
|
|
44
|
-
- source: "ढोरपाटनमा भुजीखोला बाढीपहिरोले अभिभावक गुमाएका बालबालिकाको बिचल्ली"
|
|
45
|
-
expected: "ḍhaorapaāṭanamaā bhaujaīkhaolaā baāḍhaīpahairaolae abhaibhaāvaka gaumaāekaā baālabaālaikaākao baichalaalaī"
|
|
46
|
-
- source: "सुस्मिताका काका हेमबहादुर र काकीलाई पनि पहिरोले बगायो"
|
|
47
|
-
expected: "sausaamaitaākaā kaākaā haemabahaādaura ra kaākaīlaāī panai pahairaolae bagaāyao"
|
|
48
|
-
- source: "संविधान जारी भएसँगै सार्वजनिक प्रशासनमा नयाँ उत्साह आउने अपेक्षा थियो"
|
|
49
|
-
expected: "saṁvaidhaāna jaāraī bhaesam̐gaai saāraavajanaika paarashaāsanamaā nayaām̐ utaasaāha āunae apaekaaṣhaā thaiyao"
|
|
50
|
-
- source: "देशमा कोरोना संक्रमित र मृतकको संख्या हरेक दिन बढ्दो छ"
|
|
51
|
-
expected: "daeshamaā kaoraonaā saṁkaaramaita ra maṛtakakao saṁkhaayaā haraeka daina baḍhaadao chha"
|
|
52
|
-
- source: "गाउँपालिकाका अध्यक्ष टिका गुरुङका अनुसार विष्णुदासलाई राजुले सुत्नका लागि बेलुका साथी लगेका थिए"
|
|
53
|
-
expected: "gaāum̐paālaikaākaā adhaayakaaṣha ṭaikaā gaurauṅakaā anausaāra vaiṣhaaṇaudaāsalaāī raājaulae sautaanakaā laāgai baelaukaā saāthaī lagaekaā thaie"
|
|
54
|
-
- source: "यो आयोजना गाउँपालिकाको केन्द्र तेल्लोकमा पर्छ"
|
|
55
|
-
expected: "yao āyaojanaā gaāum̐paālaikaākao kaenaadaara taelaalaokamaā paraachha"
|
|
56
|
-
- source: "सुस्मिताका काका हेमबहादुर र काकीलाई पनि पहिरोले बगायो"
|
|
57
|
-
expected: "sausaamaitaākaā kaākaā haemabahaādaura ra kaākaīlaāī panai pahairaolae bagaāyao"
|
|
58
|
-
- source: "चैत पहिलो साता घर आएका उनी लकडाउन भएपछि यतै रोकिए"
|
|
59
|
-
expected: "chaaita pahailao saātaā ghara āekaā unaī lakaḍaāuna bhaepachhai yataai raokaie"
|
|
60
|
-
- source: "काम गर्न जानेको हकमा रोजगारदाता कम्पनीको पत्रसँगै वडा र जिल्ला प्रशासनको सिफारिस अनिवार्य गरिएको छ"
|
|
61
|
-
expected: "kaāma garaana jaānaekao hakamaā raojagaāradaātaā kamaapanaīkao pataarasam̐gaai vaḍaā ra jailaalaā paarashaāsanakao saiphaāraisa anaivaāraaya garaiekao chha"
|
|
62
|
-
|
|
63
|
-
map:
|
|
64
|
-
|
|
65
|
-
characters:
|
|
66
|
-
|
|
67
|
-
# Vowels and Diphthongs
|
|
68
|
-
'अ': 'a'
|
|
69
|
-
'आ': 'ā'
|
|
70
|
-
'इ': 'i'
|
|
71
|
-
'ई': 'ī'
|
|
72
|
-
'उ': 'u'
|
|
73
|
-
'ऊ': 'ū'
|
|
74
|
-
'ऋ': 'ṛ'
|
|
75
|
-
'ॠ': 'ṝ'
|
|
76
|
-
'ऌ': 'l̤'
|
|
77
|
-
'ए': 'e'
|
|
78
|
-
'ऐ': 'ai'
|
|
79
|
-
'ओ': 'o'
|
|
80
|
-
'औ': 'au'
|
|
81
|
-
|
|
82
|
-
# Medials # Needed for connecting consonants
|
|
83
|
-
|
|
84
|
-
'ा': "ā"
|
|
85
|
-
'ि': "i"
|
|
86
|
-
'ी': "ī"
|
|
87
|
-
'ु': "u"
|
|
88
|
-
'ू': "ū"
|
|
89
|
-
'ृ': "ṛ"
|
|
90
|
-
'े': "e"
|
|
91
|
-
'ै': "ai"
|
|
92
|
-
'ो': "o"
|
|
93
|
-
'ौ': "au"
|
|
94
|
-
|
|
95
|
-
# Consonants (see Note 1)
|
|
96
|
-
|
|
97
|
-
# Gutturals
|
|
98
|
-
'क': 'ka'
|
|
99
|
-
'ख': 'kha'
|
|
100
|
-
'ग': 'ga'
|
|
101
|
-
'घ': 'gha'
|
|
102
|
-
'ङ': 'ṅa'
|
|
103
|
-
|
|
104
|
-
# Palatals
|
|
105
|
-
'च': 'cha'
|
|
106
|
-
'छ': 'chha'
|
|
107
|
-
'ज': 'ja'
|
|
108
|
-
'झ': 'jha'
|
|
109
|
-
'ञ': 'ña'
|
|
110
|
-
|
|
111
|
-
# Cerebrals
|
|
112
|
-
'ट': 'ṭa'
|
|
113
|
-
'ठ': 'ṭha'
|
|
114
|
-
'ड': 'ḍa'
|
|
115
|
-
'ढ': 'ḍha'
|
|
116
|
-
'ण': 'ṇa'
|
|
117
|
-
|
|
118
|
-
# Dentals
|
|
119
|
-
'त': 'ta'
|
|
120
|
-
'थ': 'tha'
|
|
121
|
-
'द': 'da'
|
|
122
|
-
'ध': 'dha'
|
|
123
|
-
'न': 'na'
|
|
124
|
-
|
|
125
|
-
# Labials
|
|
126
|
-
'प': 'pa'
|
|
127
|
-
'फ': 'pha'
|
|
128
|
-
'ब': 'ba'
|
|
129
|
-
'भ': 'bha'
|
|
130
|
-
'म': 'ma'
|
|
131
|
-
|
|
132
|
-
# Semivowels
|
|
133
|
-
'य': 'ya'
|
|
134
|
-
'र': 'ra'
|
|
135
|
-
'ल': 'la'
|
|
136
|
-
'व': 'va' # or wa [Note#3]
|
|
137
|
-
|
|
138
|
-
# Sibilants
|
|
139
|
-
'श': 'sha'
|
|
140
|
-
'ष': 'ṣha'
|
|
141
|
-
'स': 'sa'
|
|
142
|
-
|
|
143
|
-
# Dotted variants
|
|
144
|
-
'क़': qa
|
|
145
|
-
'ख़': ḳha
|
|
146
|
-
'ग़': ga
|
|
147
|
-
'ज़': za
|
|
148
|
-
'ड़': ṙa
|
|
149
|
-
'ढ़': ṙha
|
|
150
|
-
'फ़': fa
|
|
151
|
-
|
|
152
|
-
|
|
153
|
-
# Aspirate
|
|
154
|
-
'ह': 'ha'
|
|
155
|
-
|
|
156
|
-
# Anusvāra
|
|
157
|
-
'ं': 'ṁ'
|
|
158
|
-
|
|
159
|
-
# Anunāsika
|
|
160
|
-
'ँ': 'm̐'
|
|
161
|
-
|
|
162
|
-
# halanta
|
|
163
|
-
'्': 'a'
|
|
@@ -1,166 +0,0 @@
|
|
|
1
|
-
---
|
|
2
|
-
authority_id: ungegn
|
|
3
|
-
id: 1987
|
|
4
|
-
language: rus
|
|
5
|
-
source_script: Cyrl
|
|
6
|
-
destination_script: Latn
|
|
7
|
-
name: REPORT ON THE CURRENT STATUS OF UNITED NATIONS ROMANIZATION SYSTEMS FOR GEOGRAPHICAL NAMES -- Russian Romanization system
|
|
8
|
-
url: http://www.eki.ee/wgrs/rom1_ru.htm
|
|
9
|
-
creation_date: 1987
|
|
10
|
-
confirmation_date: 2016
|
|
11
|
-
description: |
|
|
12
|
-
The United Nations recommended system was approved in 1987 (V/18),
|
|
13
|
-
based on the official system of the Main Administration of Geodesy and
|
|
14
|
-
Cartography of the former Soviet Union, also known as the GOST 1983
|
|
15
|
-
system (GOST 16876-71). The table was published as an annex to the
|
|
16
|
-
resolution.
|
|
17
|
-
|
|
18
|
-
The system is used in the Russian Federation and increasingly in
|
|
19
|
-
international cartographic products.
|
|
20
|
-
|
|
21
|
-
Russian uses the Cyrillic script which is alphabetic. The
|
|
22
|
-
romanization table is unambiguous and can be applied automatically. The
|
|
23
|
-
system is reversible, although rarely there can be ambiguities.
|
|
24
|
-
|
|
25
|
-
notes:
|
|
26
|
-
- "Cursive forms of some characters might be formed differently: Аа Бб
|
|
27
|
-
Вв Гг Дд Ее Ёё Жж Зз Ии Йй Кк Лл Мм Нн Оо Пп Рр Сс Тт Уу Фф Хх Цц Чч Шш
|
|
28
|
-
Щщ Ъъ Ыы Ьь Ээ Юю Яя."
|
|
29
|
-
|
|
30
|
-
- Fifth United Nations Conference on the Standardization of
|
|
31
|
-
Geographical Names. Montreal, 18–31 August 1987. Vol. I. Report of the
|
|
32
|
-
Conference, pp. 40–41.
|
|
33
|
-
|
|
34
|
-
tests:
|
|
35
|
-
- source: Aнaпa
|
|
36
|
-
expected: Anapa
|
|
37
|
-
|
|
38
|
-
- source: Бaбушкин
|
|
39
|
-
expected: Babuškin
|
|
40
|
-
|
|
41
|
-
- source: Вaвилово
|
|
42
|
-
expected: Vavilovo
|
|
43
|
-
|
|
44
|
-
- source: Гaгaрин
|
|
45
|
-
expected: Gagarin
|
|
46
|
-
|
|
47
|
-
- source: Дудинкa
|
|
48
|
-
expected: Dudinka
|
|
49
|
-
|
|
50
|
-
- source: Елисeeвкa
|
|
51
|
-
expected: Eliseevka
|
|
52
|
-
|
|
53
|
-
- source: Ёлкино
|
|
54
|
-
expected: "\u00CBlkino"
|
|
55
|
-
|
|
56
|
-
- source: Псëл
|
|
57
|
-
expected: Psël
|
|
58
|
-
|
|
59
|
-
- source: Жужa
|
|
60
|
-
expected: Žuža
|
|
61
|
-
|
|
62
|
-
- source: Звëздный
|
|
63
|
-
expected: Zvëzdnyj
|
|
64
|
-
|
|
65
|
-
- source: Идрицa
|
|
66
|
-
expected: Idrica
|
|
67
|
-
|
|
68
|
-
- source: Зaрaйск
|
|
69
|
-
expected: Zarajsk
|
|
70
|
-
|
|
71
|
-
- source: Кокaнд
|
|
72
|
-
expected: Kokand
|
|
73
|
-
|
|
74
|
-
- source: Лaлвaр
|
|
75
|
-
expected: Lalvar
|
|
76
|
-
|
|
77
|
-
- source: Мaймaк
|
|
78
|
-
expected: Majmak
|
|
79
|
-
|
|
80
|
-
- source: Нeжин
|
|
81
|
-
expected: Nežin
|
|
82
|
-
|
|
83
|
-
- source: Обoдoвкa
|
|
84
|
-
expected: Obodovka
|
|
85
|
-
|
|
86
|
-
- source: Пaп
|
|
87
|
-
expected: Pap
|
|
88
|
-
|
|
89
|
-
- source: Рeбрихa
|
|
90
|
-
expected: Rebriha
|
|
91
|
-
|
|
92
|
-
- source: Сaсoвo
|
|
93
|
-
expected: Sasovo
|
|
94
|
-
|
|
95
|
-
- source: Тaттa
|
|
96
|
-
expected: Tatta
|
|
97
|
-
|
|
98
|
-
- source: Уржум
|
|
99
|
-
expected: Uržum
|
|
100
|
-
|
|
101
|
-
- source: Фoфaнoвo
|
|
102
|
-
expected: Fofanovo
|
|
103
|
-
|
|
104
|
-
- source: Хoхломa
|
|
105
|
-
expected: Hohloma
|
|
106
|
-
|
|
107
|
-
- source: Цвeткoвo
|
|
108
|
-
expected: Cvetkovo
|
|
109
|
-
|
|
110
|
-
- source: Чeчeльник
|
|
111
|
-
expected: Čečel’nik
|
|
112
|
-
|
|
113
|
-
- source: Шишкинo
|
|
114
|
-
expected: Šiškino
|
|
115
|
-
|
|
116
|
-
- source: Щукинo
|
|
117
|
-
expected: Ščukino
|
|
118
|
-
|
|
119
|
-
- source: Пoдъячeвo
|
|
120
|
-
expected: Pod”jačevo
|
|
121
|
-
|
|
122
|
-
- source: Ыныкчaнский
|
|
123
|
-
expected: Ynykčanskij
|
|
124
|
-
|
|
125
|
-
- source: Пaрaньгa
|
|
126
|
-
expected: Paran’ga
|
|
127
|
-
|
|
128
|
-
- source: Кaзaнь
|
|
129
|
-
expected: Kazan’
|
|
130
|
-
|
|
131
|
-
- source: Щучьe
|
|
132
|
-
expected: Ščuč’e
|
|
133
|
-
|
|
134
|
-
- source: Элистa
|
|
135
|
-
expected: Èlista
|
|
136
|
-
|
|
137
|
-
- source: Юринo
|
|
138
|
-
expected: Jurino
|
|
139
|
-
|
|
140
|
-
- source: Юхнoв
|
|
141
|
-
expected: Juhnov
|
|
142
|
-
|
|
143
|
-
- source: Юрюзaнь
|
|
144
|
-
expected: Jurjuzan’
|
|
145
|
-
|
|
146
|
-
- source: Ямaл
|
|
147
|
-
expected: Jamal
|
|
148
|
-
|
|
149
|
-
- source: Язъявaн
|
|
150
|
-
expected: Jaz”javan
|
|
151
|
-
|
|
152
|
-
- source: Яя
|
|
153
|
-
expected: Jaja
|
|
154
|
-
|
|
155
|
-
- source: Вязьмa
|
|
156
|
-
expected: Vjaz’ma
|
|
157
|
-
|
|
158
|
-
|
|
159
|
-
map:
|
|
160
|
-
inherit: gost-rus-Cyrl-Latn-16876-71-1983
|
|
161
|
-
|
|
162
|
-
characters:
|
|
163
|
-
'\u042A' : '”' # Ъ
|
|
164
|
-
'\u042C' : '’' # Ь
|
|
165
|
-
'\u044A' : '”' # ъ
|
|
166
|
-
'\u044C' : '’' # ь
|
|
@@ -1,30 +0,0 @@
|
|
|
1
|
-
---
|
|
2
|
-
authority_id: un
|
|
3
|
-
id: 1998
|
|
4
|
-
language: ukr
|
|
5
|
-
source_script: Cyrl
|
|
6
|
-
destination_script: Latn
|
|
7
|
-
name: ROMANIZATION SYSTEM FOR BELARUSIAN, RUSSIAN AND UKRAINIAN CYRILLIC
|
|
8
|
-
url: https://unstats.un.org/unsd/geoinfo/UNGEGN/docs/7th-uncsgn-docs/econf/7th_UNCSGN_econf.91_3_Add1.pdf
|
|
9
|
-
creation_date: 1998
|
|
10
|
-
|
|
11
|
-
tests:
|
|
12
|
-
|
|
13
|
-
map:
|
|
14
|
-
inherit: gost-rus-Cyrl-Latn-16876-71-1983
|
|
15
|
-
|
|
16
|
-
characters:
|
|
17
|
-
'\u0490' : '?' # Ґ
|
|
18
|
-
'\u0491' : '?' # ґ
|
|
19
|
-
|
|
20
|
-
'\u0404' : "Je" # Є
|
|
21
|
-
'\u0454' : "je" # є
|
|
22
|
-
|
|
23
|
-
'\u0406' : 'I' # І
|
|
24
|
-
'\u0456' : 'i' # і
|
|
25
|
-
|
|
26
|
-
'\u0407' : 'I' # Ї
|
|
27
|
-
'\u0457' : 'i' # ї
|
|
28
|
-
|
|
29
|
-
'\u2019' : '?'
|
|
30
|
-
"'" : '?'
|