interscript-maps 2.2.0 → 2.2.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/interscript-maps.gemspec +1 -1
- data/interscript-maps.yaml +300 -111
- data/maps/acadsin-zho-Hani-Latn-2002.imp +2 -2
- data/maps/alalc-amh-Ethi-Latn-1997.imp +18 -14
- data/maps/alalc-amh-Ethi-Latn-2011.imp +1 -1
- data/maps/alalc-ara-Arab-Latn-1997.imp +1 -1
- data/maps/alalc-asm-Deva-Latn-1997.imp +1 -1
- data/maps/alalc-asm-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-aze-Arab-Latn-1997.imp +1 -1
- data/maps/alalc-aze-Cyrl-Latn-1997.imp +1 -1
- data/maps/alalc-bel-Cyrl-Latn-1997.imp +4 -4
- data/maps/alalc-ben-Beng-Latn-1997.imp +1 -1
- data/maps/alalc-ben-Beng-Latn-2017.imp +1 -1
- data/maps/alalc-bul-Cyrl-Latn-1997.imp +1 -1
- data/maps/alalc-div-Thaa-Latn-1997.imp +1 -1
- data/maps/alalc-ell-Grek-Latn-1997.imp +1 -1
- data/maps/alalc-ell-Grek-Latn-2010.imp +1 -1
- data/maps/alalc-guj-Gujr-Latn-1997.imp +1 -1
- data/maps/alalc-guj-Gujr-Latn-2011.imp +1 -1
- data/maps/alalc-hin-Deva-Latn-1997.imp +1 -1
- data/maps/alalc-hin-Deva-Latn-2011.imp +1 -1
- data/maps/alalc-kan-Kana-Latn-1997.imp +1 -1
- data/maps/alalc-kan-Kana-Latn-2011.imp +1 -1
- data/maps/alalc-kat-Geok-Latn-1997.imp +3 -3
- data/maps/alalc-kat-Geor-Latn-1997.imp +12 -12
- data/maps/alalc-kor-Hang-Latn-1997.imp +1 -1
- data/maps/alalc-mal-Mlym-Latn-1997.imp +1 -1
- data/maps/alalc-mar-Deva-Latn-1997.imp +1 -1
- data/maps/alalc-mar-Deva-Latn-2011.imp +1 -1
- data/maps/alalc-mkd-Cyrl-Latn-1997.imp +2 -2
- data/maps/alalc-mkd-Cyrl-Latn-2013.imp +2 -2
- data/maps/alalc-mon-Cyrl-Latn-1997.imp +3 -3
- data/maps/alalc-ori-Orya-Latn-1997.imp +1 -1
- data/maps/alalc-ori-Orya-Latn-2011.imp +1 -1
- data/maps/alalc-pan-Guru-Latn-1997.imp +1 -1
- data/maps/alalc-pan-Guru-Latn-2011.imp +1 -1
- data/maps/alalc-per-Arab-Latn-1997.imp +1 -1
- data/maps/alalc-pli-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-pra-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-rus-Cyrl-Latn-1997.imp +2 -2
- data/maps/alalc-rus-Cyrl-Latn-2012.imp +1 -1
- data/maps/alalc-san-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-sin-Sinh-Latn-1997.imp +1 -1
- data/maps/alalc-sin-Sinh-Latn-2011.imp +1 -1
- data/maps/alalc-srp-Cyrl-Latn-1997.imp +2 -2
- data/maps/alalc-srp-Cyrl-Latn-2013.imp +1 -1
- data/maps/alalc-tam-Taml-Latn-1997.imp +1 -1
- data/maps/alalc-tam-Taml-Latn-2011.imp +1 -1
- data/maps/alalc-tel-Telu-Latn-1997.imp +2 -2
- data/maps/alalc-tel-Telu-Latn-2011.imp +1 -1
- data/maps/alalc-tir-Ethi-Latn-1997.imp +429 -0
- data/maps/alalc-tir-Ethi-Latn-2011.imp +85 -0
- data/maps/alalc-ukr-Cyrl-Latn-1997.imp +1 -1
- data/maps/alalc-ukr-Cyrl-Latn-2011.imp +1 -1
- data/maps/apcbg-bul-Cyrl-Latn-1995.imp +7 -4
- data/maps/az-aze-Cyrl-Latn-1939.imp +1 -0
- data/maps/az-aze-Cyrl-Latn-1958.imp +1 -0
- data/maps/bgn-jpn-Hrkt-Latn-1962.imp +5 -5
- data/maps/bgn-kor-Hang-Latn-1943.imp +1 -1
- data/maps/bgn-kor-Kore-Latn-1943.imp +1 -1
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +11 -11
- data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +1 -1
- data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +2 -2
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +2 -2
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +10 -4
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +1 -1
- data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +1 -1
- data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +4 -4
- data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +1 -1
- data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +1 -1
- data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +1 -1
- data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +4 -3
- data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +1 -1
- data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +1 -1
- data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +2 -2
- data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +1 -1
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +1 -1
- data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +8 -8
- data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +2 -2
- data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +4 -4
- data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +3 -3
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +1 -1
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +4 -4
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +4 -3
- data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +1 -1
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +2 -2
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +1 -1
- data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +3 -3
- data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +4 -4
- data/maps/bgnpcgn-per-Arab-Latn-1958.imp +19 -19
- data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +15 -15
- data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +15 -15
- data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +16 -16
- data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +2 -2
- data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +5 -5
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +1 -1
- data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +1 -1
- data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +5 -3
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +1 -1
- data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +1 -1
- data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +1 -1
- data/maps/bgnpcgn-tir-Ethi-Latn-2007.imp +511 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +1 -1
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +1 -1
- data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +15 -15
- data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +3 -3
- data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +1 -1
- data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +1 -1
- data/maps/by-bel-Cyrl-Latn-2007.imp +7 -5
- data/maps/dos-nep-Deva-Latn-1997.imp +2 -2
- data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +1 -1
- data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +1 -1
- data/maps/ggg-kat-Geor-Latn-2002.imp +3 -3
- data/maps/gki-bel-Cyrl-Latn-2000.imp +1 -1
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +1 -1
- data/maps/iso-ara-Arab-Latn-233-1984.imp +14 -14
- data/maps/iso-ben-Beng-Latn-15919-2001.imp +1 -1
- data/maps/iso-prs-Arab-Latn-233-3-1999.imp +14 -14
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +5 -5
- data/maps/mext-jpn-Hrkt-Latn-1954.imp +2 -1
- data/maps/moct-kor-Hang-Latn-2000.imp +1 -1
- data/maps/mofa-jpn-Hrkt-Latn-1989.imp +1 -1
- data/maps/mv-div-Thaa-Latn-1987.imp +1 -1
- data/maps/mvd-bel-Cyrl-Latn-2008.imp +5 -5
- data/maps/mvd-bel-Cyrl-Latn-2010.imp +2 -5
- data/maps/mvd-rus-Cyrl-Latn-2008.imp +4 -3
- data/maps/mvd-rus-Cyrl-Latn-2010.imp +2 -5
- data/maps/odni-ara-Arab-Latn-2004.imp +1 -1
- data/maps/odni-ara-Arab-Latn-2015.imp +1 -1
- data/maps/odni-aze-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-bel-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-bul-Cyrl-Latn-2005.imp +2 -2
- data/maps/odni-bul-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-che-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-fas-Arab-Latn-2004.imp +14 -14
- data/maps/odni-fas-Arab-Latn-2015.imp +15 -15
- data/maps/odni-hin-Deva-Latn-2004.imp +20 -20
- data/maps/odni-hin-Deva-Latn-2015.imp +25 -26
- data/maps/odni-kat-Geor-Latn-2015.imp +2 -3
- data/maps/odni-kaz-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-kir-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-kor-Hang-Latn-2015.imp +1 -1
- data/maps/odni-mkd-Cyrl-Latn-2005.imp +1 -1
- data/maps/odni-mkd-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-prs-Arab-Latn-2015.imp +1 -1
- data/maps/odni-pus-Arab-Latn-2011.imp +1 -1
- data/maps/odni-rus-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-srp-Cyrl-Latn-2005.imp +2 -2
- data/maps/odni-srp-Cyrl-Latn-2015.imp +8 -8
- data/maps/odni-tat-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-tgk-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-tuk-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-uig-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-ukr-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-urd-Arab-Latn-2015.imp +21 -21
- data/maps/odni-uzb-Cyrl-Latn-2015.imp +1 -1
- data/maps/ses-ara-Arab-Latn-1930.imp +14 -14
- data/maps/un-amh-Ethi-Latn-2016.imp +1 -1
- data/maps/un-ara-Arab-Latn-1971.imp +5 -5
- data/maps/un-ara-Arab-Latn-1972.imp +4 -4
- data/maps/un-ara-Arab-Latn-2017.imp +15 -15
- data/maps/un-asm-Beng-Latn-1972.imp +1 -1
- data/maps/un-bel-Cyrl-Latn-2007.imp +2 -2
- data/maps/un-ben-Beng-Latn-2016.imp +1 -1
- data/maps/un-bul-Cyrl-Latn-1977.imp +197 -0
- data/maps/un-ell-Grek-Latn-1987-phonetic.imp +5 -1
- data/maps/un-ell-Grek-Latn-1987-tl.imp +1 -1
- data/maps/un-ell-Grek-Latn-1987-ts.imp +2 -2
- data/maps/un-guj-Gujr-Latn-1972.imp +1 -1
- data/maps/un-hin-Deva-Latn-2016.imp +1 -1
- data/maps/un-kan-Kana-Latn-2016.imp +1 -1
- data/maps/un-mal-Mlym-Latn-1972.imp +1 -1
- data/maps/un-mar-Deva-Latn-2016.imp +1 -1
- data/maps/un-mkd-Cyrl-Latn-1977.imp +119 -0
- data/maps/un-mon-Mong-Latn-general-2013.imp +1 -1
- data/maps/un-mon-Mong-Latn-phonetic-2013.imp +1 -1
- data/maps/un-nep-Deva-Latn-1972.imp +1 -1
- data/maps/un-nep-Deva-Latn-2013.imp +1 -1
- data/maps/un-ori-Orya-Latn-1972.imp +1 -1
- data/maps/un-pan-Guru-Latn-1972.imp +1 -1
- data/maps/un-prs-Arab-Latn-1967.imp +15 -15
- data/maps/un-rus-Cyrl-Latn-1987.imp +1 -1
- data/maps/un-sin-Sinh-Latn-1972.imp +1 -1
- data/maps/un-srp-Cyrl-Latn-1997.imp +47 -0
- data/maps/un-tam-Taml-Latn-1972.imp +1 -1
- data/maps/un-tel-Telu-Latn-1972.imp +1 -1
- data/maps/un-ukr-Cyrl-Latn-1998.imp +1 -1
- data/maps/un-ukr-Cyrl-Latn-2012.imp +1 -1
- data/maps/un-urd-Arab-Latn-1972.imp +15 -15
- data/maps/var-amh-Ethi-Latn-eae-2003.imp +48 -43
- metadata +7 -1
|
@@ -4,14 +4,14 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:isl
|
|
5
5
|
source_script: Latn
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Transliteration of Icelandic (1947)
|
|
8
8
|
url: https://github.com/interscript/interscript/files/5180785/BGN_Romanization_Guide_1964_icelandic_1947.pdf
|
|
9
9
|
creation_date: 1964
|
|
10
10
|
description: |
|
|
11
11
|
The BGN and the PCGN in 1947 jointly agreed to the transliteration of two letters of the Icelandic alphabet which,
|
|
12
12
|
although used in writing Old English, have disappeared from the modern English alphabet.
|
|
13
13
|
|
|
14
|
-
The transliterated letters are the edh (Ð ð) and the thorn (Þ þ),
|
|
14
|
+
The transliterated letters are the edh (Ð ð) and the thorn (Þ þ), pronounced as th in "thus" and th in "think," respectively.
|
|
15
15
|
|
|
16
16
|
It was felt that it was better to transliterate these letters into familiar symbols than preserve such unfamiliar letters in the nomenclature.
|
|
17
17
|
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:isl
|
|
5
5
|
source_script: Latn
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Roman-Script Spelling Convention of Icelandic (1968 Agreement)
|
|
8
8
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/693794/ROMAN-SCRIPT_SPELLING_CONVENTIONS.pdf
|
|
9
9
|
creation_date: 1968
|
|
10
10
|
|
|
@@ -4,13 +4,13 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:kat
|
|
5
5
|
source_script: Geor
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization of Georgian (1981)
|
|
8
8
|
url: https://transliteration.eki.ee/pdf/Georgian.pdf
|
|
9
9
|
creation_date: 1981
|
|
10
10
|
confirmation_date: 1981
|
|
11
11
|
description: |
|
|
12
12
|
BGN/PCGN system of 1981.
|
|
13
|
-
|
|
13
|
+
|
|
14
14
|
notes:
|
|
15
15
|
}
|
|
16
16
|
|
|
@@ -75,18 +75,18 @@ stage {
|
|
|
75
75
|
sub "\u10d4", "e" # ე
|
|
76
76
|
sub "\u10d5", "v" # ვ
|
|
77
77
|
sub "\u10d6", "z" # ზ
|
|
78
|
-
|
|
78
|
+
|
|
79
79
|
sub "\u10f1", "ey" # ჱ
|
|
80
|
-
|
|
80
|
+
|
|
81
81
|
sub "\u10d7", "t’" # თ
|
|
82
82
|
sub "\u10d8", "i" # ი
|
|
83
83
|
sub "\u10d9", "k’" # კ
|
|
84
84
|
sub "\u10da", "l" # ლ
|
|
85
85
|
sub "\u10db", "m" # მ
|
|
86
86
|
sub "\u10dc", "n" # ნ
|
|
87
|
-
|
|
87
|
+
|
|
88
88
|
sub "\u10f2", "j" # ჲ
|
|
89
|
-
|
|
89
|
+
|
|
90
90
|
sub "\u10dd", "o" # ო
|
|
91
91
|
sub "\u10de", "p" # პ
|
|
92
92
|
sub "\u10df", "zh" # ჟ
|
|
@@ -105,9 +105,9 @@ stage {
|
|
|
105
105
|
sub "\u10ec", "ts" # წ
|
|
106
106
|
sub "\u10ed", "ch" # ჭ
|
|
107
107
|
sub "\u10ee", "kh" # ხ
|
|
108
|
-
|
|
108
|
+
|
|
109
109
|
sub "\u10f4", "q’" # ჴ
|
|
110
|
-
|
|
110
|
+
|
|
111
111
|
sub "\u10ef", "j" # ჯ
|
|
112
112
|
sub "\u10f0", "h" # ჰ
|
|
113
113
|
}
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:kat
|
|
5
5
|
source_script: Geor
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization of Georgian (2009 Agreement, Georgia 2011 national system)
|
|
8
8
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/810202/ROMANIZATION_OF_GEORGIAN.pdf
|
|
9
9
|
creation_date: 2009
|
|
10
10
|
confirmation_date: 2011
|
|
@@ -16,7 +16,7 @@ metadata {
|
|
|
16
16
|
the Mkhedruli alphabet, as presently used in Georgia. This system was
|
|
17
17
|
adopted by BGN and PCGN in 2009, superseding the BGN/PCGN system of
|
|
18
18
|
1981.
|
|
19
|
-
|
|
19
|
+
|
|
20
20
|
notes:
|
|
21
21
|
- This system denotes ejective (glottalised) consonants by means of
|
|
22
22
|
an apostrophe. The BGN/PCGN 1981 system instead used the apostrophe to
|
|
@@ -1,18 +1,18 @@
|
|
|
1
1
|
metadata {
|
|
2
|
-
|
|
2
|
+
|
|
3
3
|
authority_id: bgnpcgn
|
|
4
4
|
id: 1979
|
|
5
5
|
language: iso-639-2:kaz
|
|
6
6
|
source_script: Cyrl
|
|
7
7
|
destination_script: Latn
|
|
8
|
-
name: Romanization of Kazakh
|
|
8
|
+
name: Romanization of Kazakh (1979)
|
|
9
9
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/811511/ROMANIZATION_OF_KAZAKH.pdf
|
|
10
10
|
creation_date: 1979
|
|
11
11
|
confirmation_date: 2019
|
|
12
12
|
description: |
|
|
13
13
|
The BGN/PCGN system for Kazakh was designed for use in romanizing names written in the Kazakh Cyrillic alphabet.
|
|
14
14
|
The Kazakh Cyrillic alphabet contains nine characters not present in the Russian alphabet: ә, ғ, қ, ң, ө, ұ, ү, һ and і.
|
|
15
|
-
|
|
15
|
+
|
|
16
16
|
notes:
|
|
17
17
|
- The character sequences гһ, зһ, кһ, нг, сһ and цһ may be romanized g·h, z·h, k·h, n·g, s·h
|
|
18
18
|
and ts·h in order to differentiate those romanizations from the digraphs gh, zh, kh, ng, sh,
|
|
@@ -144,7 +144,7 @@ stage {
|
|
|
144
144
|
sub "\u042D", "Ė" # Э
|
|
145
145
|
sub "\u042E", "Yu" # Ю
|
|
146
146
|
sub "\u042F", "Ya" # Я
|
|
147
|
-
|
|
147
|
+
|
|
148
148
|
sub "\u0430", "a" # а
|
|
149
149
|
sub "\u04D9", "ä" # ә
|
|
150
150
|
sub "\u0431", "b" # б
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:kir
|
|
5
5
|
source_script: Cyrl
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name: Romanization of Kyrgyz
|
|
7
|
+
name: Romanization of Kyrgyz (1979)
|
|
8
8
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/816663/ROMANIZATION_OF_KYRGYZ.pdf
|
|
9
9
|
creation_date: 1979
|
|
10
10
|
confirmation_date: 2019
|
|
@@ -12,7 +12,7 @@ metadata {
|
|
|
12
12
|
The BGN/PCGN system for Kyrgyz Cyrillic was designed for use in romanizing names written
|
|
13
13
|
in the Kyrgyz Cyrillic alphabet. The Kyrgyz Cyrillic alphabet contains three characters not present in
|
|
14
14
|
the Russian alphabet: Ң, Ө, and Ү.
|
|
15
|
-
|
|
15
|
+
|
|
16
16
|
notes:
|
|
17
17
|
- Both Kyrgyz and Kirghiz may frequently be seen as the language name; both these spellings are used in the
|
|
18
18
|
ISO 639 Standard on the representation of names for languages.
|
|
@@ -127,7 +127,7 @@ stage {
|
|
|
127
127
|
sub "\u042D", "E" # Э
|
|
128
128
|
sub "\u042E", "Yu" # Ю
|
|
129
129
|
sub "\u042F", "Ya" # Я
|
|
130
|
-
|
|
130
|
+
|
|
131
131
|
sub "\u0430", "a" # а
|
|
132
132
|
sub "\u0431", "b" # б
|
|
133
133
|
sub "\u0432", "v" # в
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:kor
|
|
5
5
|
source_script: Hang
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization of Korean -- For DPRK (Hangul to Latin) (1945 Agreement)
|
|
8
8
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/693725/ROMANIZATION_OF_KOREAN-_MR_for_DPRK.pdf
|
|
9
9
|
creation_date: 1945
|
|
10
10
|
adoption_date:
|
|
@@ -4,10 +4,10 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:kor
|
|
5
5
|
source_script: Hang
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name: Ministry of Culture and Tourism System (2000)
|
|
8
|
-
url:
|
|
9
|
-
creation_date:
|
|
10
|
-
adoption_date:
|
|
7
|
+
name: Romanization of Korean -- For the ROK (2011 Agreement, Ministry of Culture and Tourism System (2000))
|
|
8
|
+
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/693724/ROMANIZATION_OF_KOREAN-__MOCT_for_ROK.pdf
|
|
9
|
+
creation_date: 2011
|
|
10
|
+
adoption_date: 2011
|
|
11
11
|
description:
|
|
12
12
|
|
|
13
13
|
notes:
|
|
@@ -4,10 +4,11 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:kor
|
|
5
5
|
source_script: Kore
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name: Ministry of Culture and Tourism System (2000)
|
|
7
|
+
name: Romanization of Korean -- For the ROK -- Korean to Latin (2011 Agreement, Ministry of Culture and Tourism System (2000))
|
|
8
|
+
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/693724/ROMANIZATION_OF_KOREAN-__MOCT_for_ROK.pdf
|
|
8
9
|
url: ""
|
|
9
|
-
creation_date:
|
|
10
|
-
adoption_date:
|
|
10
|
+
creation_date: 2011
|
|
11
|
+
adoption_date: 2011
|
|
11
12
|
description: |
|
|
12
13
|
Establishes a system for the transliteration of the characters of Korean script into Latin characters.
|
|
13
14
|
Intended to provide a means for international communication of written documents.
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: kur
|
|
5
5
|
source_script: Arab
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization of Kurdish (2007)
|
|
8
8
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/693727/ROMANIZATION_OF_KURDISH.pdf
|
|
9
9
|
creation_date: 2007
|
|
10
10
|
confirmation_date: 2017-12
|
|
@@ -4,10 +4,10 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:mkd
|
|
5
5
|
source_script: Cyrl
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization for Macedonian (1981)
|
|
8
8
|
url: https://github.com/riboseinc/interscript/files/4247920/USBGN_romanization_Macedonian_1981.pdf
|
|
9
9
|
creation_date: 1981
|
|
10
|
-
description: BGN/PCGN Romanization table for
|
|
10
|
+
description: BGN/PCGN Romanization table for Macedonian.
|
|
11
11
|
|
|
12
12
|
notes:
|
|
13
13
|
- The character ѓ should be romanized g when it occurs before е and и. In other
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:mkd
|
|
5
5
|
source_script: Cyrl
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization for Macedonian (2013)
|
|
8
8
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/811514/ROMANIZATION_OF_MACEDONIAN.pdf
|
|
9
9
|
creation_date: 2013
|
|
10
10
|
description: |
|
|
@@ -4,10 +4,10 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:mon
|
|
5
5
|
source_script: Cyrl
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization of Mongolian (1964)
|
|
8
8
|
url: https://github.com/interscript/interscript/files/5180767/BGN_Romanization_Guide_1964_mongolian_1964.pdf
|
|
9
|
-
creation_date:
|
|
10
|
-
confirmation_date:
|
|
9
|
+
creation_date: 1964
|
|
10
|
+
confirmation_date: 1964
|
|
11
11
|
description: |
|
|
12
12
|
This system was originated by the PCGN in 1957 and adopted as a
|
|
13
13
|
BGN/PCGN System in 1964. It is intended for use in the romanization of
|
|
@@ -1,14 +1,14 @@
|
|
|
1
1
|
metadata {
|
|
2
2
|
authority_id: bgnpcgn
|
|
3
|
-
id:
|
|
3
|
+
id: 2011
|
|
4
4
|
language: iso-639-2:nep
|
|
5
5
|
source_script: Deva
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name: Nepali
|
|
7
|
+
name: Romanization for Nepali (2011 Agreement)
|
|
8
8
|
url: https://geonames.nga.mil/gns/html/Romanization/ROMANIZATION%20OF%20NEPALI.pdf
|
|
9
|
-
creation_date:
|
|
9
|
+
creation_date: 2011
|
|
10
|
+
confirmation_date: 2017
|
|
10
11
|
description: |
|
|
11
|
-
BGN/PCGN 2011 Agreement Romanization of Nepali
|
|
12
12
|
The BGN and the PCGN have adopted the Nepal Survey Department (NSD) system for the
|
|
13
13
|
romanization of Nepali names. This system, below, should be applied to Nepali names for which Roman‐
|
|
14
14
|
script spellings in materials produced by the government of Nepal are not available.
|
|
@@ -1,14 +1,14 @@
|
|
|
1
1
|
metadata {
|
|
2
2
|
authority_id: bgnpcgn
|
|
3
|
-
id:
|
|
3
|
+
id: 1958
|
|
4
4
|
language: iso-639-3:prs
|
|
5
5
|
# prs stands for Dari (https://iso639-3.sil.org/code/prs&_ga=GA1.2.2054538372.1574092823)
|
|
6
6
|
source_script: Arab
|
|
7
7
|
destination_script: Latn
|
|
8
|
-
name:
|
|
8
|
+
name: Transliteration System for Persian (1958)
|
|
9
9
|
url: https://github.com/interscript/interscript/files/5180821/BGN_Romanization_Guide_1964_persian_1958.pdf
|
|
10
10
|
creation_date: 1958
|
|
11
|
-
confirmation_date:
|
|
11
|
+
confirmation_date: 1958
|
|
12
12
|
description: |
|
|
13
13
|
The BGN/PCGN 1958 System for the Persian alphabet was
|
|
14
14
|
adopted by the BGN in 1946 and by the PCGN in 1958. It is
|
|
@@ -30,11 +30,11 @@ metadata {
|
|
|
30
30
|
Arabic in that the short vowel symbols necessary for the
|
|
31
31
|
proper rendering of short vowels, long vowels, and
|
|
32
32
|
diphthongs are almost always omitted from written Persian.
|
|
33
|
-
It follows that, in order to produce
|
|
33
|
+
It follows that, in order to produce transliterations in
|
|
34
34
|
terms of standard written Persian, the transliterator must
|
|
35
35
|
be able to identify the words used in names and must know
|
|
36
36
|
their standard written Persian spelling, their proper vowel
|
|
37
|
-
pointing, and how to eliminate
|
|
37
|
+
pointing, and how to eliminate peculiarities due to
|
|
38
38
|
dialectical variation.
|
|
39
39
|
The notes and special rules explain details of
|
|
40
40
|
transliteration not stated in the tables.
|
|
@@ -240,20 +240,20 @@ stage {
|
|
|
240
240
|
# '\uFE8E' : '' # ﺎ
|
|
241
241
|
|
|
242
242
|
# Sun letters
|
|
243
|
-
sub boundary + "\u0627\u0644\u062a", "at t" # الت
|
|
244
|
-
sub boundary + "\u0627\u0644\u062b", "as̄ s̄" # الث
|
|
245
|
-
sub boundary + "\u0627\u0644\u062f", "ad d" # الد
|
|
246
|
-
sub boundary + "\u0627\u0644\u0630", "az̄ z̄" # الذ
|
|
247
|
-
sub boundary + "\u0627\u0644\u0631", "ar r" # الر
|
|
248
|
-
sub boundary + "\u0627\u0644\u0632", "az z" # الز
|
|
249
|
-
sub boundary + "\u0627\u0644\u0633", "as s" # الس
|
|
250
|
-
sub boundary + "\u0627\u0644\u0634", "ash sh" # الش
|
|
251
|
-
sub boundary + "\u0627\u0644\u0635", "aş ş" # الص
|
|
252
|
-
sub boundary + "\u0627\u0644\u0636", "aẕ ẕ" # الض
|
|
253
|
-
sub boundary + "\u0627\u0644\u0637", "aţ ţ" # الط
|
|
254
|
-
sub boundary + "\u0627\u0644\u0638", "az̧ z̧" # الظ
|
|
255
|
-
sub boundary + "\u0627\u0644\u0644", "al l" # الل
|
|
256
|
-
sub boundary + "\u0627\u0644\u0646", "an n" # الن
|
|
243
|
+
sub boundary + "\u0627\u0644\u062a" + maybe("\u0651"), "at t" # الت
|
|
244
|
+
sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), "as̄ s̄" # الث
|
|
245
|
+
sub boundary + "\u0627\u0644\u062f" + maybe("\u0651"), "ad d" # الد
|
|
246
|
+
sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), "az̄ z̄" # الذ
|
|
247
|
+
sub boundary + "\u0627\u0644\u0631" + maybe("\u0651"), "ar r" # الر
|
|
248
|
+
sub boundary + "\u0627\u0644\u0632" + maybe("\u0651"), "az z" # الز
|
|
249
|
+
sub boundary + "\u0627\u0644\u0633" + maybe("\u0651"), "as s" # الس
|
|
250
|
+
sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "ash sh" # الش
|
|
251
|
+
sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "aş ş" # الص
|
|
252
|
+
sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "aẕ ẕ" # الض
|
|
253
|
+
sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "aţ ţ" # الط
|
|
254
|
+
sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), "az̧ z̧" # الظ
|
|
255
|
+
sub boundary + "\u0627\u0644\u0644" + maybe("\u0651"), "al l" # الل
|
|
256
|
+
sub boundary + "\u0627\u0644\u0646" + maybe("\u0651"), "an n" # الن
|
|
257
257
|
|
|
258
258
|
|
|
259
259
|
sub "\u0621", "’" # ء
|
|
@@ -5,7 +5,7 @@ metadata {
|
|
|
5
5
|
# prs stands for Dari (https://iso639-3.sil.org/code/prs&_ga=GA1.2.2054538372.1574092823)
|
|
6
6
|
source_script: Arab
|
|
7
7
|
destination_script: Latn
|
|
8
|
-
name:
|
|
8
|
+
name: National Romanization System for Afghanistan (2007)
|
|
9
9
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/693661/ROMANIZATION_FOR_AFGHANISTAN.pdf
|
|
10
10
|
creation_date: 2007
|
|
11
11
|
confirmation_date: 2017-11
|
|
@@ -461,20 +461,20 @@ stage {
|
|
|
461
461
|
# '\uFE8E' : '' # ﺎ
|
|
462
462
|
|
|
463
463
|
# Sun letters
|
|
464
|
-
sub boundary + "\u0627\u0644\u062a", "at t" # الت
|
|
465
|
-
sub boundary + "\u0627\u0644\u062b", "as̄ s̄" # الث
|
|
466
|
-
sub boundary + "\u0627\u0644\u062f", "ad d" # الد
|
|
467
|
-
sub boundary + "\u0627\u0644\u0630", "az̄ z̄" # الذ
|
|
468
|
-
sub boundary + "\u0627\u0644\u0631", "ar r" # الر
|
|
469
|
-
sub boundary + "\u0627\u0644\u0632", "az z" # الز
|
|
470
|
-
sub boundary + "\u0627\u0644\u0633", "as s" # الس
|
|
471
|
-
sub boundary + "\u0627\u0644\u0634", "ash sh" # الش
|
|
472
|
-
sub boundary + "\u0627\u0644\u0635", "aş ş" # الص
|
|
473
|
-
sub boundary + "\u0627\u0644\u0636", "aẕ ẕ" # الض
|
|
474
|
-
sub boundary + "\u0627\u0644\u0637", "aţ ţ" # الط
|
|
475
|
-
sub boundary + "\u0627\u0644\u0638", "az̧ z̧" # الظ
|
|
476
|
-
sub boundary + "\u0627\u0644\u0644", "al l" # الل
|
|
477
|
-
sub boundary + "\u0627\u0644\u0646", "an n" # الن
|
|
464
|
+
sub boundary + "\u0627\u0644\u062a" + maybe("\u0651"), "at t" # الت
|
|
465
|
+
sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), "as̄ s̄" # الث
|
|
466
|
+
sub boundary + "\u0627\u0644\u062f" + maybe("\u0651"), "ad d" # الد
|
|
467
|
+
sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), "az̄ z̄" # الذ
|
|
468
|
+
sub boundary + "\u0627\u0644\u0631" + maybe("\u0651"), "ar r" # الر
|
|
469
|
+
sub boundary + "\u0627\u0644\u0632" + maybe("\u0651"), "az z" # الز
|
|
470
|
+
sub boundary + "\u0627\u0644\u0633" + maybe("\u0651"), "as s" # الس
|
|
471
|
+
sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "ash sh" # الش
|
|
472
|
+
sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "aş ş" # الص
|
|
473
|
+
sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "aẕ ẕ" # الض
|
|
474
|
+
sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "aţ ţ" # الط
|
|
475
|
+
sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), "az̧ z̧" # الظ
|
|
476
|
+
sub boundary + "\u0627\u0644\u0644" + maybe("\u0651"), "al l" # الل
|
|
477
|
+
sub boundary + "\u0627\u0644\u0646" + maybe("\u0651"), "an n" # الن
|
|
478
478
|
|
|
479
479
|
|
|
480
480
|
# consonant characters
|
|
@@ -5,7 +5,7 @@ metadata {
|
|
|
5
5
|
# prs stands for Dari (https://iso639-3.sil.org/code/prs&_ga=GA1.2.2054538372.1574092823)
|
|
6
6
|
source_script: Arab
|
|
7
7
|
destination_script: Latn
|
|
8
|
-
name:
|
|
8
|
+
name: National Romanization System for Afghanistan -- Yaghoubi (2007)
|
|
9
9
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/693661/ROMANIZATION_FOR_AFGHANISTAN.pdf
|
|
10
10
|
creation_date: 2007
|
|
11
11
|
confirmation_date: 2017-11
|
|
@@ -379,20 +379,20 @@ stage {
|
|
|
379
379
|
|
|
380
380
|
|
|
381
381
|
# Sun letters
|
|
382
|
-
sub boundary + "\u0627\u0644\u062a", "at̄ t̄" # الت
|
|
383
|
-
sub boundary + "\u0627\u0644\u062b", "as̄ s̄" # الث
|
|
384
|
-
sub boundary + "\u0627\u0644\u062f", "aḏ ḏ" # الد
|
|
385
|
-
sub boundary + "\u0627\u0644\u0630", "az̄ z̄" # الذ
|
|
386
|
-
sub boundary + "\u0627\u0644\u0631", "aṟ ṟ" # الر
|
|
387
|
-
sub boundary + "\u0627\u0644\u0632", "az z" # الز
|
|
388
|
-
sub boundary + "\u0627\u0644\u0633", "as s" # الس
|
|
389
|
-
sub boundary + "\u0627\u0644\u0634", "aš š" # الش
|
|
390
|
-
sub boundary + "\u0627\u0644\u0635", "as̱ s̱" # الص
|
|
391
|
-
sub boundary + "\u0627\u0644\u0636", "ad͟z d͟z" # الض
|
|
392
|
-
sub boundary + "\u0627\u0644\u0637", "aṯ ṯ" # الط
|
|
393
|
-
sub boundary + "\u0627\u0644\u0638", "aẕ ẕ" # الظ
|
|
394
|
-
sub boundary + "\u0627\u0644\u0644", "al l" # الل
|
|
395
|
-
sub boundary + "\u0627\u0644\u0646", "an n" # الن
|
|
382
|
+
sub boundary + "\u0627\u0644\u062a" + maybe("\u0651"), "at̄ t̄" # الت
|
|
383
|
+
sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), "as̄ s̄" # الث
|
|
384
|
+
sub boundary + "\u0627\u0644\u062f" + maybe("\u0651"), "aḏ ḏ" # الد
|
|
385
|
+
sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), "az̄ z̄" # الذ
|
|
386
|
+
sub boundary + "\u0627\u0644\u0631" + maybe("\u0651"), "aṟ ṟ" # الر
|
|
387
|
+
sub boundary + "\u0627\u0644\u0632" + maybe("\u0651"), "az z" # الز
|
|
388
|
+
sub boundary + "\u0627\u0644\u0633" + maybe("\u0651"), "as s" # الس
|
|
389
|
+
sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "aš š" # الش
|
|
390
|
+
sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "as̱ s̱" # الص
|
|
391
|
+
sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "ad͟z d͟z" # الض
|
|
392
|
+
sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "aṯ ṯ" # الط
|
|
393
|
+
sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), "aẕ ẕ" # الظ
|
|
394
|
+
sub boundary + "\u0627\u0644\u0644" + maybe("\u0651"), "al l" # الل
|
|
395
|
+
sub boundary + "\u0627\u0644\u0646" + maybe("\u0651"), "an n" # الن
|
|
396
396
|
|
|
397
397
|
# consonant characters
|
|
398
398
|
|
|
@@ -1,10 +1,10 @@
|
|
|
1
1
|
metadata {
|
|
2
2
|
authority_id: bgnpcgn
|
|
3
|
-
id:
|
|
3
|
+
id: 1968
|
|
4
4
|
language: iso-639-3:prs
|
|
5
5
|
source_script: Arab
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization of Pashto (1968)
|
|
8
8
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/693760/ROMANIZATION_OF_PASHTO.pdf
|
|
9
9
|
creation_date: 1968
|
|
10
10
|
confirmation_date: 2017-11
|
|
@@ -248,20 +248,20 @@ stage {
|
|
|
248
248
|
sub "\u0659", "ê"
|
|
249
249
|
|
|
250
250
|
# Sun letters
|
|
251
|
-
sub boundary + "\u0627\u0644\u062a", "ut t" # الت
|
|
252
|
-
sub boundary + "\u0627\u0644\u062b", "us̄ s̄" # الث
|
|
253
|
-
sub boundary + "\u0627\u0644\u062f", "ud d" # الد
|
|
254
|
-
sub boundary + "\u0627\u0644\u0630", "uz̄ z̄" # الذ
|
|
255
|
-
sub boundary + "\u0627\u0644\u0631", "ur r" # الر
|
|
256
|
-
sub boundary + "\u0627\u0644\u0632", "uz z" # الز
|
|
257
|
-
sub boundary + "\u0627\u0644\u0633", "us s" # الس
|
|
258
|
-
sub boundary + "\u0627\u0644\u0634", "ush sh" # الش
|
|
259
|
-
sub boundary + "\u0627\u0644\u0635", "uş ş" # الص
|
|
260
|
-
sub boundary + "\u0627\u0644\u0636", "uẕ ẕ" # الض
|
|
261
|
-
sub boundary + "\u0627\u0644\u0637", "uţ ţ" # الط
|
|
262
|
-
sub boundary + "\u0627\u0644\u0638", "uz̧ z̧" # الظ
|
|
263
|
-
sub boundary + "\u0627\u0644\u0644", "ul l" # الل
|
|
264
|
-
sub boundary + "\u0627\u0644\u0646", "un n" # الن
|
|
251
|
+
sub boundary + "\u0627\u0644\u062a" + maybe("\u0651"), "ut t" # الت
|
|
252
|
+
sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), "us̄ s̄" # الث
|
|
253
|
+
sub boundary + "\u0627\u0644\u062f" + maybe("\u0651"), "ud d" # الد
|
|
254
|
+
sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), "uz̄ z̄" # الذ
|
|
255
|
+
sub boundary + "\u0627\u0644\u0631" + maybe("\u0651"), "ur r" # الر
|
|
256
|
+
sub boundary + "\u0627\u0644\u0632" + maybe("\u0651"), "uz z" # الز
|
|
257
|
+
sub boundary + "\u0627\u0644\u0633" + maybe("\u0651"), "us s" # الس
|
|
258
|
+
sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "ush sh" # الش
|
|
259
|
+
sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "uş ş" # الص
|
|
260
|
+
sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "uẕ ẕ" # الض
|
|
261
|
+
sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "uţ ţ" # الط
|
|
262
|
+
sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), "uz̧ z̧" # الظ
|
|
263
|
+
sub boundary + "\u0627\u0644\u0644" + maybe("\u0651"), "ul l" # الل
|
|
264
|
+
sub boundary + "\u0627\u0644\u0646" + maybe("\u0651"), "un n" # الن
|
|
265
265
|
|
|
266
266
|
sub "\u0626", "êy" # ئ
|
|
267
267
|
}
|