interscript-maps 2.2.0 → 2.2.1
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/interscript-maps.gemspec +1 -1
- data/interscript-maps.yaml +300 -111
- data/maps/acadsin-zho-Hani-Latn-2002.imp +2 -2
- data/maps/alalc-amh-Ethi-Latn-1997.imp +18 -14
- data/maps/alalc-amh-Ethi-Latn-2011.imp +1 -1
- data/maps/alalc-ara-Arab-Latn-1997.imp +1 -1
- data/maps/alalc-asm-Deva-Latn-1997.imp +1 -1
- data/maps/alalc-asm-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-aze-Arab-Latn-1997.imp +1 -1
- data/maps/alalc-aze-Cyrl-Latn-1997.imp +1 -1
- data/maps/alalc-bel-Cyrl-Latn-1997.imp +4 -4
- data/maps/alalc-ben-Beng-Latn-1997.imp +1 -1
- data/maps/alalc-ben-Beng-Latn-2017.imp +1 -1
- data/maps/alalc-bul-Cyrl-Latn-1997.imp +1 -1
- data/maps/alalc-div-Thaa-Latn-1997.imp +1 -1
- data/maps/alalc-ell-Grek-Latn-1997.imp +1 -1
- data/maps/alalc-ell-Grek-Latn-2010.imp +1 -1
- data/maps/alalc-guj-Gujr-Latn-1997.imp +1 -1
- data/maps/alalc-guj-Gujr-Latn-2011.imp +1 -1
- data/maps/alalc-hin-Deva-Latn-1997.imp +1 -1
- data/maps/alalc-hin-Deva-Latn-2011.imp +1 -1
- data/maps/alalc-kan-Kana-Latn-1997.imp +1 -1
- data/maps/alalc-kan-Kana-Latn-2011.imp +1 -1
- data/maps/alalc-kat-Geok-Latn-1997.imp +3 -3
- data/maps/alalc-kat-Geor-Latn-1997.imp +12 -12
- data/maps/alalc-kor-Hang-Latn-1997.imp +1 -1
- data/maps/alalc-mal-Mlym-Latn-1997.imp +1 -1
- data/maps/alalc-mar-Deva-Latn-1997.imp +1 -1
- data/maps/alalc-mar-Deva-Latn-2011.imp +1 -1
- data/maps/alalc-mkd-Cyrl-Latn-1997.imp +2 -2
- data/maps/alalc-mkd-Cyrl-Latn-2013.imp +2 -2
- data/maps/alalc-mon-Cyrl-Latn-1997.imp +3 -3
- data/maps/alalc-ori-Orya-Latn-1997.imp +1 -1
- data/maps/alalc-ori-Orya-Latn-2011.imp +1 -1
- data/maps/alalc-pan-Guru-Latn-1997.imp +1 -1
- data/maps/alalc-pan-Guru-Latn-2011.imp +1 -1
- data/maps/alalc-per-Arab-Latn-1997.imp +1 -1
- data/maps/alalc-pli-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-pra-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-rus-Cyrl-Latn-1997.imp +2 -2
- data/maps/alalc-rus-Cyrl-Latn-2012.imp +1 -1
- data/maps/alalc-san-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-sin-Sinh-Latn-1997.imp +1 -1
- data/maps/alalc-sin-Sinh-Latn-2011.imp +1 -1
- data/maps/alalc-srp-Cyrl-Latn-1997.imp +2 -2
- data/maps/alalc-srp-Cyrl-Latn-2013.imp +1 -1
- data/maps/alalc-tam-Taml-Latn-1997.imp +1 -1
- data/maps/alalc-tam-Taml-Latn-2011.imp +1 -1
- data/maps/alalc-tel-Telu-Latn-1997.imp +2 -2
- data/maps/alalc-tel-Telu-Latn-2011.imp +1 -1
- data/maps/alalc-tir-Ethi-Latn-1997.imp +429 -0
- data/maps/alalc-tir-Ethi-Latn-2011.imp +85 -0
- data/maps/alalc-ukr-Cyrl-Latn-1997.imp +1 -1
- data/maps/alalc-ukr-Cyrl-Latn-2011.imp +1 -1
- data/maps/apcbg-bul-Cyrl-Latn-1995.imp +7 -4
- data/maps/az-aze-Cyrl-Latn-1939.imp +1 -0
- data/maps/az-aze-Cyrl-Latn-1958.imp +1 -0
- data/maps/bgn-jpn-Hrkt-Latn-1962.imp +5 -5
- data/maps/bgn-kor-Hang-Latn-1943.imp +1 -1
- data/maps/bgn-kor-Kore-Latn-1943.imp +1 -1
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +11 -11
- data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +1 -1
- data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +2 -2
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +2 -2
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +10 -4
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +1 -1
- data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +1 -1
- data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +4 -4
- data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +1 -1
- data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +1 -1
- data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +1 -1
- data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +4 -3
- data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +1 -1
- data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +1 -1
- data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +2 -2
- data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +1 -1
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +1 -1
- data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +8 -8
- data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +2 -2
- data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +4 -4
- data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +3 -3
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +1 -1
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +4 -4
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +4 -3
- data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +1 -1
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +2 -2
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +1 -1
- data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +3 -3
- data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +4 -4
- data/maps/bgnpcgn-per-Arab-Latn-1958.imp +19 -19
- data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +15 -15
- data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +15 -15
- data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +16 -16
- data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +2 -2
- data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +5 -5
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +1 -1
- data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +1 -1
- data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +5 -3
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +1 -1
- data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +1 -1
- data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +1 -1
- data/maps/bgnpcgn-tir-Ethi-Latn-2007.imp +511 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +1 -1
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +1 -1
- data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +15 -15
- data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +3 -3
- data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +1 -1
- data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +1 -1
- data/maps/by-bel-Cyrl-Latn-2007.imp +7 -5
- data/maps/dos-nep-Deva-Latn-1997.imp +2 -2
- data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +1 -1
- data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +1 -1
- data/maps/ggg-kat-Geor-Latn-2002.imp +3 -3
- data/maps/gki-bel-Cyrl-Latn-2000.imp +1 -1
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +1 -1
- data/maps/iso-ara-Arab-Latn-233-1984.imp +14 -14
- data/maps/iso-ben-Beng-Latn-15919-2001.imp +1 -1
- data/maps/iso-prs-Arab-Latn-233-3-1999.imp +14 -14
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +5 -5
- data/maps/mext-jpn-Hrkt-Latn-1954.imp +2 -1
- data/maps/moct-kor-Hang-Latn-2000.imp +1 -1
- data/maps/mofa-jpn-Hrkt-Latn-1989.imp +1 -1
- data/maps/mv-div-Thaa-Latn-1987.imp +1 -1
- data/maps/mvd-bel-Cyrl-Latn-2008.imp +5 -5
- data/maps/mvd-bel-Cyrl-Latn-2010.imp +2 -5
- data/maps/mvd-rus-Cyrl-Latn-2008.imp +4 -3
- data/maps/mvd-rus-Cyrl-Latn-2010.imp +2 -5
- data/maps/odni-ara-Arab-Latn-2004.imp +1 -1
- data/maps/odni-ara-Arab-Latn-2015.imp +1 -1
- data/maps/odni-aze-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-bel-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-bul-Cyrl-Latn-2005.imp +2 -2
- data/maps/odni-bul-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-che-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-fas-Arab-Latn-2004.imp +14 -14
- data/maps/odni-fas-Arab-Latn-2015.imp +15 -15
- data/maps/odni-hin-Deva-Latn-2004.imp +20 -20
- data/maps/odni-hin-Deva-Latn-2015.imp +25 -26
- data/maps/odni-kat-Geor-Latn-2015.imp +2 -3
- data/maps/odni-kaz-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-kir-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-kor-Hang-Latn-2015.imp +1 -1
- data/maps/odni-mkd-Cyrl-Latn-2005.imp +1 -1
- data/maps/odni-mkd-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-prs-Arab-Latn-2015.imp +1 -1
- data/maps/odni-pus-Arab-Latn-2011.imp +1 -1
- data/maps/odni-rus-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-srp-Cyrl-Latn-2005.imp +2 -2
- data/maps/odni-srp-Cyrl-Latn-2015.imp +8 -8
- data/maps/odni-tat-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-tgk-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-tuk-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-uig-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-ukr-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-urd-Arab-Latn-2015.imp +21 -21
- data/maps/odni-uzb-Cyrl-Latn-2015.imp +1 -1
- data/maps/ses-ara-Arab-Latn-1930.imp +14 -14
- data/maps/un-amh-Ethi-Latn-2016.imp +1 -1
- data/maps/un-ara-Arab-Latn-1971.imp +5 -5
- data/maps/un-ara-Arab-Latn-1972.imp +4 -4
- data/maps/un-ara-Arab-Latn-2017.imp +15 -15
- data/maps/un-asm-Beng-Latn-1972.imp +1 -1
- data/maps/un-bel-Cyrl-Latn-2007.imp +2 -2
- data/maps/un-ben-Beng-Latn-2016.imp +1 -1
- data/maps/un-bul-Cyrl-Latn-1977.imp +197 -0
- data/maps/un-ell-Grek-Latn-1987-phonetic.imp +5 -1
- data/maps/un-ell-Grek-Latn-1987-tl.imp +1 -1
- data/maps/un-ell-Grek-Latn-1987-ts.imp +2 -2
- data/maps/un-guj-Gujr-Latn-1972.imp +1 -1
- data/maps/un-hin-Deva-Latn-2016.imp +1 -1
- data/maps/un-kan-Kana-Latn-2016.imp +1 -1
- data/maps/un-mal-Mlym-Latn-1972.imp +1 -1
- data/maps/un-mar-Deva-Latn-2016.imp +1 -1
- data/maps/un-mkd-Cyrl-Latn-1977.imp +119 -0
- data/maps/un-mon-Mong-Latn-general-2013.imp +1 -1
- data/maps/un-mon-Mong-Latn-phonetic-2013.imp +1 -1
- data/maps/un-nep-Deva-Latn-1972.imp +1 -1
- data/maps/un-nep-Deva-Latn-2013.imp +1 -1
- data/maps/un-ori-Orya-Latn-1972.imp +1 -1
- data/maps/un-pan-Guru-Latn-1972.imp +1 -1
- data/maps/un-prs-Arab-Latn-1967.imp +15 -15
- data/maps/un-rus-Cyrl-Latn-1987.imp +1 -1
- data/maps/un-sin-Sinh-Latn-1972.imp +1 -1
- data/maps/un-srp-Cyrl-Latn-1997.imp +47 -0
- data/maps/un-tam-Taml-Latn-1972.imp +1 -1
- data/maps/un-tel-Telu-Latn-1972.imp +1 -1
- data/maps/un-ukr-Cyrl-Latn-1998.imp +1 -1
- data/maps/un-ukr-Cyrl-Latn-2012.imp +1 -1
- data/maps/un-urd-Arab-Latn-1972.imp +15 -15
- data/maps/var-amh-Ethi-Latn-eae-2003.imp +48 -43
- metadata +7 -1
@@ -4,14 +4,14 @@ metadata {
|
|
4
4
|
language: iso-639-2:isl
|
5
5
|
source_script: Latn
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Transliteration of Icelandic (1947)
|
8
8
|
url: https://github.com/interscript/interscript/files/5180785/BGN_Romanization_Guide_1964_icelandic_1947.pdf
|
9
9
|
creation_date: 1964
|
10
10
|
description: |
|
11
11
|
The BGN and the PCGN in 1947 jointly agreed to the transliteration of two letters of the Icelandic alphabet which,
|
12
12
|
although used in writing Old English, have disappeared from the modern English alphabet.
|
13
13
|
|
14
|
-
The transliterated letters are the edh (Ð ð) and the thorn (Þ þ),
|
14
|
+
The transliterated letters are the edh (Ð ð) and the thorn (Þ þ), pronounced as th in "thus" and th in "think," respectively.
|
15
15
|
|
16
16
|
It was felt that it was better to transliterate these letters into familiar symbols than preserve such unfamiliar letters in the nomenclature.
|
17
17
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:isl
|
5
5
|
source_script: Latn
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Roman-Script Spelling Convention of Icelandic (1968 Agreement)
|
8
8
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/693794/ROMAN-SCRIPT_SPELLING_CONVENTIONS.pdf
|
9
9
|
creation_date: 1968
|
10
10
|
|
@@ -4,13 +4,13 @@ metadata {
|
|
4
4
|
language: iso-639-2:kat
|
5
5
|
source_script: Geor
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Georgian (1981)
|
8
8
|
url: https://transliteration.eki.ee/pdf/Georgian.pdf
|
9
9
|
creation_date: 1981
|
10
10
|
confirmation_date: 1981
|
11
11
|
description: |
|
12
12
|
BGN/PCGN system of 1981.
|
13
|
-
|
13
|
+
|
14
14
|
notes:
|
15
15
|
}
|
16
16
|
|
@@ -75,18 +75,18 @@ stage {
|
|
75
75
|
sub "\u10d4", "e" # ე
|
76
76
|
sub "\u10d5", "v" # ვ
|
77
77
|
sub "\u10d6", "z" # ზ
|
78
|
-
|
78
|
+
|
79
79
|
sub "\u10f1", "ey" # ჱ
|
80
|
-
|
80
|
+
|
81
81
|
sub "\u10d7", "t’" # თ
|
82
82
|
sub "\u10d8", "i" # ი
|
83
83
|
sub "\u10d9", "k’" # კ
|
84
84
|
sub "\u10da", "l" # ლ
|
85
85
|
sub "\u10db", "m" # მ
|
86
86
|
sub "\u10dc", "n" # ნ
|
87
|
-
|
87
|
+
|
88
88
|
sub "\u10f2", "j" # ჲ
|
89
|
-
|
89
|
+
|
90
90
|
sub "\u10dd", "o" # ო
|
91
91
|
sub "\u10de", "p" # პ
|
92
92
|
sub "\u10df", "zh" # ჟ
|
@@ -105,9 +105,9 @@ stage {
|
|
105
105
|
sub "\u10ec", "ts" # წ
|
106
106
|
sub "\u10ed", "ch" # ჭ
|
107
107
|
sub "\u10ee", "kh" # ხ
|
108
|
-
|
108
|
+
|
109
109
|
sub "\u10f4", "q’" # ჴ
|
110
|
-
|
110
|
+
|
111
111
|
sub "\u10ef", "j" # ჯ
|
112
112
|
sub "\u10f0", "h" # ჰ
|
113
113
|
}
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:kat
|
5
5
|
source_script: Geor
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Georgian (2009 Agreement, Georgia 2011 national system)
|
8
8
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/810202/ROMANIZATION_OF_GEORGIAN.pdf
|
9
9
|
creation_date: 2009
|
10
10
|
confirmation_date: 2011
|
@@ -16,7 +16,7 @@ metadata {
|
|
16
16
|
the Mkhedruli alphabet, as presently used in Georgia. This system was
|
17
17
|
adopted by BGN and PCGN in 2009, superseding the BGN/PCGN system of
|
18
18
|
1981.
|
19
|
-
|
19
|
+
|
20
20
|
notes:
|
21
21
|
- This system denotes ejective (glottalised) consonants by means of
|
22
22
|
an apostrophe. The BGN/PCGN 1981 system instead used the apostrophe to
|
@@ -1,18 +1,18 @@
|
|
1
1
|
metadata {
|
2
|
-
|
2
|
+
|
3
3
|
authority_id: bgnpcgn
|
4
4
|
id: 1979
|
5
5
|
language: iso-639-2:kaz
|
6
6
|
source_script: Cyrl
|
7
7
|
destination_script: Latn
|
8
|
-
name: Romanization of Kazakh
|
8
|
+
name: Romanization of Kazakh (1979)
|
9
9
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/811511/ROMANIZATION_OF_KAZAKH.pdf
|
10
10
|
creation_date: 1979
|
11
11
|
confirmation_date: 2019
|
12
12
|
description: |
|
13
13
|
The BGN/PCGN system for Kazakh was designed for use in romanizing names written in the Kazakh Cyrillic alphabet.
|
14
14
|
The Kazakh Cyrillic alphabet contains nine characters not present in the Russian alphabet: ә, ғ, қ, ң, ө, ұ, ү, һ and і.
|
15
|
-
|
15
|
+
|
16
16
|
notes:
|
17
17
|
- The character sequences гһ, зһ, кһ, нг, сһ and цһ may be romanized g·h, z·h, k·h, n·g, s·h
|
18
18
|
and ts·h in order to differentiate those romanizations from the digraphs gh, zh, kh, ng, sh,
|
@@ -144,7 +144,7 @@ stage {
|
|
144
144
|
sub "\u042D", "Ė" # Э
|
145
145
|
sub "\u042E", "Yu" # Ю
|
146
146
|
sub "\u042F", "Ya" # Я
|
147
|
-
|
147
|
+
|
148
148
|
sub "\u0430", "a" # а
|
149
149
|
sub "\u04D9", "ä" # ә
|
150
150
|
sub "\u0431", "b" # б
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:kir
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name: Romanization of Kyrgyz
|
7
|
+
name: Romanization of Kyrgyz (1979)
|
8
8
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/816663/ROMANIZATION_OF_KYRGYZ.pdf
|
9
9
|
creation_date: 1979
|
10
10
|
confirmation_date: 2019
|
@@ -12,7 +12,7 @@ metadata {
|
|
12
12
|
The BGN/PCGN system for Kyrgyz Cyrillic was designed for use in romanizing names written
|
13
13
|
in the Kyrgyz Cyrillic alphabet. The Kyrgyz Cyrillic alphabet contains three characters not present in
|
14
14
|
the Russian alphabet: Ң, Ө, and Ү.
|
15
|
-
|
15
|
+
|
16
16
|
notes:
|
17
17
|
- Both Kyrgyz and Kirghiz may frequently be seen as the language name; both these spellings are used in the
|
18
18
|
ISO 639 Standard on the representation of names for languages.
|
@@ -127,7 +127,7 @@ stage {
|
|
127
127
|
sub "\u042D", "E" # Э
|
128
128
|
sub "\u042E", "Yu" # Ю
|
129
129
|
sub "\u042F", "Ya" # Я
|
130
|
-
|
130
|
+
|
131
131
|
sub "\u0430", "a" # а
|
132
132
|
sub "\u0431", "b" # б
|
133
133
|
sub "\u0432", "v" # в
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:kor
|
5
5
|
source_script: Hang
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Korean -- For DPRK (Hangul to Latin) (1945 Agreement)
|
8
8
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/693725/ROMANIZATION_OF_KOREAN-_MR_for_DPRK.pdf
|
9
9
|
creation_date: 1945
|
10
10
|
adoption_date:
|
@@ -4,10 +4,10 @@ metadata {
|
|
4
4
|
language: iso-639-2:kor
|
5
5
|
source_script: Hang
|
6
6
|
destination_script: Latn
|
7
|
-
name: Ministry of Culture and Tourism System (2000)
|
8
|
-
url:
|
9
|
-
creation_date:
|
10
|
-
adoption_date:
|
7
|
+
name: Romanization of Korean -- For the ROK (2011 Agreement, Ministry of Culture and Tourism System (2000))
|
8
|
+
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/693724/ROMANIZATION_OF_KOREAN-__MOCT_for_ROK.pdf
|
9
|
+
creation_date: 2011
|
10
|
+
adoption_date: 2011
|
11
11
|
description:
|
12
12
|
|
13
13
|
notes:
|
@@ -4,10 +4,11 @@ metadata {
|
|
4
4
|
language: iso-639-2:kor
|
5
5
|
source_script: Kore
|
6
6
|
destination_script: Latn
|
7
|
-
name: Ministry of Culture and Tourism System (2000)
|
7
|
+
name: Romanization of Korean -- For the ROK -- Korean to Latin (2011 Agreement, Ministry of Culture and Tourism System (2000))
|
8
|
+
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/693724/ROMANIZATION_OF_KOREAN-__MOCT_for_ROK.pdf
|
8
9
|
url: ""
|
9
|
-
creation_date:
|
10
|
-
adoption_date:
|
10
|
+
creation_date: 2011
|
11
|
+
adoption_date: 2011
|
11
12
|
description: |
|
12
13
|
Establishes a system for the transliteration of the characters of Korean script into Latin characters.
|
13
14
|
Intended to provide a means for international communication of written documents.
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: kur
|
5
5
|
source_script: Arab
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Kurdish (2007)
|
8
8
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/693727/ROMANIZATION_OF_KURDISH.pdf
|
9
9
|
creation_date: 2007
|
10
10
|
confirmation_date: 2017-12
|
@@ -4,10 +4,10 @@ metadata {
|
|
4
4
|
language: iso-639-2:mkd
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization for Macedonian (1981)
|
8
8
|
url: https://github.com/riboseinc/interscript/files/4247920/USBGN_romanization_Macedonian_1981.pdf
|
9
9
|
creation_date: 1981
|
10
|
-
description: BGN/PCGN Romanization table for
|
10
|
+
description: BGN/PCGN Romanization table for Macedonian.
|
11
11
|
|
12
12
|
notes:
|
13
13
|
- The character ѓ should be romanized g when it occurs before е and и. In other
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:mkd
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization for Macedonian (2013)
|
8
8
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/811514/ROMANIZATION_OF_MACEDONIAN.pdf
|
9
9
|
creation_date: 2013
|
10
10
|
description: |
|
@@ -4,10 +4,10 @@ metadata {
|
|
4
4
|
language: iso-639-2:mon
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Mongolian (1964)
|
8
8
|
url: https://github.com/interscript/interscript/files/5180767/BGN_Romanization_Guide_1964_mongolian_1964.pdf
|
9
|
-
creation_date:
|
10
|
-
confirmation_date:
|
9
|
+
creation_date: 1964
|
10
|
+
confirmation_date: 1964
|
11
11
|
description: |
|
12
12
|
This system was originated by the PCGN in 1957 and adopted as a
|
13
13
|
BGN/PCGN System in 1964. It is intended for use in the romanization of
|
@@ -1,14 +1,14 @@
|
|
1
1
|
metadata {
|
2
2
|
authority_id: bgnpcgn
|
3
|
-
id:
|
3
|
+
id: 2011
|
4
4
|
language: iso-639-2:nep
|
5
5
|
source_script: Deva
|
6
6
|
destination_script: Latn
|
7
|
-
name: Nepali
|
7
|
+
name: Romanization for Nepali (2011 Agreement)
|
8
8
|
url: https://geonames.nga.mil/gns/html/Romanization/ROMANIZATION%20OF%20NEPALI.pdf
|
9
|
-
creation_date:
|
9
|
+
creation_date: 2011
|
10
|
+
confirmation_date: 2017
|
10
11
|
description: |
|
11
|
-
BGN/PCGN 2011 Agreement Romanization of Nepali
|
12
12
|
The BGN and the PCGN have adopted the Nepal Survey Department (NSD) system for the
|
13
13
|
romanization of Nepali names. This system, below, should be applied to Nepali names for which Roman‐
|
14
14
|
script spellings in materials produced by the government of Nepal are not available.
|
@@ -1,14 +1,14 @@
|
|
1
1
|
metadata {
|
2
2
|
authority_id: bgnpcgn
|
3
|
-
id:
|
3
|
+
id: 1958
|
4
4
|
language: iso-639-3:prs
|
5
5
|
# prs stands for Dari (https://iso639-3.sil.org/code/prs&_ga=GA1.2.2054538372.1574092823)
|
6
6
|
source_script: Arab
|
7
7
|
destination_script: Latn
|
8
|
-
name:
|
8
|
+
name: Transliteration System for Persian (1958)
|
9
9
|
url: https://github.com/interscript/interscript/files/5180821/BGN_Romanization_Guide_1964_persian_1958.pdf
|
10
10
|
creation_date: 1958
|
11
|
-
confirmation_date:
|
11
|
+
confirmation_date: 1958
|
12
12
|
description: |
|
13
13
|
The BGN/PCGN 1958 System for the Persian alphabet was
|
14
14
|
adopted by the BGN in 1946 and by the PCGN in 1958. It is
|
@@ -30,11 +30,11 @@ metadata {
|
|
30
30
|
Arabic in that the short vowel symbols necessary for the
|
31
31
|
proper rendering of short vowels, long vowels, and
|
32
32
|
diphthongs are almost always omitted from written Persian.
|
33
|
-
It follows that, in order to produce
|
33
|
+
It follows that, in order to produce transliterations in
|
34
34
|
terms of standard written Persian, the transliterator must
|
35
35
|
be able to identify the words used in names and must know
|
36
36
|
their standard written Persian spelling, their proper vowel
|
37
|
-
pointing, and how to eliminate
|
37
|
+
pointing, and how to eliminate peculiarities due to
|
38
38
|
dialectical variation.
|
39
39
|
The notes and special rules explain details of
|
40
40
|
transliteration not stated in the tables.
|
@@ -240,20 +240,20 @@ stage {
|
|
240
240
|
# '\uFE8E' : '' # ﺎ
|
241
241
|
|
242
242
|
# Sun letters
|
243
|
-
sub boundary + "\u0627\u0644\u062a", "at t" # الت
|
244
|
-
sub boundary + "\u0627\u0644\u062b", "as̄ s̄" # الث
|
245
|
-
sub boundary + "\u0627\u0644\u062f", "ad d" # الد
|
246
|
-
sub boundary + "\u0627\u0644\u0630", "az̄ z̄" # الذ
|
247
|
-
sub boundary + "\u0627\u0644\u0631", "ar r" # الر
|
248
|
-
sub boundary + "\u0627\u0644\u0632", "az z" # الز
|
249
|
-
sub boundary + "\u0627\u0644\u0633", "as s" # الس
|
250
|
-
sub boundary + "\u0627\u0644\u0634", "ash sh" # الش
|
251
|
-
sub boundary + "\u0627\u0644\u0635", "aş ş" # الص
|
252
|
-
sub boundary + "\u0627\u0644\u0636", "aẕ ẕ" # الض
|
253
|
-
sub boundary + "\u0627\u0644\u0637", "aţ ţ" # الط
|
254
|
-
sub boundary + "\u0627\u0644\u0638", "az̧ z̧" # الظ
|
255
|
-
sub boundary + "\u0627\u0644\u0644", "al l" # الل
|
256
|
-
sub boundary + "\u0627\u0644\u0646", "an n" # الن
|
243
|
+
sub boundary + "\u0627\u0644\u062a" + maybe("\u0651"), "at t" # الت
|
244
|
+
sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), "as̄ s̄" # الث
|
245
|
+
sub boundary + "\u0627\u0644\u062f" + maybe("\u0651"), "ad d" # الد
|
246
|
+
sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), "az̄ z̄" # الذ
|
247
|
+
sub boundary + "\u0627\u0644\u0631" + maybe("\u0651"), "ar r" # الر
|
248
|
+
sub boundary + "\u0627\u0644\u0632" + maybe("\u0651"), "az z" # الز
|
249
|
+
sub boundary + "\u0627\u0644\u0633" + maybe("\u0651"), "as s" # الس
|
250
|
+
sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "ash sh" # الش
|
251
|
+
sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "aş ş" # الص
|
252
|
+
sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "aẕ ẕ" # الض
|
253
|
+
sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "aţ ţ" # الط
|
254
|
+
sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), "az̧ z̧" # الظ
|
255
|
+
sub boundary + "\u0627\u0644\u0644" + maybe("\u0651"), "al l" # الل
|
256
|
+
sub boundary + "\u0627\u0644\u0646" + maybe("\u0651"), "an n" # الن
|
257
257
|
|
258
258
|
|
259
259
|
sub "\u0621", "’" # ء
|
@@ -5,7 +5,7 @@ metadata {
|
|
5
5
|
# prs stands for Dari (https://iso639-3.sil.org/code/prs&_ga=GA1.2.2054538372.1574092823)
|
6
6
|
source_script: Arab
|
7
7
|
destination_script: Latn
|
8
|
-
name:
|
8
|
+
name: National Romanization System for Afghanistan (2007)
|
9
9
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/693661/ROMANIZATION_FOR_AFGHANISTAN.pdf
|
10
10
|
creation_date: 2007
|
11
11
|
confirmation_date: 2017-11
|
@@ -461,20 +461,20 @@ stage {
|
|
461
461
|
# '\uFE8E' : '' # ﺎ
|
462
462
|
|
463
463
|
# Sun letters
|
464
|
-
sub boundary + "\u0627\u0644\u062a", "at t" # الت
|
465
|
-
sub boundary + "\u0627\u0644\u062b", "as̄ s̄" # الث
|
466
|
-
sub boundary + "\u0627\u0644\u062f", "ad d" # الد
|
467
|
-
sub boundary + "\u0627\u0644\u0630", "az̄ z̄" # الذ
|
468
|
-
sub boundary + "\u0627\u0644\u0631", "ar r" # الر
|
469
|
-
sub boundary + "\u0627\u0644\u0632", "az z" # الز
|
470
|
-
sub boundary + "\u0627\u0644\u0633", "as s" # الس
|
471
|
-
sub boundary + "\u0627\u0644\u0634", "ash sh" # الش
|
472
|
-
sub boundary + "\u0627\u0644\u0635", "aş ş" # الص
|
473
|
-
sub boundary + "\u0627\u0644\u0636", "aẕ ẕ" # الض
|
474
|
-
sub boundary + "\u0627\u0644\u0637", "aţ ţ" # الط
|
475
|
-
sub boundary + "\u0627\u0644\u0638", "az̧ z̧" # الظ
|
476
|
-
sub boundary + "\u0627\u0644\u0644", "al l" # الل
|
477
|
-
sub boundary + "\u0627\u0644\u0646", "an n" # الن
|
464
|
+
sub boundary + "\u0627\u0644\u062a" + maybe("\u0651"), "at t" # الت
|
465
|
+
sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), "as̄ s̄" # الث
|
466
|
+
sub boundary + "\u0627\u0644\u062f" + maybe("\u0651"), "ad d" # الد
|
467
|
+
sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), "az̄ z̄" # الذ
|
468
|
+
sub boundary + "\u0627\u0644\u0631" + maybe("\u0651"), "ar r" # الر
|
469
|
+
sub boundary + "\u0627\u0644\u0632" + maybe("\u0651"), "az z" # الز
|
470
|
+
sub boundary + "\u0627\u0644\u0633" + maybe("\u0651"), "as s" # الس
|
471
|
+
sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "ash sh" # الش
|
472
|
+
sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "aş ş" # الص
|
473
|
+
sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "aẕ ẕ" # الض
|
474
|
+
sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "aţ ţ" # الط
|
475
|
+
sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), "az̧ z̧" # الظ
|
476
|
+
sub boundary + "\u0627\u0644\u0644" + maybe("\u0651"), "al l" # الل
|
477
|
+
sub boundary + "\u0627\u0644\u0646" + maybe("\u0651"), "an n" # الن
|
478
478
|
|
479
479
|
|
480
480
|
# consonant characters
|
@@ -5,7 +5,7 @@ metadata {
|
|
5
5
|
# prs stands for Dari (https://iso639-3.sil.org/code/prs&_ga=GA1.2.2054538372.1574092823)
|
6
6
|
source_script: Arab
|
7
7
|
destination_script: Latn
|
8
|
-
name:
|
8
|
+
name: National Romanization System for Afghanistan -- Yaghoubi (2007)
|
9
9
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/693661/ROMANIZATION_FOR_AFGHANISTAN.pdf
|
10
10
|
creation_date: 2007
|
11
11
|
confirmation_date: 2017-11
|
@@ -379,20 +379,20 @@ stage {
|
|
379
379
|
|
380
380
|
|
381
381
|
# Sun letters
|
382
|
-
sub boundary + "\u0627\u0644\u062a", "at̄ t̄" # الت
|
383
|
-
sub boundary + "\u0627\u0644\u062b", "as̄ s̄" # الث
|
384
|
-
sub boundary + "\u0627\u0644\u062f", "aḏ ḏ" # الد
|
385
|
-
sub boundary + "\u0627\u0644\u0630", "az̄ z̄" # الذ
|
386
|
-
sub boundary + "\u0627\u0644\u0631", "aṟ ṟ" # الر
|
387
|
-
sub boundary + "\u0627\u0644\u0632", "az z" # الز
|
388
|
-
sub boundary + "\u0627\u0644\u0633", "as s" # الس
|
389
|
-
sub boundary + "\u0627\u0644\u0634", "aš š" # الش
|
390
|
-
sub boundary + "\u0627\u0644\u0635", "as̱ s̱" # الص
|
391
|
-
sub boundary + "\u0627\u0644\u0636", "ad͟z d͟z" # الض
|
392
|
-
sub boundary + "\u0627\u0644\u0637", "aṯ ṯ" # الط
|
393
|
-
sub boundary + "\u0627\u0644\u0638", "aẕ ẕ" # الظ
|
394
|
-
sub boundary + "\u0627\u0644\u0644", "al l" # الل
|
395
|
-
sub boundary + "\u0627\u0644\u0646", "an n" # الن
|
382
|
+
sub boundary + "\u0627\u0644\u062a" + maybe("\u0651"), "at̄ t̄" # الت
|
383
|
+
sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), "as̄ s̄" # الث
|
384
|
+
sub boundary + "\u0627\u0644\u062f" + maybe("\u0651"), "aḏ ḏ" # الد
|
385
|
+
sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), "az̄ z̄" # الذ
|
386
|
+
sub boundary + "\u0627\u0644\u0631" + maybe("\u0651"), "aṟ ṟ" # الر
|
387
|
+
sub boundary + "\u0627\u0644\u0632" + maybe("\u0651"), "az z" # الز
|
388
|
+
sub boundary + "\u0627\u0644\u0633" + maybe("\u0651"), "as s" # الس
|
389
|
+
sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "aš š" # الش
|
390
|
+
sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "as̱ s̱" # الص
|
391
|
+
sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "ad͟z d͟z" # الض
|
392
|
+
sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "aṯ ṯ" # الط
|
393
|
+
sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), "aẕ ẕ" # الظ
|
394
|
+
sub boundary + "\u0627\u0644\u0644" + maybe("\u0651"), "al l" # الل
|
395
|
+
sub boundary + "\u0627\u0644\u0646" + maybe("\u0651"), "an n" # الن
|
396
396
|
|
397
397
|
# consonant characters
|
398
398
|
|
@@ -1,10 +1,10 @@
|
|
1
1
|
metadata {
|
2
2
|
authority_id: bgnpcgn
|
3
|
-
id:
|
3
|
+
id: 1968
|
4
4
|
language: iso-639-3:prs
|
5
5
|
source_script: Arab
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Pashto (1968)
|
8
8
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/693760/ROMANIZATION_OF_PASHTO.pdf
|
9
9
|
creation_date: 1968
|
10
10
|
confirmation_date: 2017-11
|
@@ -248,20 +248,20 @@ stage {
|
|
248
248
|
sub "\u0659", "ê"
|
249
249
|
|
250
250
|
# Sun letters
|
251
|
-
sub boundary + "\u0627\u0644\u062a", "ut t" # الت
|
252
|
-
sub boundary + "\u0627\u0644\u062b", "us̄ s̄" # الث
|
253
|
-
sub boundary + "\u0627\u0644\u062f", "ud d" # الد
|
254
|
-
sub boundary + "\u0627\u0644\u0630", "uz̄ z̄" # الذ
|
255
|
-
sub boundary + "\u0627\u0644\u0631", "ur r" # الر
|
256
|
-
sub boundary + "\u0627\u0644\u0632", "uz z" # الز
|
257
|
-
sub boundary + "\u0627\u0644\u0633", "us s" # الس
|
258
|
-
sub boundary + "\u0627\u0644\u0634", "ush sh" # الش
|
259
|
-
sub boundary + "\u0627\u0644\u0635", "uş ş" # الص
|
260
|
-
sub boundary + "\u0627\u0644\u0636", "uẕ ẕ" # الض
|
261
|
-
sub boundary + "\u0627\u0644\u0637", "uţ ţ" # الط
|
262
|
-
sub boundary + "\u0627\u0644\u0638", "uz̧ z̧" # الظ
|
263
|
-
sub boundary + "\u0627\u0644\u0644", "ul l" # الل
|
264
|
-
sub boundary + "\u0627\u0644\u0646", "un n" # الن
|
251
|
+
sub boundary + "\u0627\u0644\u062a" + maybe("\u0651"), "ut t" # الت
|
252
|
+
sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), "us̄ s̄" # الث
|
253
|
+
sub boundary + "\u0627\u0644\u062f" + maybe("\u0651"), "ud d" # الد
|
254
|
+
sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), "uz̄ z̄" # الذ
|
255
|
+
sub boundary + "\u0627\u0644\u0631" + maybe("\u0651"), "ur r" # الر
|
256
|
+
sub boundary + "\u0627\u0644\u0632" + maybe("\u0651"), "uz z" # الز
|
257
|
+
sub boundary + "\u0627\u0644\u0633" + maybe("\u0651"), "us s" # الس
|
258
|
+
sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "ush sh" # الش
|
259
|
+
sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "uş ş" # الص
|
260
|
+
sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "uẕ ẕ" # الض
|
261
|
+
sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "uţ ţ" # الط
|
262
|
+
sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), "uz̧ z̧" # الظ
|
263
|
+
sub boundary + "\u0627\u0644\u0644" + maybe("\u0651"), "ul l" # الل
|
264
|
+
sub boundary + "\u0627\u0644\u0646" + maybe("\u0651"), "un n" # الن
|
265
265
|
|
266
266
|
sub "\u0626", "êy" # ئ
|
267
267
|
}
|