interscript-maps 2.2.0 → 2.2.1
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/interscript-maps.gemspec +1 -1
- data/interscript-maps.yaml +300 -111
- data/maps/acadsin-zho-Hani-Latn-2002.imp +2 -2
- data/maps/alalc-amh-Ethi-Latn-1997.imp +18 -14
- data/maps/alalc-amh-Ethi-Latn-2011.imp +1 -1
- data/maps/alalc-ara-Arab-Latn-1997.imp +1 -1
- data/maps/alalc-asm-Deva-Latn-1997.imp +1 -1
- data/maps/alalc-asm-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-aze-Arab-Latn-1997.imp +1 -1
- data/maps/alalc-aze-Cyrl-Latn-1997.imp +1 -1
- data/maps/alalc-bel-Cyrl-Latn-1997.imp +4 -4
- data/maps/alalc-ben-Beng-Latn-1997.imp +1 -1
- data/maps/alalc-ben-Beng-Latn-2017.imp +1 -1
- data/maps/alalc-bul-Cyrl-Latn-1997.imp +1 -1
- data/maps/alalc-div-Thaa-Latn-1997.imp +1 -1
- data/maps/alalc-ell-Grek-Latn-1997.imp +1 -1
- data/maps/alalc-ell-Grek-Latn-2010.imp +1 -1
- data/maps/alalc-guj-Gujr-Latn-1997.imp +1 -1
- data/maps/alalc-guj-Gujr-Latn-2011.imp +1 -1
- data/maps/alalc-hin-Deva-Latn-1997.imp +1 -1
- data/maps/alalc-hin-Deva-Latn-2011.imp +1 -1
- data/maps/alalc-kan-Kana-Latn-1997.imp +1 -1
- data/maps/alalc-kan-Kana-Latn-2011.imp +1 -1
- data/maps/alalc-kat-Geok-Latn-1997.imp +3 -3
- data/maps/alalc-kat-Geor-Latn-1997.imp +12 -12
- data/maps/alalc-kor-Hang-Latn-1997.imp +1 -1
- data/maps/alalc-mal-Mlym-Latn-1997.imp +1 -1
- data/maps/alalc-mar-Deva-Latn-1997.imp +1 -1
- data/maps/alalc-mar-Deva-Latn-2011.imp +1 -1
- data/maps/alalc-mkd-Cyrl-Latn-1997.imp +2 -2
- data/maps/alalc-mkd-Cyrl-Latn-2013.imp +2 -2
- data/maps/alalc-mon-Cyrl-Latn-1997.imp +3 -3
- data/maps/alalc-ori-Orya-Latn-1997.imp +1 -1
- data/maps/alalc-ori-Orya-Latn-2011.imp +1 -1
- data/maps/alalc-pan-Guru-Latn-1997.imp +1 -1
- data/maps/alalc-pan-Guru-Latn-2011.imp +1 -1
- data/maps/alalc-per-Arab-Latn-1997.imp +1 -1
- data/maps/alalc-pli-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-pra-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-rus-Cyrl-Latn-1997.imp +2 -2
- data/maps/alalc-rus-Cyrl-Latn-2012.imp +1 -1
- data/maps/alalc-san-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-sin-Sinh-Latn-1997.imp +1 -1
- data/maps/alalc-sin-Sinh-Latn-2011.imp +1 -1
- data/maps/alalc-srp-Cyrl-Latn-1997.imp +2 -2
- data/maps/alalc-srp-Cyrl-Latn-2013.imp +1 -1
- data/maps/alalc-tam-Taml-Latn-1997.imp +1 -1
- data/maps/alalc-tam-Taml-Latn-2011.imp +1 -1
- data/maps/alalc-tel-Telu-Latn-1997.imp +2 -2
- data/maps/alalc-tel-Telu-Latn-2011.imp +1 -1
- data/maps/alalc-tir-Ethi-Latn-1997.imp +429 -0
- data/maps/alalc-tir-Ethi-Latn-2011.imp +85 -0
- data/maps/alalc-ukr-Cyrl-Latn-1997.imp +1 -1
- data/maps/alalc-ukr-Cyrl-Latn-2011.imp +1 -1
- data/maps/apcbg-bul-Cyrl-Latn-1995.imp +7 -4
- data/maps/az-aze-Cyrl-Latn-1939.imp +1 -0
- data/maps/az-aze-Cyrl-Latn-1958.imp +1 -0
- data/maps/bgn-jpn-Hrkt-Latn-1962.imp +5 -5
- data/maps/bgn-kor-Hang-Latn-1943.imp +1 -1
- data/maps/bgn-kor-Kore-Latn-1943.imp +1 -1
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +11 -11
- data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +1 -1
- data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +2 -2
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +2 -2
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +10 -4
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +1 -1
- data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +1 -1
- data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +4 -4
- data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +1 -1
- data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +1 -1
- data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +1 -1
- data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +4 -3
- data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +1 -1
- data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +1 -1
- data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +2 -2
- data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +1 -1
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +1 -1
- data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +8 -8
- data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +2 -2
- data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +4 -4
- data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +3 -3
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +1 -1
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +4 -4
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +4 -3
- data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +1 -1
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +2 -2
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +1 -1
- data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +3 -3
- data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +4 -4
- data/maps/bgnpcgn-per-Arab-Latn-1958.imp +19 -19
- data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +15 -15
- data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +15 -15
- data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +16 -16
- data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +2 -2
- data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +5 -5
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +1 -1
- data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +1 -1
- data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +5 -3
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +1 -1
- data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +1 -1
- data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +1 -1
- data/maps/bgnpcgn-tir-Ethi-Latn-2007.imp +511 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +1 -1
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +1 -1
- data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +15 -15
- data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +3 -3
- data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +1 -1
- data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +1 -1
- data/maps/by-bel-Cyrl-Latn-2007.imp +7 -5
- data/maps/dos-nep-Deva-Latn-1997.imp +2 -2
- data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +1 -1
- data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +1 -1
- data/maps/ggg-kat-Geor-Latn-2002.imp +3 -3
- data/maps/gki-bel-Cyrl-Latn-2000.imp +1 -1
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +1 -1
- data/maps/iso-ara-Arab-Latn-233-1984.imp +14 -14
- data/maps/iso-ben-Beng-Latn-15919-2001.imp +1 -1
- data/maps/iso-prs-Arab-Latn-233-3-1999.imp +14 -14
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +5 -5
- data/maps/mext-jpn-Hrkt-Latn-1954.imp +2 -1
- data/maps/moct-kor-Hang-Latn-2000.imp +1 -1
- data/maps/mofa-jpn-Hrkt-Latn-1989.imp +1 -1
- data/maps/mv-div-Thaa-Latn-1987.imp +1 -1
- data/maps/mvd-bel-Cyrl-Latn-2008.imp +5 -5
- data/maps/mvd-bel-Cyrl-Latn-2010.imp +2 -5
- data/maps/mvd-rus-Cyrl-Latn-2008.imp +4 -3
- data/maps/mvd-rus-Cyrl-Latn-2010.imp +2 -5
- data/maps/odni-ara-Arab-Latn-2004.imp +1 -1
- data/maps/odni-ara-Arab-Latn-2015.imp +1 -1
- data/maps/odni-aze-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-bel-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-bul-Cyrl-Latn-2005.imp +2 -2
- data/maps/odni-bul-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-che-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-fas-Arab-Latn-2004.imp +14 -14
- data/maps/odni-fas-Arab-Latn-2015.imp +15 -15
- data/maps/odni-hin-Deva-Latn-2004.imp +20 -20
- data/maps/odni-hin-Deva-Latn-2015.imp +25 -26
- data/maps/odni-kat-Geor-Latn-2015.imp +2 -3
- data/maps/odni-kaz-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-kir-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-kor-Hang-Latn-2015.imp +1 -1
- data/maps/odni-mkd-Cyrl-Latn-2005.imp +1 -1
- data/maps/odni-mkd-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-prs-Arab-Latn-2015.imp +1 -1
- data/maps/odni-pus-Arab-Latn-2011.imp +1 -1
- data/maps/odni-rus-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-srp-Cyrl-Latn-2005.imp +2 -2
- data/maps/odni-srp-Cyrl-Latn-2015.imp +8 -8
- data/maps/odni-tat-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-tgk-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-tuk-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-uig-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-ukr-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-urd-Arab-Latn-2015.imp +21 -21
- data/maps/odni-uzb-Cyrl-Latn-2015.imp +1 -1
- data/maps/ses-ara-Arab-Latn-1930.imp +14 -14
- data/maps/un-amh-Ethi-Latn-2016.imp +1 -1
- data/maps/un-ara-Arab-Latn-1971.imp +5 -5
- data/maps/un-ara-Arab-Latn-1972.imp +4 -4
- data/maps/un-ara-Arab-Latn-2017.imp +15 -15
- data/maps/un-asm-Beng-Latn-1972.imp +1 -1
- data/maps/un-bel-Cyrl-Latn-2007.imp +2 -2
- data/maps/un-ben-Beng-Latn-2016.imp +1 -1
- data/maps/un-bul-Cyrl-Latn-1977.imp +197 -0
- data/maps/un-ell-Grek-Latn-1987-phonetic.imp +5 -1
- data/maps/un-ell-Grek-Latn-1987-tl.imp +1 -1
- data/maps/un-ell-Grek-Latn-1987-ts.imp +2 -2
- data/maps/un-guj-Gujr-Latn-1972.imp +1 -1
- data/maps/un-hin-Deva-Latn-2016.imp +1 -1
- data/maps/un-kan-Kana-Latn-2016.imp +1 -1
- data/maps/un-mal-Mlym-Latn-1972.imp +1 -1
- data/maps/un-mar-Deva-Latn-2016.imp +1 -1
- data/maps/un-mkd-Cyrl-Latn-1977.imp +119 -0
- data/maps/un-mon-Mong-Latn-general-2013.imp +1 -1
- data/maps/un-mon-Mong-Latn-phonetic-2013.imp +1 -1
- data/maps/un-nep-Deva-Latn-1972.imp +1 -1
- data/maps/un-nep-Deva-Latn-2013.imp +1 -1
- data/maps/un-ori-Orya-Latn-1972.imp +1 -1
- data/maps/un-pan-Guru-Latn-1972.imp +1 -1
- data/maps/un-prs-Arab-Latn-1967.imp +15 -15
- data/maps/un-rus-Cyrl-Latn-1987.imp +1 -1
- data/maps/un-sin-Sinh-Latn-1972.imp +1 -1
- data/maps/un-srp-Cyrl-Latn-1997.imp +47 -0
- data/maps/un-tam-Taml-Latn-1972.imp +1 -1
- data/maps/un-tel-Telu-Latn-1972.imp +1 -1
- data/maps/un-ukr-Cyrl-Latn-1998.imp +1 -1
- data/maps/un-ukr-Cyrl-Latn-2012.imp +1 -1
- data/maps/un-urd-Arab-Latn-1972.imp +15 -15
- data/maps/var-amh-Ethi-Latn-eae-2003.imp +48 -43
- metadata +7 -1
@@ -4,8 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:kat
|
5
5
|
source_script: Geor
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
8
|
-
|
7
|
+
name: Romanization of Georgian Personal Names (2015), ICS 630-01 Annex E
|
9
8
|
# url:
|
10
9
|
source: ICS 630-01, Annex E
|
11
10
|
creation_date: 2015
|
@@ -16,7 +15,7 @@ metadata {
|
|
16
15
|
eliminate variations of a name that can contribute forensic information. Rather, it is to provide an
|
17
16
|
IC standard Romanized (English) transliteration from Georgian that can then be linked to forensic
|
18
17
|
information in ways that will help identify the referent of the name.
|
19
|
-
|
18
|
+
|
20
19
|
notes:
|
21
20
|
}
|
22
21
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:kaz
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Kazakh Personal Names (2015)
|
8
8
|
source: ICS-630-01 Annex Q
|
9
9
|
creation_date: 2015
|
10
10
|
confirmation_date: 2015
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:kir
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Kyrgyz Personal Names (2015)
|
8
8
|
source: ICS-630-01 Annex R
|
9
9
|
creation_date: 2015
|
10
10
|
confirmation_date: 2015
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:kor
|
5
5
|
source_script: Hang
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Korean Personal Names (2015), ICS-630-01 Annex W
|
8
8
|
url:
|
9
9
|
creation_date: 2015
|
10
10
|
adoption_date:
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:mkd
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Intelligence Community (IC) Standard for the Transliteration of Macedonian Personal Names (2005)
|
8
8
|
creation_date: 2005
|
9
9
|
confirmation_date: 2005
|
10
10
|
description: |
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:mkd
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Macedonian Personal Names (2015)
|
8
8
|
source: ICS-630-01 Annex H
|
9
9
|
creation_date: 2015
|
10
10
|
confirmation_date: 2015
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-3:prs
|
5
5
|
source_script: Arab
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Persian Farsi Dari Personal Names (2015), ICS-630-01 Annex J
|
8
8
|
url: https://github.com/interscript/ics-630-01/blob/master/reference-docs/ANNEX%20J%20-%20Persian-Farsi_Dari_Personal_Names_FLTS_2018_Revision%20(U).pdf
|
9
9
|
creation_date: 2015
|
10
10
|
confirmation_date: 2015-11
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-3:prs
|
5
5
|
source_script: Arab
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Pashto Personal Names (2011)
|
8
8
|
url: https://github.com/interscript/interscript-private-references/blob/master/odni/Pashto%20June%202011.pdf
|
9
9
|
creation_date: 2011
|
10
10
|
confirmation_date: 2011-06
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:rus
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Russian Personal Names (2015), ICS-630-01 Annex K
|
8
8
|
|
9
9
|
# url:
|
10
10
|
source: ICS-630-01 Annex K
|
@@ -4,12 +4,12 @@ metadata {
|
|
4
4
|
language: iso-639-2:srp
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Intelligence Community (IC) Standard for the Transliteration of Serbian Personal Names (2004)
|
8
8
|
creation_date: 2005
|
9
9
|
confirmation_date: 2005
|
10
10
|
description: |
|
11
11
|
Office of the Director Of National Intelligence Serbian Personal Names 2004 System
|
12
|
-
|
12
|
+
|
13
13
|
notes:
|
14
14
|
}
|
15
15
|
|
@@ -4,8 +4,8 @@ metadata {
|
|
4
4
|
language: iso-639-2:srp
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
8
|
-
|
7
|
+
name: Romanization of Serbian Personal Names (2015), ICS-630-01 Annex L
|
8
|
+
|
9
9
|
# url:
|
10
10
|
source: ICS-630-01 Annex L
|
11
11
|
creation_date: 2015
|
@@ -16,27 +16,27 @@ metadata {
|
|
16
16
|
is not intended to eliminate variations of a name that can contribute forensic information. Rather,
|
17
17
|
it is to provide an IC standard Romanized (English) transliteration from Serbian that can then be
|
18
18
|
linked to forensic information in ways that will help identify the referent of the name.
|
19
|
-
|
19
|
+
|
20
20
|
In cases where an individual’s name has already been transliterated in a variant spelling, the IC
|
21
21
|
Standard spelling should appear first, followed by the variant spelling(s) in parentheses at the first
|
22
22
|
usage. In addition, if the original Cyrillic spelling is known, that spelling should also appear in
|
23
23
|
parentheses following the name, if possible, following best practices of the issuing organization
|
24
24
|
and taking into consideration information system capabilities. This convention is designed to
|
25
25
|
ensure that vital forensic information is not lost.
|
26
|
-
|
26
|
+
|
27
27
|
For names of persons who are known to not be part of the Serbian-speaking community, use the
|
28
28
|
relevant IC transliteration standard for names from that language (e.g., Mikhail, Yitzhak). A
|
29
29
|
translator’s note may be used to clarify the known origin of the person. Spell names of
|
30
30
|
individuals from languages that are written in Roman letters as they are spelled in those
|
31
31
|
languages (e.g., George Clooney, Jorge Garcia, Georges Pompidou).
|
32
|
-
|
32
|
+
|
33
33
|
In the case of active senior government officials in the on-line CIA World Factbook and the on-line directory of Chiefs of State and Cabinet Members of Foreign Governments, the spellings
|
34
34
|
given in these on-line reference works should be used in place of the IC Standard. For any
|
35
35
|
individual who has at one time been listed in the Factbook or Chiefs of State directory but who no
|
36
36
|
longer appears in those resources (i.e. is no longer a government official), the IC Standard
|
37
37
|
spelling should appear first, with the spelling, if known, as it previously appeared in those
|
38
38
|
resources listed within parentheses at the first usage.
|
39
|
-
|
39
|
+
|
40
40
|
The primary goal is to produce a consistent Romanized transcription of names that is specifically
|
41
41
|
readable to the English-speaking non-specialist. The system uses the 26 letters of the standard
|
42
42
|
(English) Roman alphabet. Some ambiguities in the Romanized form will occur without the use
|
@@ -44,7 +44,7 @@ metadata {
|
|
44
44
|
individual is provided, the referent will be clearly identified. This system will be used in
|
45
45
|
conjunction with on-line tools, name dictionaries, and lists containing conventional spellings of
|
46
46
|
names of well-known individuals.
|
47
|
-
|
47
|
+
|
48
48
|
notes:
|
49
49
|
}
|
50
50
|
|
@@ -93,7 +93,7 @@ stage {
|
|
93
93
|
sub "\u0427", "C" # Ч
|
94
94
|
sub "\u040F", "Dz" # Џ
|
95
95
|
sub "\u0428", "S" # Ш
|
96
|
-
|
96
|
+
|
97
97
|
sub "\u0430", "a" # а
|
98
98
|
sub "\u0431", "b" # б
|
99
99
|
sub "\u0432", "v" # в
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:tat
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Tatar Personal Names (2015)
|
8
8
|
source: ICS-630-01 Annex S
|
9
9
|
creation_date: 2015
|
10
10
|
confirmation_date: 2015
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:tgk
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Tajik Personal Names (2015)
|
8
8
|
source: ICS-630-01 Annex N
|
9
9
|
creation_date: 2015
|
10
10
|
confirmation_date: 2015
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:tuk
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Turkmen Personal Names (2015)
|
8
8
|
url: https://github.com/interscript/ics-630-01/blob/master/reference-docs/ANNEX%20T%20-%20Turkmen_Personal_Names_FLTS%20(U).pdf
|
9
9
|
source: ICS-630-01 Annex T
|
10
10
|
creation_date: 2015
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:uig
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Uyghur Personal Names (2015)
|
8
8
|
source: ICS-630-01 Annex U
|
9
9
|
creation_date: 2015
|
10
10
|
confirmation_date: 2015
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:ukr
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Ukrainian Personal Names (2015), ICS 630-01 Annex M
|
8
8
|
|
9
9
|
# url:
|
10
10
|
source: ICS 630-01, Annex M
|
@@ -4,8 +4,8 @@ metadata {
|
|
4
4
|
language: iso-639-2:urd
|
5
5
|
source_script: Arab
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
8
|
-
|
7
|
+
name: Romanization of Hindi and Urdu Personal Names (2015), ICS-630-01 Annex F
|
8
|
+
|
9
9
|
#url:
|
10
10
|
creation_date: 2015
|
11
11
|
confirmation_date: 2015
|
@@ -16,7 +16,7 @@ metadata {
|
|
16
16
|
forensic information. Rather, it is to provide an IC standard Romanized (English)
|
17
17
|
transliteration from standard Hindi and Urdu that can then be linked to forensic
|
18
18
|
information in ways that will help identify the referent of the name.
|
19
|
-
|
19
|
+
|
20
20
|
There are typically a number of ways that names can be Romanized from either
|
21
21
|
Devanagari (Hindi) or modified Arabic (Urdu) scripts. Ambiguities can result from the
|
22
22
|
Romanization of Hindi and Urdu names for several reasons, including the fact that some
|
@@ -31,7 +31,7 @@ metadata {
|
|
31
31
|
And, as in the Arabic source, names containing the Arabic definite article ‘al’ (‘ul’) show
|
32
32
|
anticipatory assimilation in pronunciation (e.g., Shams al Din > Shamsuddin);
|
33
33
|
transliterations may either reflect spelling or pronunciation in such cases.
|
34
|
-
|
34
|
+
|
35
35
|
Because Hindi and Urdu overlap so extensively, it is desirable to correlate Hindi and
|
36
36
|
Urdu transliterations as much as possible. In the area of names, this can become
|
37
37
|
problematic when the Urdu spelling accurately reflects original Arabic spelling while the
|
@@ -40,7 +40,7 @@ metadata {
|
|
40
40
|
either Urdu or Hindi (e.g., letter sin versus letter sad) while maintaining Arabic/Urdu
|
41
41
|
spelling distinctions like Hindi also maintains (e.g., qaf as in Qutubbin versus kaf)).
|
42
42
|
However, this is not always possible (see Hindi va versus Urdu wau).
|
43
|
-
|
43
|
+
|
44
44
|
In cases where an individual’s name has already been transliterated, that is to be indicated
|
45
45
|
– as found – in parentheses immediately following its rendition in the transliteration
|
46
46
|
standard (e.g., Muhammad Khulud (Mohamed Khulood)). In addition, if the original
|
@@ -48,14 +48,14 @@ metadata {
|
|
48
48
|
parentheses following the name, if possible, following best practices of the issuing
|
49
49
|
organization and taking into consideration information system capabilities. This
|
50
50
|
convention is designed to ensure that vital forensic information is not lost.
|
51
|
-
|
51
|
+
|
52
52
|
For names of persons who are known to not be part of the Hindi- or Urdu-speaking
|
53
53
|
community, use the relevant IC transliteration standard for names from that language
|
54
54
|
(e.g., Mikhail, Yitzhak). A translator’s note may be used to clarify the known origin of
|
55
55
|
the person. Spell names of individuals from languages that are written in Roman letters as
|
56
56
|
they are spelled in those languages (e.g., George Clooney, Jorge Garcia, Georges
|
57
57
|
Pompidou).
|
58
|
-
|
58
|
+
|
59
59
|
In the case of active senior government officials in the on-line CIA World Factbook and
|
60
60
|
the on-line directory of Chiefs of State and Cabinet Members of Foreign Governments,
|
61
61
|
the spellings given in these on-line reference works should be used in place of the IC
|
@@ -64,7 +64,7 @@ metadata {
|
|
64
64
|
government official), the IC Standard spelling should appear first, with the spelling, if
|
65
65
|
known, as it previously appeared in those resources listed within parentheses at the first
|
66
66
|
usage.
|
67
|
-
|
67
|
+
|
68
68
|
The primary goal of this system is to produce a consistent Romanized transcription of the
|
69
69
|
name that is readable to the non-specialist. The system uses the 26 letters of the standard
|
70
70
|
(English) Roman alphabet. Some ambiguities in the Romanized form will occur without
|
@@ -72,16 +72,16 @@ metadata {
|
|
72
72
|
information about the individual is provided, the referent will be clearly identified.
|
73
73
|
Additionally, this system will be used in conjunction with on-line tools, name dictionaries
|
74
74
|
and lists containing conventional spellings of names of well-known individuals.
|
75
|
-
|
75
|
+
|
76
76
|
notes:
|
77
|
-
|
77
|
+
|
78
78
|
- |
|
79
79
|
Long/Short Vowels: Long and short vowels are not distinguished in the system:
|
80
80
|
The borrowed Arabic name Samir could represent two distinct names, one with a
|
81
81
|
long /a/ (Saamir) and one with a long /i/ (Samiir). One solution would be to use
|
82
82
|
/ee/ to stand for the long /i/, as is often done (Sameer). The IC Standard will not
|
83
83
|
distinguish between these.
|
84
|
-
|
84
|
+
|
85
85
|
- |
|
86
86
|
No distinction is made between: retroflex and non-retroflex consonants; and
|
87
87
|
nasalized vowels and vowels followed by /n/.
|
@@ -150,8 +150,8 @@ stage {
|
|
150
150
|
|
151
151
|
# CHARACTERS
|
152
152
|
parallel {
|
153
|
-
|
154
|
-
|
153
|
+
|
154
|
+
|
155
155
|
sub "\u0622", "a" # ARABIC ALEF W/MADDA ABOVE
|
156
156
|
sub "\u0627", "a" # or u ARABIC ALEF
|
157
157
|
sub "\u06cc", "i" # or ai or u ARABIC LETTER FARSI YEH
|
@@ -170,9 +170,9 @@ stage {
|
|
170
170
|
sub "\u06c2", "-e" # ARABIC LETTER HEH GOAL WITH HAMZA ABOVE
|
171
171
|
sub "\u06c1\u0650", "o" # ARABIC LETTER HEH GOAL + ARABIC KASRA
|
172
172
|
sub "\u0624", "au" # ARABIC LETTER WAW WITH HAMZA ABOVE
|
173
|
-
|
174
|
-
|
175
|
-
|
173
|
+
|
174
|
+
|
175
|
+
|
176
176
|
sub "\u06a9", "k" # ARABIC LETTER KEHEH
|
177
177
|
sub "\u0642", "q" # ARABIC LETTER QAF
|
178
178
|
sub "\u062e", "kh" # ARABIC LETTER KHAH
|
@@ -180,14 +180,14 @@ stage {
|
|
180
180
|
sub "\u063a", "gh" # ARABIC LETTER GHAIN
|
181
181
|
sub "\u0686", "ch" # ARABIC LETTER TCHEH
|
182
182
|
sub "\u062c", "j" # Arabic Letter Jeem
|
183
|
-
|
183
|
+
|
184
184
|
sub "\u0632", "z" # Arabic Letter ZAIN
|
185
185
|
sub "\u0630", "z" # Arabic Letter THAL
|
186
186
|
sub "\u0636", "z" # Arabic Letter DAD
|
187
187
|
sub "\u0638", "z" # Arabic Letter ZAH
|
188
188
|
sub "\u0698", "zh" # Arabic Letter JEH
|
189
|
-
|
190
|
-
|
189
|
+
|
190
|
+
|
191
191
|
sub "\u0679", "t" # ARABIC LETTER TTEH
|
192
192
|
sub "\u0688", "d" # Arabic Letter DDAL
|
193
193
|
sub "\u062f", "d" # Arabic Letter DAL
|
@@ -196,8 +196,8 @@ stage {
|
|
196
196
|
sub "\u0637", "t" # Arabic Letter TAH
|
197
197
|
sub "\u0646", "n" # Arabic Letter NOON
|
198
198
|
sub "\u06ba", "n" # Arabic Letter NOON GHUNNA
|
199
|
-
|
200
|
-
|
199
|
+
|
200
|
+
|
201
201
|
sub "\u067e", "p" # Arabic Letter PE
|
202
202
|
sub "\u0641", "f" # Arabic Letter FEH
|
203
203
|
sub "\u0628", "b" # Arabic Letter BEH
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:uzb
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Uzbek Personal Names (2015), ICS-630-01 Annex V
|
8
8
|
|
9
9
|
# url:
|
10
10
|
source: ICS-630-01 Annex V
|
@@ -129,20 +129,20 @@ stage {
|
|
129
129
|
|
130
130
|
|
131
131
|
# Sun letters
|
132
|
-
sub boundary + "\u0627\u0644\u062a", "el-t" # الت
|
133
|
-
sub boundary + "\u0627\u0644\u062b", any(["el-th", "el-t"]) # الث
|
134
|
-
sub boundary + "\u0627\u0644\u062f", "el-d" # الد
|
135
|
-
sub boundary + "\u0627\u0644\u0630", any(["el-dh", "el-z"]) # الذ
|
136
|
-
sub boundary + "\u0627\u0644\u0631", "el-r" # الر
|
137
|
-
sub boundary + "\u0627\u0644\u0632", "el-z" # الز
|
138
|
-
sub boundary + "\u0627\u0644\u0633", any(["el-s", "el-c"]) # الس
|
139
|
-
sub boundary + "\u0627\u0644\u0634", "el-sh" # الش
|
140
|
-
sub boundary + "\u0627\u0644\u0635", "el-ṣ" # الص
|
141
|
-
sub boundary + "\u0627\u0644\u0636", "el-ḍ" # الض
|
142
|
-
sub boundary + "\u0627\u0644\u0637", "el-ṭ" # الط
|
143
|
-
sub boundary + "\u0627\u0644\u0638", any(["el-ẓ", "el-d"]) # الظ
|
144
|
-
sub boundary + "\u0627\u0644\u0644", "el-l" # الل
|
145
|
-
sub boundary + "\u0627\u0644\u0646", "el-n" # الن
|
132
|
+
sub boundary + "\u0627\u0644\u062a" + maybe("\u0651"), "el-t" # الت
|
133
|
+
sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), any(["el-th", "el-t"]) # الث
|
134
|
+
sub boundary + "\u0627\u0644\u062f" + maybe("\u0651"), "el-d" # الد
|
135
|
+
sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), any(["el-dh", "el-z"]) # الذ
|
136
|
+
sub boundary + "\u0627\u0644\u0631" + maybe("\u0651"), "el-r" # الر
|
137
|
+
sub boundary + "\u0627\u0644\u0632" + maybe("\u0651"), "el-z" # الز
|
138
|
+
sub boundary + "\u0627\u0644\u0633" + maybe("\u0651"), any(["el-s", "el-c"]) # الس
|
139
|
+
sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "el-sh" # الش
|
140
|
+
sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "el-ṣ" # الص
|
141
|
+
sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "el-ḍ" # الض
|
142
|
+
sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "el-ṭ" # الط
|
143
|
+
sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), any(["el-ẓ", "el-d"]) # الظ
|
144
|
+
sub boundary + "\u0627\u0644\u0644" + maybe("\u0651"), "el-l" # الل
|
145
|
+
sub boundary + "\u0627\u0644\u0646" + maybe("\u0651"), "el-n" # الن
|
146
146
|
|
147
147
|
|
148
148
|
# shadda
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:amh
|
5
5
|
source_script: Ethi
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Amharic -- UNGEGN (2016)
|
8
8
|
url: http://www.eki.ee/wgrs/rom1_am.pdf
|
9
9
|
creation_date: 1967
|
10
10
|
confirmation_date: 2016-03
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:ara
|
5
5
|
source_script: Arab
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Arabic -- Beirut system (1971)
|
8
8
|
url: https://unstats.un.org/unsd/geoinfo/UNGEGN/docs/2nd-uncsgn-docs/E_Conf61_4_Add1_e.pdf
|
9
9
|
creation_date: 1971
|
10
10
|
confirmation_date: 2018-06
|
@@ -85,10 +85,10 @@ stage {
|
|
85
85
|
parallel {
|
86
86
|
|
87
87
|
# sun letters
|
88
|
-
sub boundary + "\u0627\u0644\u062b", "at͟h t͟h" # الث
|
89
|
-
sub boundary + "\u0627\u0644\u0630", "ad͟h d͟h" # الذ
|
90
|
-
sub boundary + "\u0627\u0644\u0634", "as͟h s͟h" # الش
|
91
|
-
sub boundary + "\u0627\u0644\u0638", "az͟h z͟h" # الظ
|
88
|
+
sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), "at͟h t͟h" # الث
|
89
|
+
sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), "ad͟h d͟h" # الذ
|
90
|
+
sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "as͟h s͟h" # الش
|
91
|
+
sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), "az͟h z͟h" # الظ
|
92
92
|
|
93
93
|
# shadda
|
94
94
|
sub "\u062e\u0651", "k͟hk͟h" # خ
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:ara
|
5
5
|
source_script: Arab
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Arabic -- UNGEGN (1972)
|
8
8
|
url: http://www.eki.ee/wgrs/obs_rom_vers/rom1_ar_v4_0.pdf
|
9
9
|
creation_date: 1972
|
10
10
|
confirmation_date: 2018-06
|
@@ -107,9 +107,9 @@ stage {
|
|
107
107
|
# CHARACTERS
|
108
108
|
parallel {
|
109
109
|
|
110
|
-
sub boundary + "\u0627\u0644\u0635", "aş ş" # الص
|
111
|
-
sub boundary + "\u0627\u0644\u0636", "aḑ ḑ" # الض
|
112
|
-
sub boundary + "\u0627\u0644\u0637", "aţ ţ" # الط
|
110
|
+
sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "aş ş" # الص
|
111
|
+
sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "aḑ ḑ" # الض
|
112
|
+
sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "aţ ţ" # الط
|
113
113
|
|
114
114
|
sub "\u062d\u0651", "ḩḩ" # ح
|
115
115
|
sub "\u0635\u0651", "şş" # ص
|