interscript-maps 2.2.0 → 2.2.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/interscript-maps.gemspec +1 -1
- data/interscript-maps.yaml +300 -111
- data/maps/acadsin-zho-Hani-Latn-2002.imp +2 -2
- data/maps/alalc-amh-Ethi-Latn-1997.imp +18 -14
- data/maps/alalc-amh-Ethi-Latn-2011.imp +1 -1
- data/maps/alalc-ara-Arab-Latn-1997.imp +1 -1
- data/maps/alalc-asm-Deva-Latn-1997.imp +1 -1
- data/maps/alalc-asm-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-aze-Arab-Latn-1997.imp +1 -1
- data/maps/alalc-aze-Cyrl-Latn-1997.imp +1 -1
- data/maps/alalc-bel-Cyrl-Latn-1997.imp +4 -4
- data/maps/alalc-ben-Beng-Latn-1997.imp +1 -1
- data/maps/alalc-ben-Beng-Latn-2017.imp +1 -1
- data/maps/alalc-bul-Cyrl-Latn-1997.imp +1 -1
- data/maps/alalc-div-Thaa-Latn-1997.imp +1 -1
- data/maps/alalc-ell-Grek-Latn-1997.imp +1 -1
- data/maps/alalc-ell-Grek-Latn-2010.imp +1 -1
- data/maps/alalc-guj-Gujr-Latn-1997.imp +1 -1
- data/maps/alalc-guj-Gujr-Latn-2011.imp +1 -1
- data/maps/alalc-hin-Deva-Latn-1997.imp +1 -1
- data/maps/alalc-hin-Deva-Latn-2011.imp +1 -1
- data/maps/alalc-kan-Kana-Latn-1997.imp +1 -1
- data/maps/alalc-kan-Kana-Latn-2011.imp +1 -1
- data/maps/alalc-kat-Geok-Latn-1997.imp +3 -3
- data/maps/alalc-kat-Geor-Latn-1997.imp +12 -12
- data/maps/alalc-kor-Hang-Latn-1997.imp +1 -1
- data/maps/alalc-mal-Mlym-Latn-1997.imp +1 -1
- data/maps/alalc-mar-Deva-Latn-1997.imp +1 -1
- data/maps/alalc-mar-Deva-Latn-2011.imp +1 -1
- data/maps/alalc-mkd-Cyrl-Latn-1997.imp +2 -2
- data/maps/alalc-mkd-Cyrl-Latn-2013.imp +2 -2
- data/maps/alalc-mon-Cyrl-Latn-1997.imp +3 -3
- data/maps/alalc-ori-Orya-Latn-1997.imp +1 -1
- data/maps/alalc-ori-Orya-Latn-2011.imp +1 -1
- data/maps/alalc-pan-Guru-Latn-1997.imp +1 -1
- data/maps/alalc-pan-Guru-Latn-2011.imp +1 -1
- data/maps/alalc-per-Arab-Latn-1997.imp +1 -1
- data/maps/alalc-pli-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-pra-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-rus-Cyrl-Latn-1997.imp +2 -2
- data/maps/alalc-rus-Cyrl-Latn-2012.imp +1 -1
- data/maps/alalc-san-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-sin-Sinh-Latn-1997.imp +1 -1
- data/maps/alalc-sin-Sinh-Latn-2011.imp +1 -1
- data/maps/alalc-srp-Cyrl-Latn-1997.imp +2 -2
- data/maps/alalc-srp-Cyrl-Latn-2013.imp +1 -1
- data/maps/alalc-tam-Taml-Latn-1997.imp +1 -1
- data/maps/alalc-tam-Taml-Latn-2011.imp +1 -1
- data/maps/alalc-tel-Telu-Latn-1997.imp +2 -2
- data/maps/alalc-tel-Telu-Latn-2011.imp +1 -1
- data/maps/alalc-tir-Ethi-Latn-1997.imp +429 -0
- data/maps/alalc-tir-Ethi-Latn-2011.imp +85 -0
- data/maps/alalc-ukr-Cyrl-Latn-1997.imp +1 -1
- data/maps/alalc-ukr-Cyrl-Latn-2011.imp +1 -1
- data/maps/apcbg-bul-Cyrl-Latn-1995.imp +7 -4
- data/maps/az-aze-Cyrl-Latn-1939.imp +1 -0
- data/maps/az-aze-Cyrl-Latn-1958.imp +1 -0
- data/maps/bgn-jpn-Hrkt-Latn-1962.imp +5 -5
- data/maps/bgn-kor-Hang-Latn-1943.imp +1 -1
- data/maps/bgn-kor-Kore-Latn-1943.imp +1 -1
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +11 -11
- data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +1 -1
- data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +2 -2
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +2 -2
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +10 -4
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +1 -1
- data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +1 -1
- data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +4 -4
- data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +1 -1
- data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +1 -1
- data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +1 -1
- data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +4 -3
- data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +1 -1
- data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +1 -1
- data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +2 -2
- data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +1 -1
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +1 -1
- data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +8 -8
- data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +2 -2
- data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +4 -4
- data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +3 -3
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +1 -1
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +4 -4
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +4 -3
- data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +1 -1
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +2 -2
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +1 -1
- data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +3 -3
- data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +4 -4
- data/maps/bgnpcgn-per-Arab-Latn-1958.imp +19 -19
- data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +15 -15
- data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +15 -15
- data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +16 -16
- data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +2 -2
- data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +5 -5
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +1 -1
- data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +1 -1
- data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +5 -3
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +1 -1
- data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +1 -1
- data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +1 -1
- data/maps/bgnpcgn-tir-Ethi-Latn-2007.imp +511 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +1 -1
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +1 -1
- data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +15 -15
- data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +3 -3
- data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +1 -1
- data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +1 -1
- data/maps/by-bel-Cyrl-Latn-2007.imp +7 -5
- data/maps/dos-nep-Deva-Latn-1997.imp +2 -2
- data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +1 -1
- data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +1 -1
- data/maps/ggg-kat-Geor-Latn-2002.imp +3 -3
- data/maps/gki-bel-Cyrl-Latn-2000.imp +1 -1
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +1 -1
- data/maps/iso-ara-Arab-Latn-233-1984.imp +14 -14
- data/maps/iso-ben-Beng-Latn-15919-2001.imp +1 -1
- data/maps/iso-prs-Arab-Latn-233-3-1999.imp +14 -14
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +5 -5
- data/maps/mext-jpn-Hrkt-Latn-1954.imp +2 -1
- data/maps/moct-kor-Hang-Latn-2000.imp +1 -1
- data/maps/mofa-jpn-Hrkt-Latn-1989.imp +1 -1
- data/maps/mv-div-Thaa-Latn-1987.imp +1 -1
- data/maps/mvd-bel-Cyrl-Latn-2008.imp +5 -5
- data/maps/mvd-bel-Cyrl-Latn-2010.imp +2 -5
- data/maps/mvd-rus-Cyrl-Latn-2008.imp +4 -3
- data/maps/mvd-rus-Cyrl-Latn-2010.imp +2 -5
- data/maps/odni-ara-Arab-Latn-2004.imp +1 -1
- data/maps/odni-ara-Arab-Latn-2015.imp +1 -1
- data/maps/odni-aze-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-bel-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-bul-Cyrl-Latn-2005.imp +2 -2
- data/maps/odni-bul-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-che-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-fas-Arab-Latn-2004.imp +14 -14
- data/maps/odni-fas-Arab-Latn-2015.imp +15 -15
- data/maps/odni-hin-Deva-Latn-2004.imp +20 -20
- data/maps/odni-hin-Deva-Latn-2015.imp +25 -26
- data/maps/odni-kat-Geor-Latn-2015.imp +2 -3
- data/maps/odni-kaz-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-kir-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-kor-Hang-Latn-2015.imp +1 -1
- data/maps/odni-mkd-Cyrl-Latn-2005.imp +1 -1
- data/maps/odni-mkd-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-prs-Arab-Latn-2015.imp +1 -1
- data/maps/odni-pus-Arab-Latn-2011.imp +1 -1
- data/maps/odni-rus-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-srp-Cyrl-Latn-2005.imp +2 -2
- data/maps/odni-srp-Cyrl-Latn-2015.imp +8 -8
- data/maps/odni-tat-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-tgk-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-tuk-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-uig-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-ukr-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-urd-Arab-Latn-2015.imp +21 -21
- data/maps/odni-uzb-Cyrl-Latn-2015.imp +1 -1
- data/maps/ses-ara-Arab-Latn-1930.imp +14 -14
- data/maps/un-amh-Ethi-Latn-2016.imp +1 -1
- data/maps/un-ara-Arab-Latn-1971.imp +5 -5
- data/maps/un-ara-Arab-Latn-1972.imp +4 -4
- data/maps/un-ara-Arab-Latn-2017.imp +15 -15
- data/maps/un-asm-Beng-Latn-1972.imp +1 -1
- data/maps/un-bel-Cyrl-Latn-2007.imp +2 -2
- data/maps/un-ben-Beng-Latn-2016.imp +1 -1
- data/maps/un-bul-Cyrl-Latn-1977.imp +197 -0
- data/maps/un-ell-Grek-Latn-1987-phonetic.imp +5 -1
- data/maps/un-ell-Grek-Latn-1987-tl.imp +1 -1
- data/maps/un-ell-Grek-Latn-1987-ts.imp +2 -2
- data/maps/un-guj-Gujr-Latn-1972.imp +1 -1
- data/maps/un-hin-Deva-Latn-2016.imp +1 -1
- data/maps/un-kan-Kana-Latn-2016.imp +1 -1
- data/maps/un-mal-Mlym-Latn-1972.imp +1 -1
- data/maps/un-mar-Deva-Latn-2016.imp +1 -1
- data/maps/un-mkd-Cyrl-Latn-1977.imp +119 -0
- data/maps/un-mon-Mong-Latn-general-2013.imp +1 -1
- data/maps/un-mon-Mong-Latn-phonetic-2013.imp +1 -1
- data/maps/un-nep-Deva-Latn-1972.imp +1 -1
- data/maps/un-nep-Deva-Latn-2013.imp +1 -1
- data/maps/un-ori-Orya-Latn-1972.imp +1 -1
- data/maps/un-pan-Guru-Latn-1972.imp +1 -1
- data/maps/un-prs-Arab-Latn-1967.imp +15 -15
- data/maps/un-rus-Cyrl-Latn-1987.imp +1 -1
- data/maps/un-sin-Sinh-Latn-1972.imp +1 -1
- data/maps/un-srp-Cyrl-Latn-1997.imp +47 -0
- data/maps/un-tam-Taml-Latn-1972.imp +1 -1
- data/maps/un-tel-Telu-Latn-1972.imp +1 -1
- data/maps/un-ukr-Cyrl-Latn-1998.imp +1 -1
- data/maps/un-ukr-Cyrl-Latn-2012.imp +1 -1
- data/maps/un-urd-Arab-Latn-1972.imp +15 -15
- data/maps/var-amh-Ethi-Latn-eae-2003.imp +48 -43
- metadata +7 -1
|
@@ -4,8 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:kat
|
|
5
5
|
source_script: Geor
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
8
|
-
|
|
7
|
+
name: Romanization of Georgian Personal Names (2015), ICS 630-01 Annex E
|
|
9
8
|
# url:
|
|
10
9
|
source: ICS 630-01, Annex E
|
|
11
10
|
creation_date: 2015
|
|
@@ -16,7 +15,7 @@ metadata {
|
|
|
16
15
|
eliminate variations of a name that can contribute forensic information. Rather, it is to provide an
|
|
17
16
|
IC standard Romanized (English) transliteration from Georgian that can then be linked to forensic
|
|
18
17
|
information in ways that will help identify the referent of the name.
|
|
19
|
-
|
|
18
|
+
|
|
20
19
|
notes:
|
|
21
20
|
}
|
|
22
21
|
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:kaz
|
|
5
5
|
source_script: Cyrl
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization of Kazakh Personal Names (2015)
|
|
8
8
|
source: ICS-630-01 Annex Q
|
|
9
9
|
creation_date: 2015
|
|
10
10
|
confirmation_date: 2015
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:kir
|
|
5
5
|
source_script: Cyrl
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization of Kyrgyz Personal Names (2015)
|
|
8
8
|
source: ICS-630-01 Annex R
|
|
9
9
|
creation_date: 2015
|
|
10
10
|
confirmation_date: 2015
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:kor
|
|
5
5
|
source_script: Hang
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization of Korean Personal Names (2015), ICS-630-01 Annex W
|
|
8
8
|
url:
|
|
9
9
|
creation_date: 2015
|
|
10
10
|
adoption_date:
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:mkd
|
|
5
5
|
source_script: Cyrl
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Intelligence Community (IC) Standard for the Transliteration of Macedonian Personal Names (2005)
|
|
8
8
|
creation_date: 2005
|
|
9
9
|
confirmation_date: 2005
|
|
10
10
|
description: |
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:mkd
|
|
5
5
|
source_script: Cyrl
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization of Macedonian Personal Names (2015)
|
|
8
8
|
source: ICS-630-01 Annex H
|
|
9
9
|
creation_date: 2015
|
|
10
10
|
confirmation_date: 2015
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-3:prs
|
|
5
5
|
source_script: Arab
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization of Persian Farsi Dari Personal Names (2015), ICS-630-01 Annex J
|
|
8
8
|
url: https://github.com/interscript/ics-630-01/blob/master/reference-docs/ANNEX%20J%20-%20Persian-Farsi_Dari_Personal_Names_FLTS_2018_Revision%20(U).pdf
|
|
9
9
|
creation_date: 2015
|
|
10
10
|
confirmation_date: 2015-11
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-3:prs
|
|
5
5
|
source_script: Arab
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization of Pashto Personal Names (2011)
|
|
8
8
|
url: https://github.com/interscript/interscript-private-references/blob/master/odni/Pashto%20June%202011.pdf
|
|
9
9
|
creation_date: 2011
|
|
10
10
|
confirmation_date: 2011-06
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:rus
|
|
5
5
|
source_script: Cyrl
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization of Russian Personal Names (2015), ICS-630-01 Annex K
|
|
8
8
|
|
|
9
9
|
# url:
|
|
10
10
|
source: ICS-630-01 Annex K
|
|
@@ -4,12 +4,12 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:srp
|
|
5
5
|
source_script: Cyrl
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Intelligence Community (IC) Standard for the Transliteration of Serbian Personal Names (2004)
|
|
8
8
|
creation_date: 2005
|
|
9
9
|
confirmation_date: 2005
|
|
10
10
|
description: |
|
|
11
11
|
Office of the Director Of National Intelligence Serbian Personal Names 2004 System
|
|
12
|
-
|
|
12
|
+
|
|
13
13
|
notes:
|
|
14
14
|
}
|
|
15
15
|
|
|
@@ -4,8 +4,8 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:srp
|
|
5
5
|
source_script: Cyrl
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
8
|
-
|
|
7
|
+
name: Romanization of Serbian Personal Names (2015), ICS-630-01 Annex L
|
|
8
|
+
|
|
9
9
|
# url:
|
|
10
10
|
source: ICS-630-01 Annex L
|
|
11
11
|
creation_date: 2015
|
|
@@ -16,27 +16,27 @@ metadata {
|
|
|
16
16
|
is not intended to eliminate variations of a name that can contribute forensic information. Rather,
|
|
17
17
|
it is to provide an IC standard Romanized (English) transliteration from Serbian that can then be
|
|
18
18
|
linked to forensic information in ways that will help identify the referent of the name.
|
|
19
|
-
|
|
19
|
+
|
|
20
20
|
In cases where an individual’s name has already been transliterated in a variant spelling, the IC
|
|
21
21
|
Standard spelling should appear first, followed by the variant spelling(s) in parentheses at the first
|
|
22
22
|
usage. In addition, if the original Cyrillic spelling is known, that spelling should also appear in
|
|
23
23
|
parentheses following the name, if possible, following best practices of the issuing organization
|
|
24
24
|
and taking into consideration information system capabilities. This convention is designed to
|
|
25
25
|
ensure that vital forensic information is not lost.
|
|
26
|
-
|
|
26
|
+
|
|
27
27
|
For names of persons who are known to not be part of the Serbian-speaking community, use the
|
|
28
28
|
relevant IC transliteration standard for names from that language (e.g., Mikhail, Yitzhak). A
|
|
29
29
|
translator’s note may be used to clarify the known origin of the person. Spell names of
|
|
30
30
|
individuals from languages that are written in Roman letters as they are spelled in those
|
|
31
31
|
languages (e.g., George Clooney, Jorge Garcia, Georges Pompidou).
|
|
32
|
-
|
|
32
|
+
|
|
33
33
|
In the case of active senior government officials in the on-line CIA World Factbook and the online directory of Chiefs of State and Cabinet Members of Foreign Governments, the spellings
|
|
34
34
|
given in these on-line reference works should be used in place of the IC Standard. For any
|
|
35
35
|
individual who has at one time been listed in the Factbook or Chiefs of State directory but who no
|
|
36
36
|
longer appears in those resources (i.e. is no longer a government official), the IC Standard
|
|
37
37
|
spelling should appear first, with the spelling, if known, as it previously appeared in those
|
|
38
38
|
resources listed within parentheses at the first usage.
|
|
39
|
-
|
|
39
|
+
|
|
40
40
|
The primary goal is to produce a consistent Romanized transcription of names that is specifically
|
|
41
41
|
readable to the English-speaking non-specialist. The system uses the 26 letters of the standard
|
|
42
42
|
(English) Roman alphabet. Some ambiguities in the Romanized form will occur without the use
|
|
@@ -44,7 +44,7 @@ metadata {
|
|
|
44
44
|
individual is provided, the referent will be clearly identified. This system will be used in
|
|
45
45
|
conjunction with on-line tools, name dictionaries, and lists containing conventional spellings of
|
|
46
46
|
names of well-known individuals.
|
|
47
|
-
|
|
47
|
+
|
|
48
48
|
notes:
|
|
49
49
|
}
|
|
50
50
|
|
|
@@ -93,7 +93,7 @@ stage {
|
|
|
93
93
|
sub "\u0427", "C" # Ч
|
|
94
94
|
sub "\u040F", "Dz" # Џ
|
|
95
95
|
sub "\u0428", "S" # Ш
|
|
96
|
-
|
|
96
|
+
|
|
97
97
|
sub "\u0430", "a" # а
|
|
98
98
|
sub "\u0431", "b" # б
|
|
99
99
|
sub "\u0432", "v" # в
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:tat
|
|
5
5
|
source_script: Cyrl
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization of Tatar Personal Names (2015)
|
|
8
8
|
source: ICS-630-01 Annex S
|
|
9
9
|
creation_date: 2015
|
|
10
10
|
confirmation_date: 2015
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:tgk
|
|
5
5
|
source_script: Cyrl
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization of Tajik Personal Names (2015)
|
|
8
8
|
source: ICS-630-01 Annex N
|
|
9
9
|
creation_date: 2015
|
|
10
10
|
confirmation_date: 2015
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:tuk
|
|
5
5
|
source_script: Cyrl
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization of Turkmen Personal Names (2015)
|
|
8
8
|
url: https://github.com/interscript/ics-630-01/blob/master/reference-docs/ANNEX%20T%20-%20Turkmen_Personal_Names_FLTS%20(U).pdf
|
|
9
9
|
source: ICS-630-01 Annex T
|
|
10
10
|
creation_date: 2015
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:uig
|
|
5
5
|
source_script: Cyrl
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization of Uyghur Personal Names (2015)
|
|
8
8
|
source: ICS-630-01 Annex U
|
|
9
9
|
creation_date: 2015
|
|
10
10
|
confirmation_date: 2015
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:ukr
|
|
5
5
|
source_script: Cyrl
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization of Ukrainian Personal Names (2015), ICS 630-01 Annex M
|
|
8
8
|
|
|
9
9
|
# url:
|
|
10
10
|
source: ICS 630-01, Annex M
|
|
@@ -4,8 +4,8 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:urd
|
|
5
5
|
source_script: Arab
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
8
|
-
|
|
7
|
+
name: Romanization of Hindi and Urdu Personal Names (2015), ICS-630-01 Annex F
|
|
8
|
+
|
|
9
9
|
#url:
|
|
10
10
|
creation_date: 2015
|
|
11
11
|
confirmation_date: 2015
|
|
@@ -16,7 +16,7 @@ metadata {
|
|
|
16
16
|
forensic information. Rather, it is to provide an IC standard Romanized (English)
|
|
17
17
|
transliteration from standard Hindi and Urdu that can then be linked to forensic
|
|
18
18
|
information in ways that will help identify the referent of the name.
|
|
19
|
-
|
|
19
|
+
|
|
20
20
|
There are typically a number of ways that names can be Romanized from either
|
|
21
21
|
Devanagari (Hindi) or modified Arabic (Urdu) scripts. Ambiguities can result from the
|
|
22
22
|
Romanization of Hindi and Urdu names for several reasons, including the fact that some
|
|
@@ -31,7 +31,7 @@ metadata {
|
|
|
31
31
|
And, as in the Arabic source, names containing the Arabic definite article ‘al’ (‘ul’) show
|
|
32
32
|
anticipatory assimilation in pronunciation (e.g., Shams al Din > Shamsuddin);
|
|
33
33
|
transliterations may either reflect spelling or pronunciation in such cases.
|
|
34
|
-
|
|
34
|
+
|
|
35
35
|
Because Hindi and Urdu overlap so extensively, it is desirable to correlate Hindi and
|
|
36
36
|
Urdu transliterations as much as possible. In the area of names, this can become
|
|
37
37
|
problematic when the Urdu spelling accurately reflects original Arabic spelling while the
|
|
@@ -40,7 +40,7 @@ metadata {
|
|
|
40
40
|
either Urdu or Hindi (e.g., letter sin versus letter sad) while maintaining Arabic/Urdu
|
|
41
41
|
spelling distinctions like Hindi also maintains (e.g., qaf as in Qutubbin versus kaf)).
|
|
42
42
|
However, this is not always possible (see Hindi va versus Urdu wau).
|
|
43
|
-
|
|
43
|
+
|
|
44
44
|
In cases where an individual’s name has already been transliterated, that is to be indicated
|
|
45
45
|
– as found – in parentheses immediately following its rendition in the transliteration
|
|
46
46
|
standard (e.g., Muhammad Khulud (Mohamed Khulood)). In addition, if the original
|
|
@@ -48,14 +48,14 @@ metadata {
|
|
|
48
48
|
parentheses following the name, if possible, following best practices of the issuing
|
|
49
49
|
organization and taking into consideration information system capabilities. This
|
|
50
50
|
convention is designed to ensure that vital forensic information is not lost.
|
|
51
|
-
|
|
51
|
+
|
|
52
52
|
For names of persons who are known to not be part of the Hindi- or Urdu-speaking
|
|
53
53
|
community, use the relevant IC transliteration standard for names from that language
|
|
54
54
|
(e.g., Mikhail, Yitzhak). A translator’s note may be used to clarify the known origin of
|
|
55
55
|
the person. Spell names of individuals from languages that are written in Roman letters as
|
|
56
56
|
they are spelled in those languages (e.g., George Clooney, Jorge Garcia, Georges
|
|
57
57
|
Pompidou).
|
|
58
|
-
|
|
58
|
+
|
|
59
59
|
In the case of active senior government officials in the on-line CIA World Factbook and
|
|
60
60
|
the on-line directory of Chiefs of State and Cabinet Members of Foreign Governments,
|
|
61
61
|
the spellings given in these on-line reference works should be used in place of the IC
|
|
@@ -64,7 +64,7 @@ metadata {
|
|
|
64
64
|
government official), the IC Standard spelling should appear first, with the spelling, if
|
|
65
65
|
known, as it previously appeared in those resources listed within parentheses at the first
|
|
66
66
|
usage.
|
|
67
|
-
|
|
67
|
+
|
|
68
68
|
The primary goal of this system is to produce a consistent Romanized transcription of the
|
|
69
69
|
name that is readable to the non-specialist. The system uses the 26 letters of the standard
|
|
70
70
|
(English) Roman alphabet. Some ambiguities in the Romanized form will occur without
|
|
@@ -72,16 +72,16 @@ metadata {
|
|
|
72
72
|
information about the individual is provided, the referent will be clearly identified.
|
|
73
73
|
Additionally, this system will be used in conjunction with on-line tools, name dictionaries
|
|
74
74
|
and lists containing conventional spellings of names of well-known individuals.
|
|
75
|
-
|
|
75
|
+
|
|
76
76
|
notes:
|
|
77
|
-
|
|
77
|
+
|
|
78
78
|
- |
|
|
79
79
|
Long/Short Vowels: Long and short vowels are not distinguished in the system:
|
|
80
80
|
The borrowed Arabic name Samir could represent two distinct names, one with a
|
|
81
81
|
long /a/ (Saamir) and one with a long /i/ (Samiir). One solution would be to use
|
|
82
82
|
/ee/ to stand for the long /i/, as is often done (Sameer). The IC Standard will not
|
|
83
83
|
distinguish between these.
|
|
84
|
-
|
|
84
|
+
|
|
85
85
|
- |
|
|
86
86
|
No distinction is made between: retroflex and non-retroflex consonants; and
|
|
87
87
|
nasalized vowels and vowels followed by /n/.
|
|
@@ -150,8 +150,8 @@ stage {
|
|
|
150
150
|
|
|
151
151
|
# CHARACTERS
|
|
152
152
|
parallel {
|
|
153
|
-
|
|
154
|
-
|
|
153
|
+
|
|
154
|
+
|
|
155
155
|
sub "\u0622", "a" # ARABIC ALEF W/MADDA ABOVE
|
|
156
156
|
sub "\u0627", "a" # or u ARABIC ALEF
|
|
157
157
|
sub "\u06cc", "i" # or ai or u ARABIC LETTER FARSI YEH
|
|
@@ -170,9 +170,9 @@ stage {
|
|
|
170
170
|
sub "\u06c2", "-e" # ARABIC LETTER HEH GOAL WITH HAMZA ABOVE
|
|
171
171
|
sub "\u06c1\u0650", "o" # ARABIC LETTER HEH GOAL + ARABIC KASRA
|
|
172
172
|
sub "\u0624", "au" # ARABIC LETTER WAW WITH HAMZA ABOVE
|
|
173
|
-
|
|
174
|
-
|
|
175
|
-
|
|
173
|
+
|
|
174
|
+
|
|
175
|
+
|
|
176
176
|
sub "\u06a9", "k" # ARABIC LETTER KEHEH
|
|
177
177
|
sub "\u0642", "q" # ARABIC LETTER QAF
|
|
178
178
|
sub "\u062e", "kh" # ARABIC LETTER KHAH
|
|
@@ -180,14 +180,14 @@ stage {
|
|
|
180
180
|
sub "\u063a", "gh" # ARABIC LETTER GHAIN
|
|
181
181
|
sub "\u0686", "ch" # ARABIC LETTER TCHEH
|
|
182
182
|
sub "\u062c", "j" # Arabic Letter Jeem
|
|
183
|
-
|
|
183
|
+
|
|
184
184
|
sub "\u0632", "z" # Arabic Letter ZAIN
|
|
185
185
|
sub "\u0630", "z" # Arabic Letter THAL
|
|
186
186
|
sub "\u0636", "z" # Arabic Letter DAD
|
|
187
187
|
sub "\u0638", "z" # Arabic Letter ZAH
|
|
188
188
|
sub "\u0698", "zh" # Arabic Letter JEH
|
|
189
|
-
|
|
190
|
-
|
|
189
|
+
|
|
190
|
+
|
|
191
191
|
sub "\u0679", "t" # ARABIC LETTER TTEH
|
|
192
192
|
sub "\u0688", "d" # Arabic Letter DDAL
|
|
193
193
|
sub "\u062f", "d" # Arabic Letter DAL
|
|
@@ -196,8 +196,8 @@ stage {
|
|
|
196
196
|
sub "\u0637", "t" # Arabic Letter TAH
|
|
197
197
|
sub "\u0646", "n" # Arabic Letter NOON
|
|
198
198
|
sub "\u06ba", "n" # Arabic Letter NOON GHUNNA
|
|
199
|
-
|
|
200
|
-
|
|
199
|
+
|
|
200
|
+
|
|
201
201
|
sub "\u067e", "p" # Arabic Letter PE
|
|
202
202
|
sub "\u0641", "f" # Arabic Letter FEH
|
|
203
203
|
sub "\u0628", "b" # Arabic Letter BEH
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:uzb
|
|
5
5
|
source_script: Cyrl
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization of Uzbek Personal Names (2015), ICS-630-01 Annex V
|
|
8
8
|
|
|
9
9
|
# url:
|
|
10
10
|
source: ICS-630-01 Annex V
|
|
@@ -129,20 +129,20 @@ stage {
|
|
|
129
129
|
|
|
130
130
|
|
|
131
131
|
# Sun letters
|
|
132
|
-
sub boundary + "\u0627\u0644\u062a", "el-t" # الت
|
|
133
|
-
sub boundary + "\u0627\u0644\u062b", any(["el-th", "el-t"]) # الث
|
|
134
|
-
sub boundary + "\u0627\u0644\u062f", "el-d" # الد
|
|
135
|
-
sub boundary + "\u0627\u0644\u0630", any(["el-dh", "el-z"]) # الذ
|
|
136
|
-
sub boundary + "\u0627\u0644\u0631", "el-r" # الر
|
|
137
|
-
sub boundary + "\u0627\u0644\u0632", "el-z" # الز
|
|
138
|
-
sub boundary + "\u0627\u0644\u0633", any(["el-s", "el-c"]) # الس
|
|
139
|
-
sub boundary + "\u0627\u0644\u0634", "el-sh" # الش
|
|
140
|
-
sub boundary + "\u0627\u0644\u0635", "el-ṣ" # الص
|
|
141
|
-
sub boundary + "\u0627\u0644\u0636", "el-ḍ" # الض
|
|
142
|
-
sub boundary + "\u0627\u0644\u0637", "el-ṭ" # الط
|
|
143
|
-
sub boundary + "\u0627\u0644\u0638", any(["el-ẓ", "el-d"]) # الظ
|
|
144
|
-
sub boundary + "\u0627\u0644\u0644", "el-l" # الل
|
|
145
|
-
sub boundary + "\u0627\u0644\u0646", "el-n" # الن
|
|
132
|
+
sub boundary + "\u0627\u0644\u062a" + maybe("\u0651"), "el-t" # الت
|
|
133
|
+
sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), any(["el-th", "el-t"]) # الث
|
|
134
|
+
sub boundary + "\u0627\u0644\u062f" + maybe("\u0651"), "el-d" # الد
|
|
135
|
+
sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), any(["el-dh", "el-z"]) # الذ
|
|
136
|
+
sub boundary + "\u0627\u0644\u0631" + maybe("\u0651"), "el-r" # الر
|
|
137
|
+
sub boundary + "\u0627\u0644\u0632" + maybe("\u0651"), "el-z" # الز
|
|
138
|
+
sub boundary + "\u0627\u0644\u0633" + maybe("\u0651"), any(["el-s", "el-c"]) # الس
|
|
139
|
+
sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "el-sh" # الش
|
|
140
|
+
sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "el-ṣ" # الص
|
|
141
|
+
sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "el-ḍ" # الض
|
|
142
|
+
sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "el-ṭ" # الط
|
|
143
|
+
sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), any(["el-ẓ", "el-d"]) # الظ
|
|
144
|
+
sub boundary + "\u0627\u0644\u0644" + maybe("\u0651"), "el-l" # الل
|
|
145
|
+
sub boundary + "\u0627\u0644\u0646" + maybe("\u0651"), "el-n" # الن
|
|
146
146
|
|
|
147
147
|
|
|
148
148
|
# shadda
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:amh
|
|
5
5
|
source_script: Ethi
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization of Amharic -- UNGEGN (2016)
|
|
8
8
|
url: http://www.eki.ee/wgrs/rom1_am.pdf
|
|
9
9
|
creation_date: 1967
|
|
10
10
|
confirmation_date: 2016-03
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:ara
|
|
5
5
|
source_script: Arab
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization of Arabic -- Beirut system (1971)
|
|
8
8
|
url: https://unstats.un.org/unsd/geoinfo/UNGEGN/docs/2nd-uncsgn-docs/E_Conf61_4_Add1_e.pdf
|
|
9
9
|
creation_date: 1971
|
|
10
10
|
confirmation_date: 2018-06
|
|
@@ -85,10 +85,10 @@ stage {
|
|
|
85
85
|
parallel {
|
|
86
86
|
|
|
87
87
|
# sun letters
|
|
88
|
-
sub boundary + "\u0627\u0644\u062b", "at͟h t͟h" # الث
|
|
89
|
-
sub boundary + "\u0627\u0644\u0630", "ad͟h d͟h" # الذ
|
|
90
|
-
sub boundary + "\u0627\u0644\u0634", "as͟h s͟h" # الش
|
|
91
|
-
sub boundary + "\u0627\u0644\u0638", "az͟h z͟h" # الظ
|
|
88
|
+
sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), "at͟h t͟h" # الث
|
|
89
|
+
sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), "ad͟h d͟h" # الذ
|
|
90
|
+
sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "as͟h s͟h" # الش
|
|
91
|
+
sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), "az͟h z͟h" # الظ
|
|
92
92
|
|
|
93
93
|
# shadda
|
|
94
94
|
sub "\u062e\u0651", "k͟hk͟h" # خ
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:ara
|
|
5
5
|
source_script: Arab
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization of Arabic -- UNGEGN (1972)
|
|
8
8
|
url: http://www.eki.ee/wgrs/obs_rom_vers/rom1_ar_v4_0.pdf
|
|
9
9
|
creation_date: 1972
|
|
10
10
|
confirmation_date: 2018-06
|
|
@@ -107,9 +107,9 @@ stage {
|
|
|
107
107
|
# CHARACTERS
|
|
108
108
|
parallel {
|
|
109
109
|
|
|
110
|
-
sub boundary + "\u0627\u0644\u0635", "aş ş" # الص
|
|
111
|
-
sub boundary + "\u0627\u0644\u0636", "aḑ ḑ" # الض
|
|
112
|
-
sub boundary + "\u0627\u0644\u0637", "aţ ţ" # الط
|
|
110
|
+
sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "aş ş" # الص
|
|
111
|
+
sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "aḑ ḑ" # الض
|
|
112
|
+
sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "aţ ţ" # الط
|
|
113
113
|
|
|
114
114
|
sub "\u062d\u0651", "ḩḩ" # ح
|
|
115
115
|
sub "\u0635\u0651", "şş" # ص
|