interscript-maps 2.2.0 → 2.2.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/interscript-maps.gemspec +1 -1
- data/interscript-maps.yaml +300 -111
- data/maps/acadsin-zho-Hani-Latn-2002.imp +2 -2
- data/maps/alalc-amh-Ethi-Latn-1997.imp +18 -14
- data/maps/alalc-amh-Ethi-Latn-2011.imp +1 -1
- data/maps/alalc-ara-Arab-Latn-1997.imp +1 -1
- data/maps/alalc-asm-Deva-Latn-1997.imp +1 -1
- data/maps/alalc-asm-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-aze-Arab-Latn-1997.imp +1 -1
- data/maps/alalc-aze-Cyrl-Latn-1997.imp +1 -1
- data/maps/alalc-bel-Cyrl-Latn-1997.imp +4 -4
- data/maps/alalc-ben-Beng-Latn-1997.imp +1 -1
- data/maps/alalc-ben-Beng-Latn-2017.imp +1 -1
- data/maps/alalc-bul-Cyrl-Latn-1997.imp +1 -1
- data/maps/alalc-div-Thaa-Latn-1997.imp +1 -1
- data/maps/alalc-ell-Grek-Latn-1997.imp +1 -1
- data/maps/alalc-ell-Grek-Latn-2010.imp +1 -1
- data/maps/alalc-guj-Gujr-Latn-1997.imp +1 -1
- data/maps/alalc-guj-Gujr-Latn-2011.imp +1 -1
- data/maps/alalc-hin-Deva-Latn-1997.imp +1 -1
- data/maps/alalc-hin-Deva-Latn-2011.imp +1 -1
- data/maps/alalc-kan-Kana-Latn-1997.imp +1 -1
- data/maps/alalc-kan-Kana-Latn-2011.imp +1 -1
- data/maps/alalc-kat-Geok-Latn-1997.imp +3 -3
- data/maps/alalc-kat-Geor-Latn-1997.imp +12 -12
- data/maps/alalc-kor-Hang-Latn-1997.imp +1 -1
- data/maps/alalc-mal-Mlym-Latn-1997.imp +1 -1
- data/maps/alalc-mar-Deva-Latn-1997.imp +1 -1
- data/maps/alalc-mar-Deva-Latn-2011.imp +1 -1
- data/maps/alalc-mkd-Cyrl-Latn-1997.imp +2 -2
- data/maps/alalc-mkd-Cyrl-Latn-2013.imp +2 -2
- data/maps/alalc-mon-Cyrl-Latn-1997.imp +3 -3
- data/maps/alalc-ori-Orya-Latn-1997.imp +1 -1
- data/maps/alalc-ori-Orya-Latn-2011.imp +1 -1
- data/maps/alalc-pan-Guru-Latn-1997.imp +1 -1
- data/maps/alalc-pan-Guru-Latn-2011.imp +1 -1
- data/maps/alalc-per-Arab-Latn-1997.imp +1 -1
- data/maps/alalc-pli-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-pra-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-rus-Cyrl-Latn-1997.imp +2 -2
- data/maps/alalc-rus-Cyrl-Latn-2012.imp +1 -1
- data/maps/alalc-san-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-sin-Sinh-Latn-1997.imp +1 -1
- data/maps/alalc-sin-Sinh-Latn-2011.imp +1 -1
- data/maps/alalc-srp-Cyrl-Latn-1997.imp +2 -2
- data/maps/alalc-srp-Cyrl-Latn-2013.imp +1 -1
- data/maps/alalc-tam-Taml-Latn-1997.imp +1 -1
- data/maps/alalc-tam-Taml-Latn-2011.imp +1 -1
- data/maps/alalc-tel-Telu-Latn-1997.imp +2 -2
- data/maps/alalc-tel-Telu-Latn-2011.imp +1 -1
- data/maps/alalc-tir-Ethi-Latn-1997.imp +429 -0
- data/maps/alalc-tir-Ethi-Latn-2011.imp +85 -0
- data/maps/alalc-ukr-Cyrl-Latn-1997.imp +1 -1
- data/maps/alalc-ukr-Cyrl-Latn-2011.imp +1 -1
- data/maps/apcbg-bul-Cyrl-Latn-1995.imp +7 -4
- data/maps/az-aze-Cyrl-Latn-1939.imp +1 -0
- data/maps/az-aze-Cyrl-Latn-1958.imp +1 -0
- data/maps/bgn-jpn-Hrkt-Latn-1962.imp +5 -5
- data/maps/bgn-kor-Hang-Latn-1943.imp +1 -1
- data/maps/bgn-kor-Kore-Latn-1943.imp +1 -1
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +11 -11
- data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +1 -1
- data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +2 -2
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +2 -2
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +10 -4
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +1 -1
- data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +1 -1
- data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +4 -4
- data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +1 -1
- data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +1 -1
- data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +1 -1
- data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +4 -3
- data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +1 -1
- data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +1 -1
- data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +2 -2
- data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +1 -1
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +1 -1
- data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +8 -8
- data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +2 -2
- data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +4 -4
- data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +3 -3
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +1 -1
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +4 -4
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +4 -3
- data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +1 -1
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +2 -2
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +1 -1
- data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +3 -3
- data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +4 -4
- data/maps/bgnpcgn-per-Arab-Latn-1958.imp +19 -19
- data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +15 -15
- data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +15 -15
- data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +16 -16
- data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +2 -2
- data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +5 -5
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +1 -1
- data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +1 -1
- data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +5 -3
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +1 -1
- data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +1 -1
- data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +1 -1
- data/maps/bgnpcgn-tir-Ethi-Latn-2007.imp +511 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +1 -1
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +1 -1
- data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +15 -15
- data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +3 -3
- data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +1 -1
- data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +1 -1
- data/maps/by-bel-Cyrl-Latn-2007.imp +7 -5
- data/maps/dos-nep-Deva-Latn-1997.imp +2 -2
- data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +1 -1
- data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +1 -1
- data/maps/ggg-kat-Geor-Latn-2002.imp +3 -3
- data/maps/gki-bel-Cyrl-Latn-2000.imp +1 -1
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +1 -1
- data/maps/iso-ara-Arab-Latn-233-1984.imp +14 -14
- data/maps/iso-ben-Beng-Latn-15919-2001.imp +1 -1
- data/maps/iso-prs-Arab-Latn-233-3-1999.imp +14 -14
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +5 -5
- data/maps/mext-jpn-Hrkt-Latn-1954.imp +2 -1
- data/maps/moct-kor-Hang-Latn-2000.imp +1 -1
- data/maps/mofa-jpn-Hrkt-Latn-1989.imp +1 -1
- data/maps/mv-div-Thaa-Latn-1987.imp +1 -1
- data/maps/mvd-bel-Cyrl-Latn-2008.imp +5 -5
- data/maps/mvd-bel-Cyrl-Latn-2010.imp +2 -5
- data/maps/mvd-rus-Cyrl-Latn-2008.imp +4 -3
- data/maps/mvd-rus-Cyrl-Latn-2010.imp +2 -5
- data/maps/odni-ara-Arab-Latn-2004.imp +1 -1
- data/maps/odni-ara-Arab-Latn-2015.imp +1 -1
- data/maps/odni-aze-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-bel-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-bul-Cyrl-Latn-2005.imp +2 -2
- data/maps/odni-bul-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-che-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-fas-Arab-Latn-2004.imp +14 -14
- data/maps/odni-fas-Arab-Latn-2015.imp +15 -15
- data/maps/odni-hin-Deva-Latn-2004.imp +20 -20
- data/maps/odni-hin-Deva-Latn-2015.imp +25 -26
- data/maps/odni-kat-Geor-Latn-2015.imp +2 -3
- data/maps/odni-kaz-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-kir-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-kor-Hang-Latn-2015.imp +1 -1
- data/maps/odni-mkd-Cyrl-Latn-2005.imp +1 -1
- data/maps/odni-mkd-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-prs-Arab-Latn-2015.imp +1 -1
- data/maps/odni-pus-Arab-Latn-2011.imp +1 -1
- data/maps/odni-rus-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-srp-Cyrl-Latn-2005.imp +2 -2
- data/maps/odni-srp-Cyrl-Latn-2015.imp +8 -8
- data/maps/odni-tat-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-tgk-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-tuk-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-uig-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-ukr-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-urd-Arab-Latn-2015.imp +21 -21
- data/maps/odni-uzb-Cyrl-Latn-2015.imp +1 -1
- data/maps/ses-ara-Arab-Latn-1930.imp +14 -14
- data/maps/un-amh-Ethi-Latn-2016.imp +1 -1
- data/maps/un-ara-Arab-Latn-1971.imp +5 -5
- data/maps/un-ara-Arab-Latn-1972.imp +4 -4
- data/maps/un-ara-Arab-Latn-2017.imp +15 -15
- data/maps/un-asm-Beng-Latn-1972.imp +1 -1
- data/maps/un-bel-Cyrl-Latn-2007.imp +2 -2
- data/maps/un-ben-Beng-Latn-2016.imp +1 -1
- data/maps/un-bul-Cyrl-Latn-1977.imp +197 -0
- data/maps/un-ell-Grek-Latn-1987-phonetic.imp +5 -1
- data/maps/un-ell-Grek-Latn-1987-tl.imp +1 -1
- data/maps/un-ell-Grek-Latn-1987-ts.imp +2 -2
- data/maps/un-guj-Gujr-Latn-1972.imp +1 -1
- data/maps/un-hin-Deva-Latn-2016.imp +1 -1
- data/maps/un-kan-Kana-Latn-2016.imp +1 -1
- data/maps/un-mal-Mlym-Latn-1972.imp +1 -1
- data/maps/un-mar-Deva-Latn-2016.imp +1 -1
- data/maps/un-mkd-Cyrl-Latn-1977.imp +119 -0
- data/maps/un-mon-Mong-Latn-general-2013.imp +1 -1
- data/maps/un-mon-Mong-Latn-phonetic-2013.imp +1 -1
- data/maps/un-nep-Deva-Latn-1972.imp +1 -1
- data/maps/un-nep-Deva-Latn-2013.imp +1 -1
- data/maps/un-ori-Orya-Latn-1972.imp +1 -1
- data/maps/un-pan-Guru-Latn-1972.imp +1 -1
- data/maps/un-prs-Arab-Latn-1967.imp +15 -15
- data/maps/un-rus-Cyrl-Latn-1987.imp +1 -1
- data/maps/un-sin-Sinh-Latn-1972.imp +1 -1
- data/maps/un-srp-Cyrl-Latn-1997.imp +47 -0
- data/maps/un-tam-Taml-Latn-1972.imp +1 -1
- data/maps/un-tel-Telu-Latn-1972.imp +1 -1
- data/maps/un-ukr-Cyrl-Latn-1998.imp +1 -1
- data/maps/un-ukr-Cyrl-Latn-2012.imp +1 -1
- data/maps/un-urd-Arab-Latn-1972.imp +15 -15
- data/maps/var-amh-Ethi-Latn-eae-2003.imp +48 -43
- metadata +7 -1
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: ics-630-01:ara
|
|
5
5
|
source_script: Arab
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Intelligence Community (IC) Standard for the Transliteration of Arabic Personal Names (2004)
|
|
8
8
|
url: https://github.com/interscript/interscript-private-references/blob/master/odni/Arabic_IC_Standard.doc
|
|
9
9
|
creation_date: 2004
|
|
10
10
|
confirmation_date: 2004-06
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: ics-630-01:ara
|
|
5
5
|
source_script: Arab
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization of Arabic Personal Names (2015), ICS 630-01 Annex A
|
|
8
8
|
url: https://github.com/interscript/ics-630-01/blob/master/reference-docs/ANNEX%20A%20-%20Arabic_Personal_Names_FLTS%20(U).pdf
|
|
9
9
|
creation_date: 2017
|
|
10
10
|
confirmation_date: 2018-06
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:aze
|
|
5
5
|
source_script: Cyrl
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization of Azeri Personal Names (2015), ICS 630-01 Annex P
|
|
8
8
|
source: ICS-630-01 Annex P
|
|
9
9
|
creation_date: 2015
|
|
10
10
|
confirmation_date: 2015
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:bel
|
|
5
5
|
source_script: Cyrl
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization of Belarusian Personal Names (2015), ICS 630-01 Annex B
|
|
8
8
|
|
|
9
9
|
# url:
|
|
10
10
|
source: ICS 630-01, Annex B
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:bul
|
|
5
5
|
source_script: Cyrl
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name: Intelligence Community (IC) Standard for the Transliteration of Bulgarian Personal Names
|
|
7
|
+
name: Intelligence Community (IC) Standard for the Transliteration of Bulgarian Personal Names (2005)
|
|
8
8
|
creation_date: 2005
|
|
9
9
|
description:
|
|
10
10
|
}
|
|
@@ -53,7 +53,7 @@ stage {
|
|
|
53
53
|
sub "\u042c", "Y"
|
|
54
54
|
sub "\u042e", "Yu"
|
|
55
55
|
sub "\u042f", "Ya"
|
|
56
|
-
|
|
56
|
+
|
|
57
57
|
sub "\u0430", "a"
|
|
58
58
|
sub "\u0431", "b"
|
|
59
59
|
sub "\u0432", "v"
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:bul
|
|
5
5
|
source_script: Cyrl
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization of Bulgarian Personal Names (2015), ICS-630-01 Annex O
|
|
8
8
|
|
|
9
9
|
# url:
|
|
10
10
|
source: ICS-630-01 Annex O
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:che
|
|
5
5
|
source_script: Cyrl
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization of Chechen Cyrillic Personal Names (2015)
|
|
8
8
|
url: https://github.com/interscript/ics-630-01/blob/master/reference-docs/ANNEX%20C%20-%20Chechen_Personal_Names_FLTS%20(U).pdf
|
|
9
9
|
source: ICS-630-01 Annex C
|
|
10
10
|
creation_date: 2015
|
|
@@ -140,20 +140,20 @@ stage {
|
|
|
140
140
|
# '\uFE8E' : '' # ﺎ
|
|
141
141
|
|
|
142
142
|
# Sun letters
|
|
143
|
-
sub boundary + "\u0627\u0644\u062a", "at t" # الت
|
|
144
|
-
sub boundary + "\u0627\u0644\u062b", "as s" # الث
|
|
145
|
-
sub boundary + "\u0627\u0644\u062f", "ad d" # الد
|
|
146
|
-
sub boundary + "\u0627\u0644\u0630", "az z" # الذ
|
|
147
|
-
sub boundary + "\u0627\u0644\u0631", "ar r" # الر
|
|
148
|
-
sub boundary + "\u0627\u0644\u0632", "az z" # الز
|
|
149
|
-
sub boundary + "\u0627\u0644\u0633", "as s" # الس
|
|
150
|
-
sub boundary + "\u0627\u0644\u0634", "ash sh" # الش
|
|
151
|
-
sub boundary + "\u0627\u0644\u0635", "as s" # الص
|
|
152
|
-
sub boundary + "\u0627\u0644\u0636", "az z" # الض
|
|
153
|
-
sub boundary + "\u0627\u0644\u0637", "at t" # الط
|
|
154
|
-
sub boundary + "\u0627\u0644\u0638", "az z" # الظ
|
|
155
|
-
sub boundary + "\u0627\u0644\u0644", "al l" # الل
|
|
156
|
-
sub boundary + "\u0627\u0644\u0646", "an n" # الن
|
|
143
|
+
sub boundary + "\u0627\u0644\u062a" + maybe("\u0651"), "at t" # الت
|
|
144
|
+
sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), "as s" # الث
|
|
145
|
+
sub boundary + "\u0627\u0644\u062f" + maybe("\u0651"), "ad d" # الد
|
|
146
|
+
sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), "az z" # الذ
|
|
147
|
+
sub boundary + "\u0627\u0644\u0631" + maybe("\u0651"), "ar r" # الر
|
|
148
|
+
sub boundary + "\u0627\u0644\u0632" + maybe("\u0651"), "az z" # الز
|
|
149
|
+
sub boundary + "\u0627\u0644\u0633" + maybe("\u0651"), "as s" # الس
|
|
150
|
+
sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "ash sh" # الش
|
|
151
|
+
sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "as s" # الص
|
|
152
|
+
sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "az z" # الض
|
|
153
|
+
sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "at t" # الط
|
|
154
|
+
sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), "az z" # الظ
|
|
155
|
+
sub boundary + "\u0627\u0644\u0644" + maybe("\u0651"), "al l" # الل
|
|
156
|
+
sub boundary + "\u0627\u0644\u0646" + maybe("\u0651"), "an n" # الن
|
|
157
157
|
|
|
158
158
|
# Farsi Vowel (Pointing)
|
|
159
159
|
sub "\u0622", "a" # آ alef maddeh
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:fas
|
|
5
5
|
source_script: Arab
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Romanization of Persian Farsi Dari Personal Names (2015), ICS-630-01 Annex J
|
|
8
8
|
url: https://github.com/interscript/ics-630-01/blob/master/reference-docs/ANNEX%20J%20-%20Persian-Farsi_Dari_Personal_Names_FLTS_2018_Revision%20(U).pdf
|
|
9
9
|
creation_date: 2015
|
|
10
10
|
confirmation_date: 2015-11
|
|
@@ -257,20 +257,20 @@ stage {
|
|
|
257
257
|
# '\uFE8E' : '' # ﺎ
|
|
258
258
|
|
|
259
259
|
# Sun letters
|
|
260
|
-
sub boundary + "\u0627\u0644\u062a", "at t" # الت
|
|
261
|
-
sub boundary + "\u0627\u0644\u062b", "as s" # الث
|
|
262
|
-
sub boundary + "\u0627\u0644\u062f", "ad d" # الد
|
|
263
|
-
sub boundary + "\u0627\u0644\u0630", "az z" # الذ
|
|
264
|
-
sub boundary + "\u0627\u0644\u0631", "ar r" # الر
|
|
265
|
-
sub boundary + "\u0627\u0644\u0632", "az z" # الز
|
|
266
|
-
sub boundary + "\u0627\u0644\u0633", "as s" # الس
|
|
267
|
-
sub boundary + "\u0627\u0644\u0634", "ash sh" # الش
|
|
268
|
-
sub boundary + "\u0627\u0644\u0635", "as s" # الص
|
|
269
|
-
sub boundary + "\u0627\u0644\u0636", "az z" # الض
|
|
270
|
-
sub boundary + "\u0627\u0644\u0637", "at t" # الط
|
|
271
|
-
sub boundary + "\u0627\u0644\u0638", "az z" # الظ
|
|
272
|
-
sub boundary + "\u0627\u0644\u0644", "al l" # الل
|
|
273
|
-
sub boundary + "\u0627\u0644\u0646", "an n" # الن
|
|
260
|
+
sub boundary + "\u0627\u0644\u062a" + maybe("\u0651"), "at t" # الت
|
|
261
|
+
sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), "as s" # الث
|
|
262
|
+
sub boundary + "\u0627\u0644\u062f" + maybe("\u0651"), "ad d" # الد
|
|
263
|
+
sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), "az z" # الذ
|
|
264
|
+
sub boundary + "\u0627\u0644\u0631" + maybe("\u0651"), "ar r" # الر
|
|
265
|
+
sub boundary + "\u0627\u0644\u0632" + maybe("\u0651"), "az z" # الز
|
|
266
|
+
sub boundary + "\u0627\u0644\u0633" + maybe("\u0651"), "as s" # الس
|
|
267
|
+
sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "ash sh" # الش
|
|
268
|
+
sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "as s" # الص
|
|
269
|
+
sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "az z" # الض
|
|
270
|
+
sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "at t" # الط
|
|
271
|
+
sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), "az z" # الظ
|
|
272
|
+
sub boundary + "\u0627\u0644\u0644" + maybe("\u0651"), "al l" # الل
|
|
273
|
+
sub boundary + "\u0627\u0644\u0646" + maybe("\u0651"), "an n" # الن
|
|
274
274
|
|
|
275
275
|
# Farsi Vowel (Pointing)
|
|
276
276
|
sub "\u0622", "a" # آ alef maddeh
|
|
@@ -4,12 +4,12 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:hin
|
|
5
5
|
source_script: Deva
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name: IC
|
|
7
|
+
name: Intelligence Community (IC) Standard for the Transliteration of Hindi and Urdu Personal Names (2004)
|
|
8
8
|
url: https://github.com/interscript/interscript-private-references/blob/master/odni/Hindi_and_Urdu_IC_Standard.doc
|
|
9
9
|
creation_date: 2004
|
|
10
10
|
description: |
|
|
11
11
|
IC STANDARDS FOR TRANSLITERATION OF HINDI AND URDU PERSONAL NAMES
|
|
12
|
-
|
|
12
|
+
|
|
13
13
|
notes:
|
|
14
14
|
- |
|
|
15
15
|
Long/Short Vowels: Long and short vowels are not distinguished in the system:
|
|
@@ -69,7 +69,7 @@ stage {
|
|
|
69
69
|
|
|
70
70
|
# CHARACTERS
|
|
71
71
|
parallel {
|
|
72
|
-
|
|
72
|
+
|
|
73
73
|
#Independent vowel characters
|
|
74
74
|
sub "अ", "a"
|
|
75
75
|
sub "आ", "a"
|
|
@@ -84,7 +84,7 @@ stage {
|
|
|
84
84
|
sub "ओ", "o"
|
|
85
85
|
sub "ऑ", "au"
|
|
86
86
|
sub "औ", "au"
|
|
87
|
-
|
|
87
|
+
|
|
88
88
|
#Dependent Vowels
|
|
89
89
|
sub "ा", "a"
|
|
90
90
|
sub "ि", "i"
|
|
@@ -98,10 +98,10 @@ stage {
|
|
|
98
98
|
sub "ो", "o"
|
|
99
99
|
sub "ौ", "au"
|
|
100
100
|
sub "ॉ", "au"
|
|
101
|
-
|
|
102
|
-
|
|
101
|
+
|
|
102
|
+
|
|
103
103
|
# Consonants
|
|
104
|
-
|
|
104
|
+
|
|
105
105
|
# Gutturals
|
|
106
106
|
sub "क", "k"
|
|
107
107
|
sub "क्ष", "ksha"
|
|
@@ -112,7 +112,7 @@ stage {
|
|
|
112
112
|
sub "ग़", "gh"
|
|
113
113
|
sub "घ", "gh"
|
|
114
114
|
sub "ङ", "n"
|
|
115
|
-
|
|
115
|
+
|
|
116
116
|
# Palatals
|
|
117
117
|
sub "च", "ch"
|
|
118
118
|
sub "छ", "ch"
|
|
@@ -121,7 +121,7 @@ stage {
|
|
|
121
121
|
sub "झ", "gya"
|
|
122
122
|
sub "झ", "jh"
|
|
123
123
|
sub "ञ", "n"
|
|
124
|
-
|
|
124
|
+
|
|
125
125
|
# Cerebrals
|
|
126
126
|
sub "ट", "t"
|
|
127
127
|
sub "ठ", "th"
|
|
@@ -130,14 +130,14 @@ stage {
|
|
|
130
130
|
sub "ढ़", "rh"
|
|
131
131
|
sub "ढ", "dh"
|
|
132
132
|
sub "ण", "n"
|
|
133
|
-
|
|
133
|
+
|
|
134
134
|
# Dentals
|
|
135
135
|
sub "त", "t"
|
|
136
136
|
sub "थ", "th"
|
|
137
137
|
sub "द", "d"
|
|
138
138
|
sub "ध", "dh"
|
|
139
139
|
sub "न", "n"
|
|
140
|
-
|
|
140
|
+
|
|
141
141
|
# Labials
|
|
142
142
|
sub "प", "p"
|
|
143
143
|
sub "फ़", "f"
|
|
@@ -145,34 +145,34 @@ stage {
|
|
|
145
145
|
sub "ब", "b"
|
|
146
146
|
sub "भ", "bh"
|
|
147
147
|
sub "म", "m"
|
|
148
|
-
|
|
148
|
+
|
|
149
149
|
# Semivowels
|
|
150
150
|
sub "य", "y"
|
|
151
151
|
sub "र", "r"
|
|
152
152
|
sub "ल", "l"
|
|
153
153
|
sub "व", "v"
|
|
154
|
-
|
|
154
|
+
|
|
155
155
|
# Sibilants
|
|
156
156
|
sub "श", "sh"
|
|
157
157
|
sub "ष", "sh"
|
|
158
158
|
sub "स", "s"
|
|
159
|
-
|
|
160
|
-
|
|
159
|
+
|
|
160
|
+
|
|
161
161
|
# Aspirate
|
|
162
162
|
sub "ह", "h"
|
|
163
|
-
|
|
163
|
+
|
|
164
164
|
# Anusvāra
|
|
165
165
|
sub "ं", "n"
|
|
166
|
-
|
|
166
|
+
|
|
167
167
|
# Anunāsika
|
|
168
168
|
sub "ँ", "n"
|
|
169
|
-
|
|
169
|
+
|
|
170
170
|
# halanta
|
|
171
171
|
sub "्", ""
|
|
172
|
-
|
|
172
|
+
|
|
173
173
|
# bisharga
|
|
174
174
|
sub "ः", "h"
|
|
175
|
-
|
|
175
|
+
|
|
176
176
|
sub "़", ""
|
|
177
177
|
}
|
|
178
178
|
|
|
@@ -4,8 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:hin
|
|
5
5
|
source_script: Deva
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
8
|
-
|
|
7
|
+
name: Romanization of Hindi Urdu Personal Names (2015), ICS-630-01 Annex F
|
|
9
8
|
#url:
|
|
10
9
|
creation_date: 2015
|
|
11
10
|
confirmation_date: 2015
|
|
@@ -16,7 +15,7 @@ metadata {
|
|
|
16
15
|
forensic information. Rather, it is to provide an IC standard Romanized (English)
|
|
17
16
|
transliteration from standard Hindi and Urdu that can then be linked to forensic
|
|
18
17
|
information in ways that will help identify the referent of the name.
|
|
19
|
-
|
|
18
|
+
|
|
20
19
|
There are typically a number of ways that names can be Romanized from either
|
|
21
20
|
Devanagari (Hindi) or modified Arabic (Urdu) scripts. Ambiguities can result from the
|
|
22
21
|
Romanization of Hindi and Urdu names for several reasons, including the fact that some
|
|
@@ -31,7 +30,7 @@ metadata {
|
|
|
31
30
|
And, as in the Arabic source, names containing the Arabic definite article ‘al’ (‘ul’) show
|
|
32
31
|
anticipatory assimilation in pronunciation (e.g., Shams al Din > Shamsuddin);
|
|
33
32
|
transliterations may either reflect spelling or pronunciation in such cases.
|
|
34
|
-
|
|
33
|
+
|
|
35
34
|
Because Hindi and Urdu overlap so extensively, it is desirable to correlate Hindi and
|
|
36
35
|
Urdu transliterations as much as possible. In the area of names, this can become
|
|
37
36
|
problematic when the Urdu spelling accurately reflects original Arabic spelling while the
|
|
@@ -40,7 +39,7 @@ metadata {
|
|
|
40
39
|
either Urdu or Hindi (e.g., letter sin versus letter sad) while maintaining Arabic/Urdu
|
|
41
40
|
spelling distinctions like Hindi also maintains (e.g., qaf as in Qutubbin versus kaf)).
|
|
42
41
|
However, this is not always possible (see Hindi va versus Urdu wau).
|
|
43
|
-
|
|
42
|
+
|
|
44
43
|
In cases where an individual’s name has already been transliterated, that is to be indicated
|
|
45
44
|
– as found – in parentheses immediately following its rendition in the transliteration
|
|
46
45
|
standard (e.g., Muhammad Khulud (Mohamed Khulood)). In addition, if the original
|
|
@@ -48,14 +47,14 @@ metadata {
|
|
|
48
47
|
parentheses following the name, if possible, following best practices of the issuing
|
|
49
48
|
organization and taking into consideration information system capabilities. This
|
|
50
49
|
convention is designed to ensure that vital forensic information is not lost.
|
|
51
|
-
|
|
50
|
+
|
|
52
51
|
For names of persons who are known to not be part of the Hindi- or Urdu-speaking
|
|
53
52
|
community, use the relevant IC transliteration standard for names from that language
|
|
54
53
|
(e.g., Mikhail, Yitzhak). A translator’s note may be used to clarify the known origin of
|
|
55
54
|
the person. Spell names of individuals from languages that are written in Roman letters as
|
|
56
55
|
they are spelled in those languages (e.g., George Clooney, Jorge Garcia, Georges
|
|
57
56
|
Pompidou).
|
|
58
|
-
|
|
57
|
+
|
|
59
58
|
In the case of active senior government officials in the on-line CIA World Factbook and
|
|
60
59
|
the on-line directory of Chiefs of State and Cabinet Members of Foreign Governments,
|
|
61
60
|
the spellings given in these on-line reference works should be used in place of the IC
|
|
@@ -64,7 +63,7 @@ metadata {
|
|
|
64
63
|
government official), the IC Standard spelling should appear first, with the spelling, if
|
|
65
64
|
known, as it previously appeared in those resources listed within parentheses at the first
|
|
66
65
|
usage.
|
|
67
|
-
|
|
66
|
+
|
|
68
67
|
The primary goal of this system is to produce a consistent Romanized transcription of the
|
|
69
68
|
name that is readable to the non-specialist. The system uses the 26 letters of the standard
|
|
70
69
|
(English) Roman alphabet. Some ambiguities in the Romanized form will occur without
|
|
@@ -72,16 +71,16 @@ metadata {
|
|
|
72
71
|
information about the individual is provided, the referent will be clearly identified.
|
|
73
72
|
Additionally, this system will be used in conjunction with on-line tools, name dictionaries
|
|
74
73
|
and lists containing conventional spellings of names of well-known individuals
|
|
75
|
-
|
|
74
|
+
|
|
76
75
|
notes:
|
|
77
|
-
|
|
76
|
+
|
|
78
77
|
- |
|
|
79
78
|
Long/Short Vowels: Long and short vowels are not distinguished in the system:
|
|
80
79
|
The borrowed Arabic name Samir could represent two distinct names, one with a
|
|
81
80
|
long /a/ (Saamir) and one with a long /i/ (Samiir). One solution would be to use
|
|
82
81
|
/ee/ to stand for the long /i/, as is often done (Sameer). The IC Standard will not
|
|
83
82
|
distinguish between these.
|
|
84
|
-
|
|
83
|
+
|
|
85
84
|
- |
|
|
86
85
|
No distinction is made between: retroflex and non-retroflex consonants; and
|
|
87
86
|
nasalized vowels and vowels followed by /n/.
|
|
@@ -151,9 +150,9 @@ stage {
|
|
|
151
150
|
|
|
152
151
|
# CHARACTERS
|
|
153
152
|
parallel {
|
|
154
|
-
|
|
153
|
+
|
|
155
154
|
# I. Vowels and Diphthongs (see Note 1)
|
|
156
|
-
|
|
155
|
+
|
|
157
156
|
sub "अ", "a"
|
|
158
157
|
sub "आ", "a"
|
|
159
158
|
sub "इ", "i"
|
|
@@ -165,7 +164,7 @@ stage {
|
|
|
165
164
|
sub "ऐ", "ai"
|
|
166
165
|
sub "ऑ", "o"
|
|
167
166
|
sub "ओ", "au"
|
|
168
|
-
|
|
167
|
+
|
|
169
168
|
# II. Consonants (see Note 2)
|
|
170
169
|
# Gutturals
|
|
171
170
|
sub "क", "k"
|
|
@@ -177,7 +176,7 @@ stage {
|
|
|
177
176
|
sub "घ", "gh"
|
|
178
177
|
sub "ग़", "gh"
|
|
179
178
|
sub "ङ", "n"
|
|
180
|
-
|
|
179
|
+
|
|
181
180
|
# Palatals
|
|
182
181
|
sub "च", "ch"
|
|
183
182
|
sub "छ", "ch"
|
|
@@ -185,7 +184,7 @@ stage {
|
|
|
185
184
|
sub "झ", "jh"
|
|
186
185
|
sub "ज़", "z"
|
|
187
186
|
sub "ञ", "n"
|
|
188
|
-
|
|
187
|
+
|
|
189
188
|
# Cerebrals
|
|
190
189
|
sub "ट", "t"
|
|
191
190
|
sub "ठ", "th"
|
|
@@ -194,14 +193,14 @@ stage {
|
|
|
194
193
|
sub "ढ", "dh"
|
|
195
194
|
sub "ढ़", "rh"
|
|
196
195
|
sub "ण", "n"
|
|
197
|
-
|
|
196
|
+
|
|
198
197
|
# Dentals
|
|
199
198
|
sub "त", "t"
|
|
200
199
|
sub "थ", "th"
|
|
201
200
|
sub "द", "d"
|
|
202
201
|
sub "ध", "dh"
|
|
203
202
|
sub "न", "n"
|
|
204
|
-
|
|
203
|
+
|
|
205
204
|
# Labials
|
|
206
205
|
sub "प", "p"
|
|
207
206
|
sub "फ", "ph"
|
|
@@ -209,33 +208,33 @@ stage {
|
|
|
209
208
|
sub "ब", "b"
|
|
210
209
|
sub "भ", "bh"
|
|
211
210
|
sub "म", "m"
|
|
212
|
-
|
|
211
|
+
|
|
213
212
|
# Semivowels
|
|
214
213
|
sub "य", "y"
|
|
215
214
|
sub "र", "r"
|
|
216
215
|
sub "ल", "l"
|
|
217
216
|
sub "व", "v"
|
|
218
|
-
|
|
217
|
+
|
|
219
218
|
# Sibilants
|
|
220
219
|
sub "श", "sh"
|
|
221
220
|
sub "ष", "sh"
|
|
222
221
|
sub "स", "s"
|
|
223
|
-
|
|
222
|
+
|
|
224
223
|
# Aspirate
|
|
225
224
|
sub "ह", "h"
|
|
226
|
-
|
|
225
|
+
|
|
227
226
|
# Anusvāra
|
|
228
227
|
sub "ं", "n"
|
|
229
|
-
|
|
228
|
+
|
|
230
229
|
# Bisarga
|
|
231
230
|
sub "ः ", "h"
|
|
232
|
-
|
|
231
|
+
|
|
233
232
|
# Anunāsika
|
|
234
233
|
sub "ँ", "n"
|
|
235
|
-
|
|
234
|
+
|
|
236
235
|
sub "़", ""
|
|
237
236
|
sub "्", ""
|
|
238
|
-
|
|
237
|
+
|
|
239
238
|
# Medials # Needed for connecting constants
|
|
240
239
|
sub "ा", "a"
|
|
241
240
|
sub "ि", "i"
|