interscript-maps 2.1.0b6 → 2.2.1
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/interscript-maps.gemspec +1 -1
- data/interscript-maps.yaml +300 -111
- data/maps/acadsin-zho-Hani-Latn-2002.imp +2 -2
- data/maps/alalc-amh-Ethi-Latn-1997.imp +18 -14
- data/maps/alalc-amh-Ethi-Latn-2011.imp +1 -1
- data/maps/alalc-ara-Arab-Latn-1997.imp +1 -1
- data/maps/alalc-asm-Deva-Latn-1997.imp +1 -1
- data/maps/alalc-asm-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-aze-Arab-Latn-1997.imp +1 -1
- data/maps/alalc-aze-Cyrl-Latn-1997.imp +1 -1
- data/maps/alalc-bel-Cyrl-Latn-1997.imp +4 -4
- data/maps/alalc-ben-Beng-Latn-1997.imp +1 -1
- data/maps/alalc-ben-Beng-Latn-2017.imp +1 -1
- data/maps/alalc-bul-Cyrl-Latn-1997.imp +1 -1
- data/maps/alalc-div-Thaa-Latn-1997.imp +1 -1
- data/maps/alalc-ell-Grek-Latn-1997.imp +1 -1
- data/maps/alalc-ell-Grek-Latn-2010.imp +1 -1
- data/maps/alalc-guj-Gujr-Latn-1997.imp +1 -1
- data/maps/alalc-guj-Gujr-Latn-2011.imp +1 -1
- data/maps/alalc-hin-Deva-Latn-1997.imp +1 -1
- data/maps/alalc-hin-Deva-Latn-2011.imp +1 -1
- data/maps/alalc-kan-Kana-Latn-1997.imp +1 -1
- data/maps/alalc-kan-Kana-Latn-2011.imp +1 -1
- data/maps/alalc-kat-Geok-Latn-1997.imp +3 -3
- data/maps/alalc-kat-Geor-Latn-1997.imp +12 -12
- data/maps/alalc-kor-Hang-Latn-1997.imp +1 -1
- data/maps/alalc-mal-Mlym-Latn-1997.imp +1 -1
- data/maps/alalc-mar-Deva-Latn-1997.imp +1 -1
- data/maps/alalc-mar-Deva-Latn-2011.imp +1 -1
- data/maps/alalc-mkd-Cyrl-Latn-1997.imp +2 -2
- data/maps/alalc-mkd-Cyrl-Latn-2013.imp +2 -2
- data/maps/alalc-mon-Cyrl-Latn-1997.imp +3 -3
- data/maps/alalc-ori-Orya-Latn-1997.imp +1 -1
- data/maps/alalc-ori-Orya-Latn-2011.imp +1 -1
- data/maps/alalc-pan-Guru-Latn-1997.imp +1 -1
- data/maps/alalc-pan-Guru-Latn-2011.imp +1 -1
- data/maps/alalc-per-Arab-Latn-1997.imp +1 -1
- data/maps/alalc-pli-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-pra-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-rus-Cyrl-Latn-1997.imp +2 -2
- data/maps/alalc-rus-Cyrl-Latn-2012.imp +1 -1
- data/maps/alalc-san-Deva-Latn-2012.imp +1 -1
- data/maps/alalc-sin-Sinh-Latn-1997.imp +1 -1
- data/maps/alalc-sin-Sinh-Latn-2011.imp +1 -1
- data/maps/alalc-srp-Cyrl-Latn-1997.imp +2 -2
- data/maps/alalc-srp-Cyrl-Latn-2013.imp +1 -1
- data/maps/alalc-tam-Taml-Latn-1997.imp +1 -1
- data/maps/alalc-tam-Taml-Latn-2011.imp +1 -1
- data/maps/alalc-tel-Telu-Latn-1997.imp +2 -2
- data/maps/alalc-tel-Telu-Latn-2011.imp +1 -1
- data/maps/alalc-tir-Ethi-Latn-1997.imp +429 -0
- data/maps/alalc-tir-Ethi-Latn-2011.imp +85 -0
- data/maps/alalc-ukr-Cyrl-Latn-1997.imp +1 -1
- data/maps/alalc-ukr-Cyrl-Latn-2011.imp +1 -1
- data/maps/apcbg-bul-Cyrl-Latn-1995.imp +7 -4
- data/maps/az-aze-Cyrl-Latn-1939.imp +1 -0
- data/maps/az-aze-Cyrl-Latn-1958.imp +1 -0
- data/maps/bgn-jpn-Hrkt-Latn-1962.imp +5 -5
- data/maps/bgn-kor-Hang-Latn-1943.imp +1 -1
- data/maps/bgn-kor-Kore-Latn-1943.imp +1 -1
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +11 -11
- data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +1 -1
- data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +2 -2
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +2 -2
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +10 -4
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +1 -1
- data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +1 -1
- data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +4 -4
- data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +1 -1
- data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +1 -1
- data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +1 -1
- data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +4 -3
- data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +1 -1
- data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +1 -1
- data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +2 -2
- data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +1 -1
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +1 -1
- data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +8 -8
- data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +2 -2
- data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +4 -4
- data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +3 -3
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +1 -1
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +4 -4
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +4 -3
- data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +1 -1
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +2 -2
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +1 -1
- data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +3 -3
- data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +4 -4
- data/maps/bgnpcgn-per-Arab-Latn-1958.imp +19 -19
- data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +15 -15
- data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +15 -15
- data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +16 -16
- data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +2 -2
- data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +5 -5
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +1 -1
- data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +1 -1
- data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +5 -3
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +1 -1
- data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +1 -1
- data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +1 -1
- data/maps/bgnpcgn-tir-Ethi-Latn-2007.imp +511 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +1 -1
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +1 -1
- data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +15 -15
- data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +3 -3
- data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +1 -1
- data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +1 -1
- data/maps/by-bel-Cyrl-Latn-2007.imp +7 -5
- data/maps/dos-nep-Deva-Latn-1997.imp +2 -2
- data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +1 -1
- data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +1 -1
- data/maps/ggg-kat-Geor-Latn-2002.imp +3 -3
- data/maps/gki-bel-Cyrl-Latn-2000.imp +1 -1
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +1 -1
- data/maps/iso-ara-Arab-Latn-233-1984.imp +14 -14
- data/maps/iso-ben-Beng-Latn-15919-2001.imp +1 -1
- data/maps/iso-prs-Arab-Latn-233-3-1999.imp +14 -14
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +5 -5
- data/maps/mext-jpn-Hrkt-Latn-1954.imp +2 -1
- data/maps/moct-kor-Hang-Latn-2000.imp +1 -1
- data/maps/mofa-jpn-Hrkt-Latn-1989.imp +1 -1
- data/maps/mv-div-Thaa-Latn-1987.imp +1 -1
- data/maps/mvd-bel-Cyrl-Latn-2008.imp +5 -5
- data/maps/mvd-bel-Cyrl-Latn-2010.imp +2 -5
- data/maps/mvd-rus-Cyrl-Latn-2008.imp +4 -3
- data/maps/mvd-rus-Cyrl-Latn-2010.imp +2 -5
- data/maps/odni-ara-Arab-Latn-2004.imp +1 -1
- data/maps/odni-ara-Arab-Latn-2015.imp +1 -1
- data/maps/odni-aze-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-bel-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-bul-Cyrl-Latn-2005.imp +2 -2
- data/maps/odni-bul-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-che-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-fas-Arab-Latn-2004.imp +14 -14
- data/maps/odni-fas-Arab-Latn-2015.imp +15 -15
- data/maps/odni-hin-Deva-Latn-2004.imp +20 -20
- data/maps/odni-hin-Deva-Latn-2015.imp +25 -26
- data/maps/odni-kat-Geor-Latn-2015.imp +2 -3
- data/maps/odni-kaz-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-kir-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-kor-Hang-Latn-2015.imp +1 -1
- data/maps/odni-mkd-Cyrl-Latn-2005.imp +1 -1
- data/maps/odni-mkd-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-prs-Arab-Latn-2015.imp +1 -1
- data/maps/odni-pus-Arab-Latn-2011.imp +1 -1
- data/maps/odni-rus-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-srp-Cyrl-Latn-2005.imp +2 -2
- data/maps/odni-srp-Cyrl-Latn-2015.imp +8 -8
- data/maps/odni-tat-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-tgk-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-tuk-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-uig-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-ukr-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-urd-Arab-Latn-2015.imp +21 -21
- data/maps/odni-uzb-Cyrl-Latn-2015.imp +1 -1
- data/maps/ses-ara-Arab-Latn-1930.imp +14 -14
- data/maps/un-amh-Ethi-Latn-2016.imp +1 -1
- data/maps/un-ara-Arab-Latn-1971.imp +5 -5
- data/maps/un-ara-Arab-Latn-1972.imp +4 -4
- data/maps/un-ara-Arab-Latn-2017.imp +15 -15
- data/maps/un-asm-Beng-Latn-1972.imp +1 -1
- data/maps/un-bel-Cyrl-Latn-2007.imp +2 -2
- data/maps/un-ben-Beng-Latn-2016.imp +1 -1
- data/maps/un-bul-Cyrl-Latn-1977.imp +197 -0
- data/maps/un-ell-Grek-Latn-1987-phonetic.imp +5 -1
- data/maps/un-ell-Grek-Latn-1987-tl.imp +1 -1
- data/maps/un-ell-Grek-Latn-1987-ts.imp +2 -2
- data/maps/un-guj-Gujr-Latn-1972.imp +1 -1
- data/maps/un-hin-Deva-Latn-2016.imp +1 -1
- data/maps/un-kan-Kana-Latn-2016.imp +1 -1
- data/maps/un-mal-Mlym-Latn-1972.imp +1 -1
- data/maps/un-mar-Deva-Latn-2016.imp +1 -1
- data/maps/un-mkd-Cyrl-Latn-1977.imp +119 -0
- data/maps/un-mon-Mong-Latn-general-2013.imp +1 -1
- data/maps/un-mon-Mong-Latn-phonetic-2013.imp +1 -1
- data/maps/un-nep-Deva-Latn-1972.imp +1 -1
- data/maps/un-nep-Deva-Latn-2013.imp +1 -1
- data/maps/un-ori-Orya-Latn-1972.imp +1 -1
- data/maps/un-pan-Guru-Latn-1972.imp +1 -1
- data/maps/un-prs-Arab-Latn-1967.imp +15 -15
- data/maps/un-rus-Cyrl-Latn-1987.imp +1 -1
- data/maps/un-sin-Sinh-Latn-1972.imp +1 -1
- data/maps/un-srp-Cyrl-Latn-1997.imp +47 -0
- data/maps/un-tam-Taml-Latn-1972.imp +1 -1
- data/maps/un-tel-Telu-Latn-1972.imp +1 -1
- data/maps/un-ukr-Cyrl-Latn-1998.imp +1 -1
- data/maps/un-ukr-Cyrl-Latn-2012.imp +1 -1
- data/maps/un-urd-Arab-Latn-1972.imp +15 -15
- data/maps/var-amh-Ethi-Latn-eae-2003.imp +48 -43
- metadata +9 -3
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: ics-630-01:ara
|
5
5
|
source_script: Arab
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Intelligence Community (IC) Standard for the Transliteration of Arabic Personal Names (2004)
|
8
8
|
url: https://github.com/interscript/interscript-private-references/blob/master/odni/Arabic_IC_Standard.doc
|
9
9
|
creation_date: 2004
|
10
10
|
confirmation_date: 2004-06
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: ics-630-01:ara
|
5
5
|
source_script: Arab
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Arabic Personal Names (2015), ICS 630-01 Annex A
|
8
8
|
url: https://github.com/interscript/ics-630-01/blob/master/reference-docs/ANNEX%20A%20-%20Arabic_Personal_Names_FLTS%20(U).pdf
|
9
9
|
creation_date: 2017
|
10
10
|
confirmation_date: 2018-06
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:aze
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Azeri Personal Names (2015), ICS 630-01 Annex P
|
8
8
|
source: ICS-630-01 Annex P
|
9
9
|
creation_date: 2015
|
10
10
|
confirmation_date: 2015
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:bel
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Belarusian Personal Names (2015), ICS 630-01 Annex B
|
8
8
|
|
9
9
|
# url:
|
10
10
|
source: ICS 630-01, Annex B
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:bul
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name: Intelligence Community (IC) Standard for the Transliteration of Bulgarian Personal Names
|
7
|
+
name: Intelligence Community (IC) Standard for the Transliteration of Bulgarian Personal Names (2005)
|
8
8
|
creation_date: 2005
|
9
9
|
description:
|
10
10
|
}
|
@@ -53,7 +53,7 @@ stage {
|
|
53
53
|
sub "\u042c", "Y"
|
54
54
|
sub "\u042e", "Yu"
|
55
55
|
sub "\u042f", "Ya"
|
56
|
-
|
56
|
+
|
57
57
|
sub "\u0430", "a"
|
58
58
|
sub "\u0431", "b"
|
59
59
|
sub "\u0432", "v"
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:bul
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Bulgarian Personal Names (2015), ICS-630-01 Annex O
|
8
8
|
|
9
9
|
# url:
|
10
10
|
source: ICS-630-01 Annex O
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:che
|
5
5
|
source_script: Cyrl
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Chechen Cyrillic Personal Names (2015)
|
8
8
|
url: https://github.com/interscript/ics-630-01/blob/master/reference-docs/ANNEX%20C%20-%20Chechen_Personal_Names_FLTS%20(U).pdf
|
9
9
|
source: ICS-630-01 Annex C
|
10
10
|
creation_date: 2015
|
@@ -140,20 +140,20 @@ stage {
|
|
140
140
|
# '\uFE8E' : '' # ﺎ
|
141
141
|
|
142
142
|
# Sun letters
|
143
|
-
sub boundary + "\u0627\u0644\u062a", "at t" # الت
|
144
|
-
sub boundary + "\u0627\u0644\u062b", "as s" # الث
|
145
|
-
sub boundary + "\u0627\u0644\u062f", "ad d" # الد
|
146
|
-
sub boundary + "\u0627\u0644\u0630", "az z" # الذ
|
147
|
-
sub boundary + "\u0627\u0644\u0631", "ar r" # الر
|
148
|
-
sub boundary + "\u0627\u0644\u0632", "az z" # الز
|
149
|
-
sub boundary + "\u0627\u0644\u0633", "as s" # الس
|
150
|
-
sub boundary + "\u0627\u0644\u0634", "ash sh" # الش
|
151
|
-
sub boundary + "\u0627\u0644\u0635", "as s" # الص
|
152
|
-
sub boundary + "\u0627\u0644\u0636", "az z" # الض
|
153
|
-
sub boundary + "\u0627\u0644\u0637", "at t" # الط
|
154
|
-
sub boundary + "\u0627\u0644\u0638", "az z" # الظ
|
155
|
-
sub boundary + "\u0627\u0644\u0644", "al l" # الل
|
156
|
-
sub boundary + "\u0627\u0644\u0646", "an n" # الن
|
143
|
+
sub boundary + "\u0627\u0644\u062a" + maybe("\u0651"), "at t" # الت
|
144
|
+
sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), "as s" # الث
|
145
|
+
sub boundary + "\u0627\u0644\u062f" + maybe("\u0651"), "ad d" # الد
|
146
|
+
sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), "az z" # الذ
|
147
|
+
sub boundary + "\u0627\u0644\u0631" + maybe("\u0651"), "ar r" # الر
|
148
|
+
sub boundary + "\u0627\u0644\u0632" + maybe("\u0651"), "az z" # الز
|
149
|
+
sub boundary + "\u0627\u0644\u0633" + maybe("\u0651"), "as s" # الس
|
150
|
+
sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "ash sh" # الش
|
151
|
+
sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "as s" # الص
|
152
|
+
sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "az z" # الض
|
153
|
+
sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "at t" # الط
|
154
|
+
sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), "az z" # الظ
|
155
|
+
sub boundary + "\u0627\u0644\u0644" + maybe("\u0651"), "al l" # الل
|
156
|
+
sub boundary + "\u0627\u0644\u0646" + maybe("\u0651"), "an n" # الن
|
157
157
|
|
158
158
|
# Farsi Vowel (Pointing)
|
159
159
|
sub "\u0622", "a" # آ alef maddeh
|
@@ -4,7 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:fas
|
5
5
|
source_script: Arab
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
7
|
+
name: Romanization of Persian Farsi Dari Personal Names (2015), ICS-630-01 Annex J
|
8
8
|
url: https://github.com/interscript/ics-630-01/blob/master/reference-docs/ANNEX%20J%20-%20Persian-Farsi_Dari_Personal_Names_FLTS_2018_Revision%20(U).pdf
|
9
9
|
creation_date: 2015
|
10
10
|
confirmation_date: 2015-11
|
@@ -257,20 +257,20 @@ stage {
|
|
257
257
|
# '\uFE8E' : '' # ﺎ
|
258
258
|
|
259
259
|
# Sun letters
|
260
|
-
sub boundary + "\u0627\u0644\u062a", "at t" # الت
|
261
|
-
sub boundary + "\u0627\u0644\u062b", "as s" # الث
|
262
|
-
sub boundary + "\u0627\u0644\u062f", "ad d" # الد
|
263
|
-
sub boundary + "\u0627\u0644\u0630", "az z" # الذ
|
264
|
-
sub boundary + "\u0627\u0644\u0631", "ar r" # الر
|
265
|
-
sub boundary + "\u0627\u0644\u0632", "az z" # الز
|
266
|
-
sub boundary + "\u0627\u0644\u0633", "as s" # الس
|
267
|
-
sub boundary + "\u0627\u0644\u0634", "ash sh" # الش
|
268
|
-
sub boundary + "\u0627\u0644\u0635", "as s" # الص
|
269
|
-
sub boundary + "\u0627\u0644\u0636", "az z" # الض
|
270
|
-
sub boundary + "\u0627\u0644\u0637", "at t" # الط
|
271
|
-
sub boundary + "\u0627\u0644\u0638", "az z" # الظ
|
272
|
-
sub boundary + "\u0627\u0644\u0644", "al l" # الل
|
273
|
-
sub boundary + "\u0627\u0644\u0646", "an n" # الن
|
260
|
+
sub boundary + "\u0627\u0644\u062a" + maybe("\u0651"), "at t" # الت
|
261
|
+
sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), "as s" # الث
|
262
|
+
sub boundary + "\u0627\u0644\u062f" + maybe("\u0651"), "ad d" # الد
|
263
|
+
sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), "az z" # الذ
|
264
|
+
sub boundary + "\u0627\u0644\u0631" + maybe("\u0651"), "ar r" # الر
|
265
|
+
sub boundary + "\u0627\u0644\u0632" + maybe("\u0651"), "az z" # الز
|
266
|
+
sub boundary + "\u0627\u0644\u0633" + maybe("\u0651"), "as s" # الس
|
267
|
+
sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "ash sh" # الش
|
268
|
+
sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "as s" # الص
|
269
|
+
sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "az z" # الض
|
270
|
+
sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "at t" # الط
|
271
|
+
sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), "az z" # الظ
|
272
|
+
sub boundary + "\u0627\u0644\u0644" + maybe("\u0651"), "al l" # الل
|
273
|
+
sub boundary + "\u0627\u0644\u0646" + maybe("\u0651"), "an n" # الن
|
274
274
|
|
275
275
|
# Farsi Vowel (Pointing)
|
276
276
|
sub "\u0622", "a" # آ alef maddeh
|
@@ -4,12 +4,12 @@ metadata {
|
|
4
4
|
language: iso-639-2:hin
|
5
5
|
source_script: Deva
|
6
6
|
destination_script: Latn
|
7
|
-
name: IC
|
7
|
+
name: Intelligence Community (IC) Standard for the Transliteration of Hindi and Urdu Personal Names (2004)
|
8
8
|
url: https://github.com/interscript/interscript-private-references/blob/master/odni/Hindi_and_Urdu_IC_Standard.doc
|
9
9
|
creation_date: 2004
|
10
10
|
description: |
|
11
11
|
IC STANDARDS FOR TRANSLITERATION OF HINDI AND URDU PERSONAL NAMES
|
12
|
-
|
12
|
+
|
13
13
|
notes:
|
14
14
|
- |
|
15
15
|
Long/Short Vowels: Long and short vowels are not distinguished in the system:
|
@@ -69,7 +69,7 @@ stage {
|
|
69
69
|
|
70
70
|
# CHARACTERS
|
71
71
|
parallel {
|
72
|
-
|
72
|
+
|
73
73
|
#Independent vowel characters
|
74
74
|
sub "अ", "a"
|
75
75
|
sub "आ", "a"
|
@@ -84,7 +84,7 @@ stage {
|
|
84
84
|
sub "ओ", "o"
|
85
85
|
sub "ऑ", "au"
|
86
86
|
sub "औ", "au"
|
87
|
-
|
87
|
+
|
88
88
|
#Dependent Vowels
|
89
89
|
sub "ा", "a"
|
90
90
|
sub "ि", "i"
|
@@ -98,10 +98,10 @@ stage {
|
|
98
98
|
sub "ो", "o"
|
99
99
|
sub "ौ", "au"
|
100
100
|
sub "ॉ", "au"
|
101
|
-
|
102
|
-
|
101
|
+
|
102
|
+
|
103
103
|
# Consonants
|
104
|
-
|
104
|
+
|
105
105
|
# Gutturals
|
106
106
|
sub "क", "k"
|
107
107
|
sub "क्ष", "ksha"
|
@@ -112,7 +112,7 @@ stage {
|
|
112
112
|
sub "ग़", "gh"
|
113
113
|
sub "घ", "gh"
|
114
114
|
sub "ङ", "n"
|
115
|
-
|
115
|
+
|
116
116
|
# Palatals
|
117
117
|
sub "च", "ch"
|
118
118
|
sub "छ", "ch"
|
@@ -121,7 +121,7 @@ stage {
|
|
121
121
|
sub "झ", "gya"
|
122
122
|
sub "झ", "jh"
|
123
123
|
sub "ञ", "n"
|
124
|
-
|
124
|
+
|
125
125
|
# Cerebrals
|
126
126
|
sub "ट", "t"
|
127
127
|
sub "ठ", "th"
|
@@ -130,14 +130,14 @@ stage {
|
|
130
130
|
sub "ढ़", "rh"
|
131
131
|
sub "ढ", "dh"
|
132
132
|
sub "ण", "n"
|
133
|
-
|
133
|
+
|
134
134
|
# Dentals
|
135
135
|
sub "त", "t"
|
136
136
|
sub "थ", "th"
|
137
137
|
sub "द", "d"
|
138
138
|
sub "ध", "dh"
|
139
139
|
sub "न", "n"
|
140
|
-
|
140
|
+
|
141
141
|
# Labials
|
142
142
|
sub "प", "p"
|
143
143
|
sub "फ़", "f"
|
@@ -145,34 +145,34 @@ stage {
|
|
145
145
|
sub "ब", "b"
|
146
146
|
sub "भ", "bh"
|
147
147
|
sub "म", "m"
|
148
|
-
|
148
|
+
|
149
149
|
# Semivowels
|
150
150
|
sub "य", "y"
|
151
151
|
sub "र", "r"
|
152
152
|
sub "ल", "l"
|
153
153
|
sub "व", "v"
|
154
|
-
|
154
|
+
|
155
155
|
# Sibilants
|
156
156
|
sub "श", "sh"
|
157
157
|
sub "ष", "sh"
|
158
158
|
sub "स", "s"
|
159
|
-
|
160
|
-
|
159
|
+
|
160
|
+
|
161
161
|
# Aspirate
|
162
162
|
sub "ह", "h"
|
163
|
-
|
163
|
+
|
164
164
|
# Anusvāra
|
165
165
|
sub "ं", "n"
|
166
|
-
|
166
|
+
|
167
167
|
# Anunāsika
|
168
168
|
sub "ँ", "n"
|
169
|
-
|
169
|
+
|
170
170
|
# halanta
|
171
171
|
sub "्", ""
|
172
|
-
|
172
|
+
|
173
173
|
# bisharga
|
174
174
|
sub "ः", "h"
|
175
|
-
|
175
|
+
|
176
176
|
sub "़", ""
|
177
177
|
}
|
178
178
|
|
@@ -4,8 +4,7 @@ metadata {
|
|
4
4
|
language: iso-639-2:hin
|
5
5
|
source_script: Deva
|
6
6
|
destination_script: Latn
|
7
|
-
name:
|
8
|
-
|
7
|
+
name: Romanization of Hindi Urdu Personal Names (2015), ICS-630-01 Annex F
|
9
8
|
#url:
|
10
9
|
creation_date: 2015
|
11
10
|
confirmation_date: 2015
|
@@ -16,7 +15,7 @@ metadata {
|
|
16
15
|
forensic information. Rather, it is to provide an IC standard Romanized (English)
|
17
16
|
transliteration from standard Hindi and Urdu that can then be linked to forensic
|
18
17
|
information in ways that will help identify the referent of the name.
|
19
|
-
|
18
|
+
|
20
19
|
There are typically a number of ways that names can be Romanized from either
|
21
20
|
Devanagari (Hindi) or modified Arabic (Urdu) scripts. Ambiguities can result from the
|
22
21
|
Romanization of Hindi and Urdu names for several reasons, including the fact that some
|
@@ -31,7 +30,7 @@ metadata {
|
|
31
30
|
And, as in the Arabic source, names containing the Arabic definite article ‘al’ (‘ul’) show
|
32
31
|
anticipatory assimilation in pronunciation (e.g., Shams al Din > Shamsuddin);
|
33
32
|
transliterations may either reflect spelling or pronunciation in such cases.
|
34
|
-
|
33
|
+
|
35
34
|
Because Hindi and Urdu overlap so extensively, it is desirable to correlate Hindi and
|
36
35
|
Urdu transliterations as much as possible. In the area of names, this can become
|
37
36
|
problematic when the Urdu spelling accurately reflects original Arabic spelling while the
|
@@ -40,7 +39,7 @@ metadata {
|
|
40
39
|
either Urdu or Hindi (e.g., letter sin versus letter sad) while maintaining Arabic/Urdu
|
41
40
|
spelling distinctions like Hindi also maintains (e.g., qaf as in Qutubbin versus kaf)).
|
42
41
|
However, this is not always possible (see Hindi va versus Urdu wau).
|
43
|
-
|
42
|
+
|
44
43
|
In cases where an individual’s name has already been transliterated, that is to be indicated
|
45
44
|
– as found – in parentheses immediately following its rendition in the transliteration
|
46
45
|
standard (e.g., Muhammad Khulud (Mohamed Khulood)). In addition, if the original
|
@@ -48,14 +47,14 @@ metadata {
|
|
48
47
|
parentheses following the name, if possible, following best practices of the issuing
|
49
48
|
organization and taking into consideration information system capabilities. This
|
50
49
|
convention is designed to ensure that vital forensic information is not lost.
|
51
|
-
|
50
|
+
|
52
51
|
For names of persons who are known to not be part of the Hindi- or Urdu-speaking
|
53
52
|
community, use the relevant IC transliteration standard for names from that language
|
54
53
|
(e.g., Mikhail, Yitzhak). A translator’s note may be used to clarify the known origin of
|
55
54
|
the person. Spell names of individuals from languages that are written in Roman letters as
|
56
55
|
they are spelled in those languages (e.g., George Clooney, Jorge Garcia, Georges
|
57
56
|
Pompidou).
|
58
|
-
|
57
|
+
|
59
58
|
In the case of active senior government officials in the on-line CIA World Factbook and
|
60
59
|
the on-line directory of Chiefs of State and Cabinet Members of Foreign Governments,
|
61
60
|
the spellings given in these on-line reference works should be used in place of the IC
|
@@ -64,7 +63,7 @@ metadata {
|
|
64
63
|
government official), the IC Standard spelling should appear first, with the spelling, if
|
65
64
|
known, as it previously appeared in those resources listed within parentheses at the first
|
66
65
|
usage.
|
67
|
-
|
66
|
+
|
68
67
|
The primary goal of this system is to produce a consistent Romanized transcription of the
|
69
68
|
name that is readable to the non-specialist. The system uses the 26 letters of the standard
|
70
69
|
(English) Roman alphabet. Some ambiguities in the Romanized form will occur without
|
@@ -72,16 +71,16 @@ metadata {
|
|
72
71
|
information about the individual is provided, the referent will be clearly identified.
|
73
72
|
Additionally, this system will be used in conjunction with on-line tools, name dictionaries
|
74
73
|
and lists containing conventional spellings of names of well-known individuals
|
75
|
-
|
74
|
+
|
76
75
|
notes:
|
77
|
-
|
76
|
+
|
78
77
|
- |
|
79
78
|
Long/Short Vowels: Long and short vowels are not distinguished in the system:
|
80
79
|
The borrowed Arabic name Samir could represent two distinct names, one with a
|
81
80
|
long /a/ (Saamir) and one with a long /i/ (Samiir). One solution would be to use
|
82
81
|
/ee/ to stand for the long /i/, as is often done (Sameer). The IC Standard will not
|
83
82
|
distinguish between these.
|
84
|
-
|
83
|
+
|
85
84
|
- |
|
86
85
|
No distinction is made between: retroflex and non-retroflex consonants; and
|
87
86
|
nasalized vowels and vowels followed by /n/.
|
@@ -151,9 +150,9 @@ stage {
|
|
151
150
|
|
152
151
|
# CHARACTERS
|
153
152
|
parallel {
|
154
|
-
|
153
|
+
|
155
154
|
# I. Vowels and Diphthongs (see Note 1)
|
156
|
-
|
155
|
+
|
157
156
|
sub "अ", "a"
|
158
157
|
sub "आ", "a"
|
159
158
|
sub "इ", "i"
|
@@ -165,7 +164,7 @@ stage {
|
|
165
164
|
sub "ऐ", "ai"
|
166
165
|
sub "ऑ", "o"
|
167
166
|
sub "ओ", "au"
|
168
|
-
|
167
|
+
|
169
168
|
# II. Consonants (see Note 2)
|
170
169
|
# Gutturals
|
171
170
|
sub "क", "k"
|
@@ -177,7 +176,7 @@ stage {
|
|
177
176
|
sub "घ", "gh"
|
178
177
|
sub "ग़", "gh"
|
179
178
|
sub "ङ", "n"
|
180
|
-
|
179
|
+
|
181
180
|
# Palatals
|
182
181
|
sub "च", "ch"
|
183
182
|
sub "छ", "ch"
|
@@ -185,7 +184,7 @@ stage {
|
|
185
184
|
sub "झ", "jh"
|
186
185
|
sub "ज़", "z"
|
187
186
|
sub "ञ", "n"
|
188
|
-
|
187
|
+
|
189
188
|
# Cerebrals
|
190
189
|
sub "ट", "t"
|
191
190
|
sub "ठ", "th"
|
@@ -194,14 +193,14 @@ stage {
|
|
194
193
|
sub "ढ", "dh"
|
195
194
|
sub "ढ़", "rh"
|
196
195
|
sub "ण", "n"
|
197
|
-
|
196
|
+
|
198
197
|
# Dentals
|
199
198
|
sub "त", "t"
|
200
199
|
sub "थ", "th"
|
201
200
|
sub "द", "d"
|
202
201
|
sub "ध", "dh"
|
203
202
|
sub "न", "n"
|
204
|
-
|
203
|
+
|
205
204
|
# Labials
|
206
205
|
sub "प", "p"
|
207
206
|
sub "फ", "ph"
|
@@ -209,33 +208,33 @@ stage {
|
|
209
208
|
sub "ब", "b"
|
210
209
|
sub "भ", "bh"
|
211
210
|
sub "म", "m"
|
212
|
-
|
211
|
+
|
213
212
|
# Semivowels
|
214
213
|
sub "य", "y"
|
215
214
|
sub "र", "r"
|
216
215
|
sub "ल", "l"
|
217
216
|
sub "व", "v"
|
218
|
-
|
217
|
+
|
219
218
|
# Sibilants
|
220
219
|
sub "श", "sh"
|
221
220
|
sub "ष", "sh"
|
222
221
|
sub "स", "s"
|
223
|
-
|
222
|
+
|
224
223
|
# Aspirate
|
225
224
|
sub "ह", "h"
|
226
|
-
|
225
|
+
|
227
226
|
# Anusvāra
|
228
227
|
sub "ं", "n"
|
229
|
-
|
228
|
+
|
230
229
|
# Bisarga
|
231
230
|
sub "ः ", "h"
|
232
|
-
|
231
|
+
|
233
232
|
# Anunāsika
|
234
233
|
sub "ँ", "n"
|
235
|
-
|
234
|
+
|
236
235
|
sub "़", ""
|
237
236
|
sub "्", ""
|
238
|
-
|
237
|
+
|
239
238
|
# Medials # Needed for connecting constants
|
240
239
|
sub "ा", "a"
|
241
240
|
sub "ि", "i"
|