interscript-maps 2.2.0 → 2.2.1

Sign up to get free protection for your applications and to get access to all the features.
Files changed (192) hide show
  1. checksums.yaml +4 -4
  2. data/interscript-maps.gemspec +1 -1
  3. data/interscript-maps.yaml +300 -111
  4. data/maps/acadsin-zho-Hani-Latn-2002.imp +2 -2
  5. data/maps/alalc-amh-Ethi-Latn-1997.imp +18 -14
  6. data/maps/alalc-amh-Ethi-Latn-2011.imp +1 -1
  7. data/maps/alalc-ara-Arab-Latn-1997.imp +1 -1
  8. data/maps/alalc-asm-Deva-Latn-1997.imp +1 -1
  9. data/maps/alalc-asm-Deva-Latn-2012.imp +1 -1
  10. data/maps/alalc-aze-Arab-Latn-1997.imp +1 -1
  11. data/maps/alalc-aze-Cyrl-Latn-1997.imp +1 -1
  12. data/maps/alalc-bel-Cyrl-Latn-1997.imp +4 -4
  13. data/maps/alalc-ben-Beng-Latn-1997.imp +1 -1
  14. data/maps/alalc-ben-Beng-Latn-2017.imp +1 -1
  15. data/maps/alalc-bul-Cyrl-Latn-1997.imp +1 -1
  16. data/maps/alalc-div-Thaa-Latn-1997.imp +1 -1
  17. data/maps/alalc-ell-Grek-Latn-1997.imp +1 -1
  18. data/maps/alalc-ell-Grek-Latn-2010.imp +1 -1
  19. data/maps/alalc-guj-Gujr-Latn-1997.imp +1 -1
  20. data/maps/alalc-guj-Gujr-Latn-2011.imp +1 -1
  21. data/maps/alalc-hin-Deva-Latn-1997.imp +1 -1
  22. data/maps/alalc-hin-Deva-Latn-2011.imp +1 -1
  23. data/maps/alalc-kan-Kana-Latn-1997.imp +1 -1
  24. data/maps/alalc-kan-Kana-Latn-2011.imp +1 -1
  25. data/maps/alalc-kat-Geok-Latn-1997.imp +3 -3
  26. data/maps/alalc-kat-Geor-Latn-1997.imp +12 -12
  27. data/maps/alalc-kor-Hang-Latn-1997.imp +1 -1
  28. data/maps/alalc-mal-Mlym-Latn-1997.imp +1 -1
  29. data/maps/alalc-mar-Deva-Latn-1997.imp +1 -1
  30. data/maps/alalc-mar-Deva-Latn-2011.imp +1 -1
  31. data/maps/alalc-mkd-Cyrl-Latn-1997.imp +2 -2
  32. data/maps/alalc-mkd-Cyrl-Latn-2013.imp +2 -2
  33. data/maps/alalc-mon-Cyrl-Latn-1997.imp +3 -3
  34. data/maps/alalc-ori-Orya-Latn-1997.imp +1 -1
  35. data/maps/alalc-ori-Orya-Latn-2011.imp +1 -1
  36. data/maps/alalc-pan-Guru-Latn-1997.imp +1 -1
  37. data/maps/alalc-pan-Guru-Latn-2011.imp +1 -1
  38. data/maps/alalc-per-Arab-Latn-1997.imp +1 -1
  39. data/maps/alalc-pli-Deva-Latn-2012.imp +1 -1
  40. data/maps/alalc-pra-Deva-Latn-2012.imp +1 -1
  41. data/maps/alalc-rus-Cyrl-Latn-1997.imp +2 -2
  42. data/maps/alalc-rus-Cyrl-Latn-2012.imp +1 -1
  43. data/maps/alalc-san-Deva-Latn-2012.imp +1 -1
  44. data/maps/alalc-sin-Sinh-Latn-1997.imp +1 -1
  45. data/maps/alalc-sin-Sinh-Latn-2011.imp +1 -1
  46. data/maps/alalc-srp-Cyrl-Latn-1997.imp +2 -2
  47. data/maps/alalc-srp-Cyrl-Latn-2013.imp +1 -1
  48. data/maps/alalc-tam-Taml-Latn-1997.imp +1 -1
  49. data/maps/alalc-tam-Taml-Latn-2011.imp +1 -1
  50. data/maps/alalc-tel-Telu-Latn-1997.imp +2 -2
  51. data/maps/alalc-tel-Telu-Latn-2011.imp +1 -1
  52. data/maps/alalc-tir-Ethi-Latn-1997.imp +429 -0
  53. data/maps/alalc-tir-Ethi-Latn-2011.imp +85 -0
  54. data/maps/alalc-ukr-Cyrl-Latn-1997.imp +1 -1
  55. data/maps/alalc-ukr-Cyrl-Latn-2011.imp +1 -1
  56. data/maps/apcbg-bul-Cyrl-Latn-1995.imp +7 -4
  57. data/maps/az-aze-Cyrl-Latn-1939.imp +1 -0
  58. data/maps/az-aze-Cyrl-Latn-1958.imp +1 -0
  59. data/maps/bgn-jpn-Hrkt-Latn-1962.imp +5 -5
  60. data/maps/bgn-kor-Hang-Latn-1943.imp +1 -1
  61. data/maps/bgn-kor-Kore-Latn-1943.imp +1 -1
  62. data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +11 -11
  63. data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +1 -1
  64. data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +2 -2
  65. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +2 -2
  66. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +10 -4
  67. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +1 -1
  68. data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +1 -1
  69. data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +4 -4
  70. data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +1 -1
  71. data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +1 -1
  72. data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +1 -1
  73. data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +4 -3
  74. data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +1 -1
  75. data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +1 -1
  76. data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +2 -2
  77. data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +1 -1
  78. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +1 -1
  79. data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +8 -8
  80. data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +2 -2
  81. data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +4 -4
  82. data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +3 -3
  83. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +1 -1
  84. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +4 -4
  85. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +4 -3
  86. data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +1 -1
  87. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +2 -2
  88. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +1 -1
  89. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +3 -3
  90. data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +4 -4
  91. data/maps/bgnpcgn-per-Arab-Latn-1958.imp +19 -19
  92. data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +15 -15
  93. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +15 -15
  94. data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +16 -16
  95. data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +2 -2
  96. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +5 -5
  97. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +1 -1
  98. data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +1 -1
  99. data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +5 -3
  100. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +1 -1
  101. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +1 -1
  102. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +1 -1
  103. data/maps/bgnpcgn-tir-Ethi-Latn-2007.imp +511 -0
  104. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +1 -1
  105. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +1 -1
  106. data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +15 -15
  107. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +3 -3
  108. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +1 -1
  109. data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +1 -1
  110. data/maps/by-bel-Cyrl-Latn-2007.imp +7 -5
  111. data/maps/dos-nep-Deva-Latn-1997.imp +2 -2
  112. data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +1 -1
  113. data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +1 -1
  114. data/maps/ggg-kat-Geor-Latn-2002.imp +3 -3
  115. data/maps/gki-bel-Cyrl-Latn-2000.imp +1 -1
  116. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +1 -1
  117. data/maps/iso-ara-Arab-Latn-233-1984.imp +14 -14
  118. data/maps/iso-ben-Beng-Latn-15919-2001.imp +1 -1
  119. data/maps/iso-prs-Arab-Latn-233-3-1999.imp +14 -14
  120. data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +5 -5
  121. data/maps/mext-jpn-Hrkt-Latn-1954.imp +2 -1
  122. data/maps/moct-kor-Hang-Latn-2000.imp +1 -1
  123. data/maps/mofa-jpn-Hrkt-Latn-1989.imp +1 -1
  124. data/maps/mv-div-Thaa-Latn-1987.imp +1 -1
  125. data/maps/mvd-bel-Cyrl-Latn-2008.imp +5 -5
  126. data/maps/mvd-bel-Cyrl-Latn-2010.imp +2 -5
  127. data/maps/mvd-rus-Cyrl-Latn-2008.imp +4 -3
  128. data/maps/mvd-rus-Cyrl-Latn-2010.imp +2 -5
  129. data/maps/odni-ara-Arab-Latn-2004.imp +1 -1
  130. data/maps/odni-ara-Arab-Latn-2015.imp +1 -1
  131. data/maps/odni-aze-Cyrl-Latn-2015.imp +1 -1
  132. data/maps/odni-bel-Cyrl-Latn-2015.imp +1 -1
  133. data/maps/odni-bul-Cyrl-Latn-2005.imp +2 -2
  134. data/maps/odni-bul-Cyrl-Latn-2015.imp +1 -1
  135. data/maps/odni-che-Cyrl-Latn-2015.imp +1 -1
  136. data/maps/odni-fas-Arab-Latn-2004.imp +14 -14
  137. data/maps/odni-fas-Arab-Latn-2015.imp +15 -15
  138. data/maps/odni-hin-Deva-Latn-2004.imp +20 -20
  139. data/maps/odni-hin-Deva-Latn-2015.imp +25 -26
  140. data/maps/odni-kat-Geor-Latn-2015.imp +2 -3
  141. data/maps/odni-kaz-Cyrl-Latn-2015.imp +1 -1
  142. data/maps/odni-kir-Cyrl-Latn-2015.imp +1 -1
  143. data/maps/odni-kor-Hang-Latn-2015.imp +1 -1
  144. data/maps/odni-mkd-Cyrl-Latn-2005.imp +1 -1
  145. data/maps/odni-mkd-Cyrl-Latn-2015.imp +1 -1
  146. data/maps/odni-prs-Arab-Latn-2015.imp +1 -1
  147. data/maps/odni-pus-Arab-Latn-2011.imp +1 -1
  148. data/maps/odni-rus-Cyrl-Latn-2015.imp +1 -1
  149. data/maps/odni-srp-Cyrl-Latn-2005.imp +2 -2
  150. data/maps/odni-srp-Cyrl-Latn-2015.imp +8 -8
  151. data/maps/odni-tat-Cyrl-Latn-2015.imp +1 -1
  152. data/maps/odni-tgk-Cyrl-Latn-2015.imp +1 -1
  153. data/maps/odni-tuk-Cyrl-Latn-2015.imp +1 -1
  154. data/maps/odni-uig-Cyrl-Latn-2015.imp +1 -1
  155. data/maps/odni-ukr-Cyrl-Latn-2015.imp +1 -1
  156. data/maps/odni-urd-Arab-Latn-2015.imp +21 -21
  157. data/maps/odni-uzb-Cyrl-Latn-2015.imp +1 -1
  158. data/maps/ses-ara-Arab-Latn-1930.imp +14 -14
  159. data/maps/un-amh-Ethi-Latn-2016.imp +1 -1
  160. data/maps/un-ara-Arab-Latn-1971.imp +5 -5
  161. data/maps/un-ara-Arab-Latn-1972.imp +4 -4
  162. data/maps/un-ara-Arab-Latn-2017.imp +15 -15
  163. data/maps/un-asm-Beng-Latn-1972.imp +1 -1
  164. data/maps/un-bel-Cyrl-Latn-2007.imp +2 -2
  165. data/maps/un-ben-Beng-Latn-2016.imp +1 -1
  166. data/maps/un-bul-Cyrl-Latn-1977.imp +197 -0
  167. data/maps/un-ell-Grek-Latn-1987-phonetic.imp +5 -1
  168. data/maps/un-ell-Grek-Latn-1987-tl.imp +1 -1
  169. data/maps/un-ell-Grek-Latn-1987-ts.imp +2 -2
  170. data/maps/un-guj-Gujr-Latn-1972.imp +1 -1
  171. data/maps/un-hin-Deva-Latn-2016.imp +1 -1
  172. data/maps/un-kan-Kana-Latn-2016.imp +1 -1
  173. data/maps/un-mal-Mlym-Latn-1972.imp +1 -1
  174. data/maps/un-mar-Deva-Latn-2016.imp +1 -1
  175. data/maps/un-mkd-Cyrl-Latn-1977.imp +119 -0
  176. data/maps/un-mon-Mong-Latn-general-2013.imp +1 -1
  177. data/maps/un-mon-Mong-Latn-phonetic-2013.imp +1 -1
  178. data/maps/un-nep-Deva-Latn-1972.imp +1 -1
  179. data/maps/un-nep-Deva-Latn-2013.imp +1 -1
  180. data/maps/un-ori-Orya-Latn-1972.imp +1 -1
  181. data/maps/un-pan-Guru-Latn-1972.imp +1 -1
  182. data/maps/un-prs-Arab-Latn-1967.imp +15 -15
  183. data/maps/un-rus-Cyrl-Latn-1987.imp +1 -1
  184. data/maps/un-sin-Sinh-Latn-1972.imp +1 -1
  185. data/maps/un-srp-Cyrl-Latn-1997.imp +47 -0
  186. data/maps/un-tam-Taml-Latn-1972.imp +1 -1
  187. data/maps/un-tel-Telu-Latn-1972.imp +1 -1
  188. data/maps/un-ukr-Cyrl-Latn-1998.imp +1 -1
  189. data/maps/un-ukr-Cyrl-Latn-2012.imp +1 -1
  190. data/maps/un-urd-Arab-Latn-1972.imp +15 -15
  191. data/maps/var-amh-Ethi-Latn-eae-2003.imp +48 -43
  192. metadata +7 -1
@@ -4,8 +4,7 @@ metadata {
4
4
  language: iso-639-2:kat
5
5
  source_script: Geor
6
6
  destination_script: Latn
7
- name: Office of the Director Of National Intelligence Georgian Personal Names 2015, ICS 630-01 Annex E
8
-
7
+ name: Romanization of Georgian Personal Names (2015), ICS 630-01 Annex E
9
8
  # url:
10
9
  source: ICS 630-01, Annex E
11
10
  creation_date: 2015
@@ -16,7 +15,7 @@ metadata {
16
15
  eliminate variations of a name that can contribute forensic information. Rather, it is to provide an
17
16
  IC standard Romanized (English) transliteration from Georgian that can then be linked to forensic
18
17
  information in ways that will help identify the referent of the name.
19
-
18
+
20
19
  notes:
21
20
  }
22
21
 
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:kaz
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: Standards for the transliteration of kazakh personal names in written reports and products
7
+ name: Romanization of Kazakh Personal Names (2015)
8
8
  source: ICS-630-01 Annex Q
9
9
  creation_date: 2015
10
10
  confirmation_date: 2015
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:kir
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: Standards for the transliteration of kyrgyz personal names in written reports and products
7
+ name: Romanization of Kyrgyz Personal Names (2015)
8
8
  source: ICS-630-01 Annex R
9
9
  creation_date: 2015
10
10
  confirmation_date: 2015
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:kor
5
5
  source_script: Hang
6
6
  destination_script: Latn
7
- name: Office of the Director Of National Intelligence Korean 2015 System, ICS-630-01 Annex W
7
+ name: Romanization of Korean Personal Names (2015), ICS-630-01 Annex W
8
8
  url:
9
9
  creation_date: 2015
10
10
  adoption_date:
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:mkd
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: Standards for the transliteration of macedonian personal names in written reports and products
7
+ name: Intelligence Community (IC) Standard for the Transliteration of Macedonian Personal Names (2005)
8
8
  creation_date: 2005
9
9
  confirmation_date: 2005
10
10
  description: |
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:mkd
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: Standards for the transliteration of macedonian personal names in written reports and products
7
+ name: Romanization of Macedonian Personal Names (2015)
8
8
  source: ICS-630-01 Annex H
9
9
  creation_date: 2015
10
10
  confirmation_date: 2015
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-3:prs
5
5
  source_script: Arab
6
6
  destination_script: Latn
7
- name: ODNI Persian Farsi Dari Personal Names 2015 System, ICS-630-01 Annex J
7
+ name: Romanization of Persian Farsi Dari Personal Names (2015), ICS-630-01 Annex J
8
8
  url: https://github.com/interscript/ics-630-01/blob/master/reference-docs/ANNEX%20J%20-%20Persian-Farsi_Dari_Personal_Names_FLTS_2018_Revision%20(U).pdf
9
9
  creation_date: 2015
10
10
  confirmation_date: 2015-11
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-3:prs
5
5
  source_script: Arab
6
6
  destination_script: Latn
7
- name: ODNI Pashto Personal Names 2011 System
7
+ name: Romanization of Pashto Personal Names (2011)
8
8
  url: https://github.com/interscript/interscript-private-references/blob/master/odni/Pashto%20June%202011.pdf
9
9
  creation_date: 2011
10
10
  confirmation_date: 2011-06
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:rus
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: Office of the Director Of National Intelligence Russian Personal Names 2015, ICS-630-01 Annex K
7
+ name: Romanization of Russian Personal Names (2015), ICS-630-01 Annex K
8
8
 
9
9
  # url:
10
10
  source: ICS-630-01 Annex K
@@ -4,12 +4,12 @@ metadata {
4
4
  language: iso-639-2:srp
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: Office of the Director Of National Intelligence Serbian Personal Names 2004 System
7
+ name: Intelligence Community (IC) Standard for the Transliteration of Serbian Personal Names (2004)
8
8
  creation_date: 2005
9
9
  confirmation_date: 2005
10
10
  description: |
11
11
  Office of the Director Of National Intelligence Serbian Personal Names 2004 System
12
-
12
+
13
13
  notes:
14
14
  }
15
15
 
@@ -4,8 +4,8 @@ metadata {
4
4
  language: iso-639-2:srp
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: Office of the Director Of National Intelligence Serbian Personal Names 2015, ICS-630-01 Annex L
8
-
7
+ name: Romanization of Serbian Personal Names (2015), ICS-630-01 Annex L
8
+
9
9
  # url:
10
10
  source: ICS-630-01 Annex L
11
11
  creation_date: 2015
@@ -16,27 +16,27 @@ metadata {
16
16
  is not intended to eliminate variations of a name that can contribute forensic information. Rather,
17
17
  it is to provide an IC standard Romanized (English) transliteration from Serbian that can then be
18
18
  linked to forensic information in ways that will help identify the referent of the name.
19
-
19
+
20
20
  In cases where an individual’s name has already been transliterated in a variant spelling, the IC
21
21
  Standard spelling should appear first, followed by the variant spelling(s) in parentheses at the first
22
22
  usage. In addition, if the original Cyrillic spelling is known, that spelling should also appear in
23
23
  parentheses following the name, if possible, following best practices of the issuing organization
24
24
  and taking into consideration information system capabilities. This convention is designed to
25
25
  ensure that vital forensic information is not lost.
26
-
26
+
27
27
  For names of persons who are known to not be part of the Serbian-speaking community, use the
28
28
  relevant IC transliteration standard for names from that language (e.g., Mikhail, Yitzhak). A
29
29
  translator’s note may be used to clarify the known origin of the person. Spell names of
30
30
  individuals from languages that are written in Roman letters as they are spelled in those
31
31
  languages (e.g., George Clooney, Jorge Garcia, Georges Pompidou).
32
-
32
+
33
33
  In the case of active senior government officials in the on-line CIA World Factbook and the online directory of Chiefs of State and Cabinet Members of Foreign Governments, the spellings
34
34
  given in these on-line reference works should be used in place of the IC Standard. For any
35
35
  individual who has at one time been listed in the Factbook or Chiefs of State directory but who no
36
36
  longer appears in those resources (i.e. is no longer a government official), the IC Standard
37
37
  spelling should appear first, with the spelling, if known, as it previously appeared in those
38
38
  resources listed within parentheses at the first usage.
39
-
39
+
40
40
  The primary goal is to produce a consistent Romanized transcription of names that is specifically
41
41
  readable to the English-speaking non-specialist. The system uses the 26 letters of the standard
42
42
  (English) Roman alphabet. Some ambiguities in the Romanized form will occur without the use
@@ -44,7 +44,7 @@ metadata {
44
44
  individual is provided, the referent will be clearly identified. This system will be used in
45
45
  conjunction with on-line tools, name dictionaries, and lists containing conventional spellings of
46
46
  names of well-known individuals.
47
-
47
+
48
48
  notes:
49
49
  }
50
50
 
@@ -93,7 +93,7 @@ stage {
93
93
  sub "\u0427", "C" # Ч
94
94
  sub "\u040F", "Dz" # Џ
95
95
  sub "\u0428", "S" # Ш
96
-
96
+
97
97
  sub "\u0430", "a" # а
98
98
  sub "\u0431", "b" # б
99
99
  sub "\u0432", "v" # в
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:tat
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: Standards for the transliteration of tatar personal names in written reports and products
7
+ name: Romanization of Tatar Personal Names (2015)
8
8
  source: ICS-630-01 Annex S
9
9
  creation_date: 2015
10
10
  confirmation_date: 2015
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:tgk
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: Standards for the transliteration of tajik personal names in written reports and products
7
+ name: Romanization of Tajik Personal Names (2015)
8
8
  source: ICS-630-01 Annex N
9
9
  creation_date: 2015
10
10
  confirmation_date: 2015
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:tuk
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: Standards for the transliteration of Turkmen personal names in written reports and products
7
+ name: Romanization of Turkmen Personal Names (2015)
8
8
  url: https://github.com/interscript/ics-630-01/blob/master/reference-docs/ANNEX%20T%20-%20Turkmen_Personal_Names_FLTS%20(U).pdf
9
9
  source: ICS-630-01 Annex T
10
10
  creation_date: 2015
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:uig
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: Standards for the transliteration of uyghur personal names in written reports and products
7
+ name: Romanization of Uyghur Personal Names (2015)
8
8
  source: ICS-630-01 Annex U
9
9
  creation_date: 2015
10
10
  confirmation_date: 2015
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:ukr
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: Office of the Director Of National Intelligence Ukrainian Personal Names 2004 System, ICS 630-01 Annex M
7
+ name: Romanization of Ukrainian Personal Names (2015), ICS 630-01 Annex M
8
8
 
9
9
  # url:
10
10
  source: ICS 630-01, Annex M
@@ -4,8 +4,8 @@ metadata {
4
4
  language: iso-639-2:urd
5
5
  source_script: Arab
6
6
  destination_script: Latn
7
- name: Office of the Director Of National Intelligence Hindi Urdu Personal Names 2015 System, ICS-630-01 Annex F
8
-
7
+ name: Romanization of Hindi and Urdu Personal Names (2015), ICS-630-01 Annex F
8
+
9
9
  #url:
10
10
  creation_date: 2015
11
11
  confirmation_date: 2015
@@ -16,7 +16,7 @@ metadata {
16
16
  forensic information. Rather, it is to provide an IC standard Romanized (English)
17
17
  transliteration from standard Hindi and Urdu that can then be linked to forensic
18
18
  information in ways that will help identify the referent of the name.
19
-
19
+
20
20
  There are typically a number of ways that names can be Romanized from either
21
21
  Devanagari (Hindi) or modified Arabic (Urdu) scripts. Ambiguities can result from the
22
22
  Romanization of Hindi and Urdu names for several reasons, including the fact that some
@@ -31,7 +31,7 @@ metadata {
31
31
  And, as in the Arabic source, names containing the Arabic definite article ‘al’ (‘ul’) show
32
32
  anticipatory assimilation in pronunciation (e.g., Shams al Din > Shamsuddin);
33
33
  transliterations may either reflect spelling or pronunciation in such cases.
34
-
34
+
35
35
  Because Hindi and Urdu overlap so extensively, it is desirable to correlate Hindi and
36
36
  Urdu transliterations as much as possible. In the area of names, this can become
37
37
  problematic when the Urdu spelling accurately reflects original Arabic spelling while the
@@ -40,7 +40,7 @@ metadata {
40
40
  either Urdu or Hindi (e.g., letter sin versus letter sad) while maintaining Arabic/Urdu
41
41
  spelling distinctions like Hindi also maintains (e.g., qaf as in Qutubbin versus kaf)).
42
42
  However, this is not always possible (see Hindi va versus Urdu wau).
43
-
43
+
44
44
  In cases where an individual’s name has already been transliterated, that is to be indicated
45
45
  – as found – in parentheses immediately following its rendition in the transliteration
46
46
  standard (e.g., Muhammad Khulud (Mohamed Khulood)). In addition, if the original
@@ -48,14 +48,14 @@ metadata {
48
48
  parentheses following the name, if possible, following best practices of the issuing
49
49
  organization and taking into consideration information system capabilities. This
50
50
  convention is designed to ensure that vital forensic information is not lost.
51
-
51
+
52
52
  For names of persons who are known to not be part of the Hindi- or Urdu-speaking
53
53
  community, use the relevant IC transliteration standard for names from that language
54
54
  (e.g., Mikhail, Yitzhak). A translator’s note may be used to clarify the known origin of
55
55
  the person. Spell names of individuals from languages that are written in Roman letters as
56
56
  they are spelled in those languages (e.g., George Clooney, Jorge Garcia, Georges
57
57
  Pompidou).
58
-
58
+
59
59
  In the case of active senior government officials in the on-line CIA World Factbook and
60
60
  the on-line directory of Chiefs of State and Cabinet Members of Foreign Governments,
61
61
  the spellings given in these on-line reference works should be used in place of the IC
@@ -64,7 +64,7 @@ metadata {
64
64
  government official), the IC Standard spelling should appear first, with the spelling, if
65
65
  known, as it previously appeared in those resources listed within parentheses at the first
66
66
  usage.
67
-
67
+
68
68
  The primary goal of this system is to produce a consistent Romanized transcription of the
69
69
  name that is readable to the non-specialist. The system uses the 26 letters of the standard
70
70
  (English) Roman alphabet. Some ambiguities in the Romanized form will occur without
@@ -72,16 +72,16 @@ metadata {
72
72
  information about the individual is provided, the referent will be clearly identified.
73
73
  Additionally, this system will be used in conjunction with on-line tools, name dictionaries
74
74
  and lists containing conventional spellings of names of well-known individuals
75
-
75
+
76
76
  notes:
77
-
77
+
78
78
  - |
79
79
  Long/Short Vowels: Long and short vowels are not distinguished in the system:
80
80
  The borrowed Arabic name Samir could represent two distinct names, one with a
81
81
  long /a/ (Saamir) and one with a long /i/ (Samiir). One solution would be to use
82
82
  /ee/ to stand for the long /i/, as is often done (Sameer). The IC Standard will not
83
83
  distinguish between these.
84
-
84
+
85
85
  - |
86
86
  No distinction is made between: retroflex and non-retroflex consonants; and
87
87
  nasalized vowels and vowels followed by /n/.
@@ -150,8 +150,8 @@ stage {
150
150
 
151
151
  # CHARACTERS
152
152
  parallel {
153
-
154
-
153
+
154
+
155
155
  sub "\u0622", "a" # ARABIC ALEF W/MADDA ABOVE
156
156
  sub "\u0627", "a" # or u ARABIC ALEF
157
157
  sub "\u06cc", "i" # or ai or u ARABIC LETTER FARSI YEH
@@ -170,9 +170,9 @@ stage {
170
170
  sub "\u06c2", "-e" # ARABIC LETTER HEH GOAL WITH HAMZA ABOVE
171
171
  sub "\u06c1\u0650", "o" # ARABIC LETTER HEH GOAL + ARABIC KASRA
172
172
  sub "\u0624", "au" # ARABIC LETTER WAW WITH HAMZA ABOVE
173
-
174
-
175
-
173
+
174
+
175
+
176
176
  sub "\u06a9", "k" # ARABIC LETTER KEHEH
177
177
  sub "\u0642", "q" # ARABIC LETTER QAF
178
178
  sub "\u062e", "kh" # ARABIC LETTER KHAH
@@ -180,14 +180,14 @@ stage {
180
180
  sub "\u063a", "gh" # ARABIC LETTER GHAIN
181
181
  sub "\u0686", "ch" # ARABIC LETTER TCHEH
182
182
  sub "\u062c", "j" # Arabic Letter Jeem
183
-
183
+
184
184
  sub "\u0632", "z" # Arabic Letter ZAIN
185
185
  sub "\u0630", "z" # Arabic Letter THAL
186
186
  sub "\u0636", "z" # Arabic Letter DAD
187
187
  sub "\u0638", "z" # Arabic Letter ZAH
188
188
  sub "\u0698", "zh" # Arabic Letter JEH
189
-
190
-
189
+
190
+
191
191
  sub "\u0679", "t" # ARABIC LETTER TTEH
192
192
  sub "\u0688", "d" # Arabic Letter DDAL
193
193
  sub "\u062f", "d" # Arabic Letter DAL
@@ -196,8 +196,8 @@ stage {
196
196
  sub "\u0637", "t" # Arabic Letter TAH
197
197
  sub "\u0646", "n" # Arabic Letter NOON
198
198
  sub "\u06ba", "n" # Arabic Letter NOON GHUNNA
199
-
200
-
199
+
200
+
201
201
  sub "\u067e", "p" # Arabic Letter PE
202
202
  sub "\u0641", "f" # Arabic Letter FEH
203
203
  sub "\u0628", "b" # Arabic Letter BEH
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:uzb
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: Office of the Director Of National Intelligence Uzbek Personal Names 2015, ICS-630-01 Annex V
7
+ name: Romanization of Uzbek Personal Names (2015), ICS-630-01 Annex V
8
8
 
9
9
  # url:
10
10
  source: ICS-630-01 Annex V
@@ -129,20 +129,20 @@ stage {
129
129
 
130
130
 
131
131
  # Sun letters
132
- sub boundary + "\u0627\u0644\u062a", "el-t" # الت
133
- sub boundary + "\u0627\u0644\u062b", any(["el-th", "el-t"]) # الث
134
- sub boundary + "\u0627\u0644\u062f", "el-d" # الد
135
- sub boundary + "\u0627\u0644\u0630", any(["el-dh", "el-z"]) # الذ
136
- sub boundary + "\u0627\u0644\u0631", "el-r" # الر
137
- sub boundary + "\u0627\u0644\u0632", "el-z" # الز
138
- sub boundary + "\u0627\u0644\u0633", any(["el-s", "el-c"]) # الس
139
- sub boundary + "\u0627\u0644\u0634", "el-sh" # الش
140
- sub boundary + "\u0627\u0644\u0635", "el-ṣ" # الص
141
- sub boundary + "\u0627\u0644\u0636", "el-ḍ" # الض
142
- sub boundary + "\u0627\u0644\u0637", "el-ṭ" # الط
143
- sub boundary + "\u0627\u0644\u0638", any(["el-ẓ", "el-d"]) # الظ
144
- sub boundary + "\u0627\u0644\u0644", "el-l" # الل
145
- sub boundary + "\u0627\u0644\u0646", "el-n" # الن
132
+ sub boundary + "\u0627\u0644\u062a" + maybe("\u0651"), "el-t" # الت
133
+ sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), any(["el-th", "el-t"]) # الث
134
+ sub boundary + "\u0627\u0644\u062f" + maybe("\u0651"), "el-d" # الد
135
+ sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), any(["el-dh", "el-z"]) # الذ
136
+ sub boundary + "\u0627\u0644\u0631" + maybe("\u0651"), "el-r" # الر
137
+ sub boundary + "\u0627\u0644\u0632" + maybe("\u0651"), "el-z" # الز
138
+ sub boundary + "\u0627\u0644\u0633" + maybe("\u0651"), any(["el-s", "el-c"]) # الس
139
+ sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "el-sh" # الش
140
+ sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "el-ṣ" # الص
141
+ sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "el-ḍ" # الض
142
+ sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "el-ṭ" # الط
143
+ sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), any(["el-ẓ", "el-d"]) # الظ
144
+ sub boundary + "\u0627\u0644\u0644" + maybe("\u0651"), "el-l" # الل
145
+ sub boundary + "\u0627\u0644\u0646" + maybe("\u0651"), "el-n" # الن
146
146
 
147
147
 
148
148
  # shadda
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:amh
5
5
  source_script: Ethi
6
6
  destination_script: Latn
7
- name: ROMANIZATION OF AMHARIC -- UNGEGN 2016 System
7
+ name: Romanization of Amharic -- UNGEGN (2016)
8
8
  url: http://www.eki.ee/wgrs/rom1_am.pdf
9
9
  creation_date: 1967
10
10
  confirmation_date: 2016-03
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:ara
5
5
  source_script: Arab
6
6
  destination_script: Latn
7
- name: 1971 "Beirut system"
7
+ name: Romanization of Arabic -- Beirut system (1971)
8
8
  url: https://unstats.un.org/unsd/geoinfo/UNGEGN/docs/2nd-uncsgn-docs/E_Conf61_4_Add1_e.pdf
9
9
  creation_date: 1971
10
10
  confirmation_date: 2018-06
@@ -85,10 +85,10 @@ stage {
85
85
  parallel {
86
86
 
87
87
  # sun letters
88
- sub boundary + "\u0627\u0644\u062b", "at͟h t͟h" # الث
89
- sub boundary + "\u0627\u0644\u0630", "ad͟h d͟h" # الذ
90
- sub boundary + "\u0627\u0644\u0634", "as͟h s͟h" # الش
91
- sub boundary + "\u0627\u0644\u0638", "az͟h z͟h" # الظ
88
+ sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), "at͟h t͟h" # الث
89
+ sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), "ad͟h d͟h" # الذ
90
+ sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "as͟h s͟h" # الش
91
+ sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), "az͟h z͟h" # الظ
92
92
 
93
93
  # shadda
94
94
  sub "\u062e\u0651", "k͟hk͟h" # خ
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:ara
5
5
  source_script: Arab
6
6
  destination_script: Latn
7
- name: ROMANIZATION OF ARABIC -- UNGEGN 1972 System
7
+ name: Romanization of Arabic -- UNGEGN (1972)
8
8
  url: http://www.eki.ee/wgrs/obs_rom_vers/rom1_ar_v4_0.pdf
9
9
  creation_date: 1972
10
10
  confirmation_date: 2018-06
@@ -107,9 +107,9 @@ stage {
107
107
  # CHARACTERS
108
108
  parallel {
109
109
 
110
- sub boundary + "\u0627\u0644\u0635", "aş ş" # الص
111
- sub boundary + "\u0627\u0644\u0636", "aḑ ḑ" # الض
112
- sub boundary + "\u0627\u0644\u0637", "aţ ţ" # الط
110
+ sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "aş ş" # الص
111
+ sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "aḑ ḑ" # الض
112
+ sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "aţ ţ" # الط
113
113
 
114
114
  sub "\u062d\u0651", "ḩḩ" # ح
115
115
  sub "\u0635\u0651", "şş" # ص