interscript-maps 2.1.0b6 → 2.2.1

Sign up to get free protection for your applications and to get access to all the features.
Files changed (192)
  1. checksums.yaml +4 -4
  2. data/interscript-maps.gemspec +1 -1
  3. data/interscript-maps.yaml +300 -111
  4. data/maps/acadsin-zho-Hani-Latn-2002.imp +2 -2
  5. data/maps/alalc-amh-Ethi-Latn-1997.imp +18 -14
  6. data/maps/alalc-amh-Ethi-Latn-2011.imp +1 -1
  7. data/maps/alalc-ara-Arab-Latn-1997.imp +1 -1
  8. data/maps/alalc-asm-Deva-Latn-1997.imp +1 -1
  9. data/maps/alalc-asm-Deva-Latn-2012.imp +1 -1
  10. data/maps/alalc-aze-Arab-Latn-1997.imp +1 -1
  11. data/maps/alalc-aze-Cyrl-Latn-1997.imp +1 -1
  12. data/maps/alalc-bel-Cyrl-Latn-1997.imp +4 -4
  13. data/maps/alalc-ben-Beng-Latn-1997.imp +1 -1
  14. data/maps/alalc-ben-Beng-Latn-2017.imp +1 -1
  15. data/maps/alalc-bul-Cyrl-Latn-1997.imp +1 -1
  16. data/maps/alalc-div-Thaa-Latn-1997.imp +1 -1
  17. data/maps/alalc-ell-Grek-Latn-1997.imp +1 -1
  18. data/maps/alalc-ell-Grek-Latn-2010.imp +1 -1
  19. data/maps/alalc-guj-Gujr-Latn-1997.imp +1 -1
  20. data/maps/alalc-guj-Gujr-Latn-2011.imp +1 -1
  21. data/maps/alalc-hin-Deva-Latn-1997.imp +1 -1
  22. data/maps/alalc-hin-Deva-Latn-2011.imp +1 -1
  23. data/maps/alalc-kan-Kana-Latn-1997.imp +1 -1
  24. data/maps/alalc-kan-Kana-Latn-2011.imp +1 -1
  25. data/maps/alalc-kat-Geok-Latn-1997.imp +3 -3
  26. data/maps/alalc-kat-Geor-Latn-1997.imp +12 -12
  27. data/maps/alalc-kor-Hang-Latn-1997.imp +1 -1
  28. data/maps/alalc-mal-Mlym-Latn-1997.imp +1 -1
  29. data/maps/alalc-mar-Deva-Latn-1997.imp +1 -1
  30. data/maps/alalc-mar-Deva-Latn-2011.imp +1 -1
  31. data/maps/alalc-mkd-Cyrl-Latn-1997.imp +2 -2
  32. data/maps/alalc-mkd-Cyrl-Latn-2013.imp +2 -2
  33. data/maps/alalc-mon-Cyrl-Latn-1997.imp +3 -3
  34. data/maps/alalc-ori-Orya-Latn-1997.imp +1 -1
  35. data/maps/alalc-ori-Orya-Latn-2011.imp +1 -1
  36. data/maps/alalc-pan-Guru-Latn-1997.imp +1 -1
  37. data/maps/alalc-pan-Guru-Latn-2011.imp +1 -1
  38. data/maps/alalc-per-Arab-Latn-1997.imp +1 -1
  39. data/maps/alalc-pli-Deva-Latn-2012.imp +1 -1
  40. data/maps/alalc-pra-Deva-Latn-2012.imp +1 -1
  41. data/maps/alalc-rus-Cyrl-Latn-1997.imp +2 -2
  42. data/maps/alalc-rus-Cyrl-Latn-2012.imp +1 -1
  43. data/maps/alalc-san-Deva-Latn-2012.imp +1 -1
  44. data/maps/alalc-sin-Sinh-Latn-1997.imp +1 -1
  45. data/maps/alalc-sin-Sinh-Latn-2011.imp +1 -1
  46. data/maps/alalc-srp-Cyrl-Latn-1997.imp +2 -2
  47. data/maps/alalc-srp-Cyrl-Latn-2013.imp +1 -1
  48. data/maps/alalc-tam-Taml-Latn-1997.imp +1 -1
  49. data/maps/alalc-tam-Taml-Latn-2011.imp +1 -1
  50. data/maps/alalc-tel-Telu-Latn-1997.imp +2 -2
  51. data/maps/alalc-tel-Telu-Latn-2011.imp +1 -1
  52. data/maps/alalc-tir-Ethi-Latn-1997.imp +429 -0
  53. data/maps/alalc-tir-Ethi-Latn-2011.imp +85 -0
  54. data/maps/alalc-ukr-Cyrl-Latn-1997.imp +1 -1
  55. data/maps/alalc-ukr-Cyrl-Latn-2011.imp +1 -1
  56. data/maps/apcbg-bul-Cyrl-Latn-1995.imp +7 -4
  57. data/maps/az-aze-Cyrl-Latn-1939.imp +1 -0
  58. data/maps/az-aze-Cyrl-Latn-1958.imp +1 -0
  59. data/maps/bgn-jpn-Hrkt-Latn-1962.imp +5 -5
  60. data/maps/bgn-kor-Hang-Latn-1943.imp +1 -1
  61. data/maps/bgn-kor-Kore-Latn-1943.imp +1 -1
  62. data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +11 -11
  63. data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +1 -1
  64. data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +2 -2
  65. data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +2 -2
  66. data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +10 -4
  67. data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +1 -1
  68. data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +1 -1
  69. data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +4 -4
  70. data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +1 -1
  71. data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +1 -1
  72. data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +1 -1
  73. data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +4 -3
  74. data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +1 -1
  75. data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +1 -1
  76. data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +2 -2
  77. data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +1 -1
  78. data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +1 -1
  79. data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +8 -8
  80. data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +2 -2
  81. data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +4 -4
  82. data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +3 -3
  83. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +1 -1
  84. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +4 -4
  85. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +4 -3
  86. data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +1 -1
  87. data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +2 -2
  88. data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +1 -1
  89. data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +3 -3
  90. data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +4 -4
  91. data/maps/bgnpcgn-per-Arab-Latn-1958.imp +19 -19
  92. data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +15 -15
  93. data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +15 -15
  94. data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +16 -16
  95. data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +2 -2
  96. data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +5 -5
  97. data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +1 -1
  98. data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +1 -1
  99. data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +5 -3
  100. data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +1 -1
  101. data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +1 -1
  102. data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +1 -1
  103. data/maps/bgnpcgn-tir-Ethi-Latn-2007.imp +511 -0
  104. data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +1 -1
  105. data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +1 -1
  106. data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +15 -15
  107. data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +3 -3
  108. data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +1 -1
  109. data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +1 -1
  110. data/maps/by-bel-Cyrl-Latn-2007.imp +7 -5
  111. data/maps/dos-nep-Deva-Latn-1997.imp +2 -2
  112. data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +1 -1
  113. data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +1 -1
  114. data/maps/ggg-kat-Geor-Latn-2002.imp +3 -3
  115. data/maps/gki-bel-Cyrl-Latn-2000.imp +1 -1
  116. data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +1 -1
  117. data/maps/iso-ara-Arab-Latn-233-1984.imp +14 -14
  118. data/maps/iso-ben-Beng-Latn-15919-2001.imp +1 -1
  119. data/maps/iso-prs-Arab-Latn-233-3-1999.imp +14 -14
  120. data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +5 -5
  121. data/maps/mext-jpn-Hrkt-Latn-1954.imp +2 -1
  122. data/maps/moct-kor-Hang-Latn-2000.imp +1 -1
  123. data/maps/mofa-jpn-Hrkt-Latn-1989.imp +1 -1
  124. data/maps/mv-div-Thaa-Latn-1987.imp +1 -1
  125. data/maps/mvd-bel-Cyrl-Latn-2008.imp +5 -5
  126. data/maps/mvd-bel-Cyrl-Latn-2010.imp +2 -5
  127. data/maps/mvd-rus-Cyrl-Latn-2008.imp +4 -3
  128. data/maps/mvd-rus-Cyrl-Latn-2010.imp +2 -5
  129. data/maps/odni-ara-Arab-Latn-2004.imp +1 -1
  130. data/maps/odni-ara-Arab-Latn-2015.imp +1 -1
  131. data/maps/odni-aze-Cyrl-Latn-2015.imp +1 -1
  132. data/maps/odni-bel-Cyrl-Latn-2015.imp +1 -1
  133. data/maps/odni-bul-Cyrl-Latn-2005.imp +2 -2
  134. data/maps/odni-bul-Cyrl-Latn-2015.imp +1 -1
  135. data/maps/odni-che-Cyrl-Latn-2015.imp +1 -1
  136. data/maps/odni-fas-Arab-Latn-2004.imp +14 -14
  137. data/maps/odni-fas-Arab-Latn-2015.imp +15 -15
  138. data/maps/odni-hin-Deva-Latn-2004.imp +20 -20
  139. data/maps/odni-hin-Deva-Latn-2015.imp +25 -26
  140. data/maps/odni-kat-Geor-Latn-2015.imp +2 -3
  141. data/maps/odni-kaz-Cyrl-Latn-2015.imp +1 -1
  142. data/maps/odni-kir-Cyrl-Latn-2015.imp +1 -1
  143. data/maps/odni-kor-Hang-Latn-2015.imp +1 -1
  144. data/maps/odni-mkd-Cyrl-Latn-2005.imp +1 -1
  145. data/maps/odni-mkd-Cyrl-Latn-2015.imp +1 -1
  146. data/maps/odni-prs-Arab-Latn-2015.imp +1 -1
  147. data/maps/odni-pus-Arab-Latn-2011.imp +1 -1
  148. data/maps/odni-rus-Cyrl-Latn-2015.imp +1 -1
  149. data/maps/odni-srp-Cyrl-Latn-2005.imp +2 -2
  150. data/maps/odni-srp-Cyrl-Latn-2015.imp +8 -8
  151. data/maps/odni-tat-Cyrl-Latn-2015.imp +1 -1
  152. data/maps/odni-tgk-Cyrl-Latn-2015.imp +1 -1
  153. data/maps/odni-tuk-Cyrl-Latn-2015.imp +1 -1
  154. data/maps/odni-uig-Cyrl-Latn-2015.imp +1 -1
  155. data/maps/odni-ukr-Cyrl-Latn-2015.imp +1 -1
  156. data/maps/odni-urd-Arab-Latn-2015.imp +21 -21
  157. data/maps/odni-uzb-Cyrl-Latn-2015.imp +1 -1
  158. data/maps/ses-ara-Arab-Latn-1930.imp +14 -14
  159. data/maps/un-amh-Ethi-Latn-2016.imp +1 -1
  160. data/maps/un-ara-Arab-Latn-1971.imp +5 -5
  161. data/maps/un-ara-Arab-Latn-1972.imp +4 -4
  162. data/maps/un-ara-Arab-Latn-2017.imp +15 -15
  163. data/maps/un-asm-Beng-Latn-1972.imp +1 -1
  164. data/maps/un-bel-Cyrl-Latn-2007.imp +2 -2
  165. data/maps/un-ben-Beng-Latn-2016.imp +1 -1
  166. data/maps/un-bul-Cyrl-Latn-1977.imp +197 -0
  167. data/maps/un-ell-Grek-Latn-1987-phonetic.imp +5 -1
  168. data/maps/un-ell-Grek-Latn-1987-tl.imp +1 -1
  169. data/maps/un-ell-Grek-Latn-1987-ts.imp +2 -2
  170. data/maps/un-guj-Gujr-Latn-1972.imp +1 -1
  171. data/maps/un-hin-Deva-Latn-2016.imp +1 -1
  172. data/maps/un-kan-Kana-Latn-2016.imp +1 -1
  173. data/maps/un-mal-Mlym-Latn-1972.imp +1 -1
  174. data/maps/un-mar-Deva-Latn-2016.imp +1 -1
  175. data/maps/un-mkd-Cyrl-Latn-1977.imp +119 -0
  176. data/maps/un-mon-Mong-Latn-general-2013.imp +1 -1
  177. data/maps/un-mon-Mong-Latn-phonetic-2013.imp +1 -1
  178. data/maps/un-nep-Deva-Latn-1972.imp +1 -1
  179. data/maps/un-nep-Deva-Latn-2013.imp +1 -1
  180. data/maps/un-ori-Orya-Latn-1972.imp +1 -1
  181. data/maps/un-pan-Guru-Latn-1972.imp +1 -1
  182. data/maps/un-prs-Arab-Latn-1967.imp +15 -15
  183. data/maps/un-rus-Cyrl-Latn-1987.imp +1 -1
  184. data/maps/un-sin-Sinh-Latn-1972.imp +1 -1
  185. data/maps/un-srp-Cyrl-Latn-1997.imp +47 -0
  186. data/maps/un-tam-Taml-Latn-1972.imp +1 -1
  187. data/maps/un-tel-Telu-Latn-1972.imp +1 -1
  188. data/maps/un-ukr-Cyrl-Latn-1998.imp +1 -1
  189. data/maps/un-ukr-Cyrl-Latn-2012.imp +1 -1
  190. data/maps/un-urd-Arab-Latn-1972.imp +15 -15
  191. data/maps/var-amh-Ethi-Latn-eae-2003.imp +48 -43
  192. metadata +9 -3
@@ -4,7 +4,7 @@ metadata {
4
4
  language: ics-630-01:ara
5
5
  source_script: Arab
6
6
  destination_script: Latn
7
- name: Arabic Personal Names Office of the Director Of National Intelligence 2004 System
7
+ name: Intelligence Community (IC) Standard for the Transliteration of Arabic Personal Names (2004)
8
8
  url: https://github.com/interscript/interscript-private-references/blob/master/odni/Arabic_IC_Standard.doc
9
9
  creation_date: 2004
10
10
  confirmation_date: 2004-06
@@ -4,7 +4,7 @@ metadata {
4
4
  language: ics-630-01:ara
5
5
  source_script: Arab
6
6
  destination_script: Latn
7
- name: Office of the Director Of National Intelligence Arabic Personal Names 2015 System
7
+ name: Romanization of Arabic Personal Names (2015), ICS 630-01 Annex A
8
8
  url: https://github.com/interscript/ics-630-01/blob/master/reference-docs/ANNEX%20A%20-%20Arabic_Personal_Names_FLTS%20(U).pdf
9
9
  creation_date: 2017
10
10
  confirmation_date: 2018-06
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:aze
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: Standards for the transliteration of azeri personal names in written reports and products
7
+ name: Romanization of Azeri Personal Names (2015), ICS 630-01 Annex P
8
8
  source: ICS-630-01 Annex P
9
9
  creation_date: 2015
10
10
  confirmation_date: 2015
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:bel
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: Office of the Director Of National Intelligence Belarusian Personal Names 2015, ICS 630-01 Annex B
7
+ name: Romanization of Belarusian Personal Names (2015), ICS 630-01 Annex B
8
8
 
9
9
  # url:
10
10
  source: ICS 630-01, Annex B
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:bul
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: Intelligence Community (IC) Standard for the Transliteration of Bulgarian Personal Names
7
+ name: Intelligence Community (IC) Standard for the Transliteration of Bulgarian Personal Names (2005)
8
8
  creation_date: 2005
9
9
  description:
10
10
  }
@@ -53,7 +53,7 @@ stage {
53
53
  sub "\u042c", "Y"
54
54
  sub "\u042e", "Yu"
55
55
  sub "\u042f", "Ya"
56
-
56
+
57
57
  sub "\u0430", "a"
58
58
  sub "\u0431", "b"
59
59
  sub "\u0432", "v"
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:bul
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: Office of the Director Of National Intelligence Bulgarian Personal Names 2015, ICS-630-01 Annex O
7
+ name: Romanization of Bulgarian Personal Names (2015), ICS-630-01 Annex O
8
8
 
9
9
  # url:
10
10
  source: ICS-630-01 Annex O
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:che
5
5
  source_script: Cyrl
6
6
  destination_script: Latn
7
- name: Office of the Director Of National Intelligence -- ICS 630-01 -- Chechen Cyrillic 2015
7
+ name: Romanization of Chechen Cyrillic Personal Names (2015)
8
8
  url: https://github.com/interscript/ics-630-01/blob/master/reference-docs/ANNEX%20C%20-%20Chechen_Personal_Names_FLTS%20(U).pdf
9
9
  source: ICS-630-01 Annex C
10
10
  creation_date: 2015
@@ -140,20 +140,20 @@ stage {
140
140
  # '\uFE8E' : '' # ﺎ
141
141
 
142
142
  # Sun letters
143
- sub boundary + "\u0627\u0644\u062a", "at t" # الت
144
- sub boundary + "\u0627\u0644\u062b", "as s" # الث
145
- sub boundary + "\u0627\u0644\u062f", "ad d" # الد
146
- sub boundary + "\u0627\u0644\u0630", "az z" # الذ
147
- sub boundary + "\u0627\u0644\u0631", "ar r" # الر
148
- sub boundary + "\u0627\u0644\u0632", "az z" # الز
149
- sub boundary + "\u0627\u0644\u0633", "as s" # الس
150
- sub boundary + "\u0627\u0644\u0634", "ash sh" # الش
151
- sub boundary + "\u0627\u0644\u0635", "as s" # الص
152
- sub boundary + "\u0627\u0644\u0636", "az z" # الض
153
- sub boundary + "\u0627\u0644\u0637", "at t" # الط
154
- sub boundary + "\u0627\u0644\u0638", "az z" # الظ
155
- sub boundary + "\u0627\u0644\u0644", "al l" # الل
156
- sub boundary + "\u0627\u0644\u0646", "an n" # الن
143
+ sub boundary + "\u0627\u0644\u062a" + maybe("\u0651"), "at t" # الت
144
+ sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), "as s" # الث
145
+ sub boundary + "\u0627\u0644\u062f" + maybe("\u0651"), "ad d" # الد
146
+ sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), "az z" # الذ
147
+ sub boundary + "\u0627\u0644\u0631" + maybe("\u0651"), "ar r" # الر
148
+ sub boundary + "\u0627\u0644\u0632" + maybe("\u0651"), "az z" # الز
149
+ sub boundary + "\u0627\u0644\u0633" + maybe("\u0651"), "as s" # الس
150
+ sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "ash sh" # الش
151
+ sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "as s" # الص
152
+ sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "az z" # الض
153
+ sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "at t" # الط
154
+ sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), "az z" # الظ
155
+ sub boundary + "\u0627\u0644\u0644" + maybe("\u0651"), "al l" # الل
156
+ sub boundary + "\u0627\u0644\u0646" + maybe("\u0651"), "an n" # الن
157
157
 
158
158
  # Farsi Vowel (Pointing)
159
159
  sub "\u0622", "a" # آ alef maddeh
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:fas
5
5
  source_script: Arab
6
6
  destination_script: Latn
7
- name: ODNI Persian Farsi Dari Personal Names 2015 System, ICS-630-01 Annex J
7
+ name: Romanization of Persian Farsi Dari Personal Names (2015), ICS-630-01 Annex J
8
8
  url: https://github.com/interscript/ics-630-01/blob/master/reference-docs/ANNEX%20J%20-%20Persian-Farsi_Dari_Personal_Names_FLTS_2018_Revision%20(U).pdf
9
9
  creation_date: 2015
10
10
  confirmation_date: 2015-11
@@ -257,20 +257,20 @@ stage {
257
257
  # '\uFE8E' : '' # ﺎ
258
258
 
259
259
  # Sun letters
260
- sub boundary + "\u0627\u0644\u062a", "at t" # الت
261
- sub boundary + "\u0627\u0644\u062b", "as s" # الث
262
- sub boundary + "\u0627\u0644\u062f", "ad d" # الد
263
- sub boundary + "\u0627\u0644\u0630", "az z" # الذ
264
- sub boundary + "\u0627\u0644\u0631", "ar r" # الر
265
- sub boundary + "\u0627\u0644\u0632", "az z" # الز
266
- sub boundary + "\u0627\u0644\u0633", "as s" # الس
267
- sub boundary + "\u0627\u0644\u0634", "ash sh" # الش
268
- sub boundary + "\u0627\u0644\u0635", "as s" # الص
269
- sub boundary + "\u0627\u0644\u0636", "az z" # الض
270
- sub boundary + "\u0627\u0644\u0637", "at t" # الط
271
- sub boundary + "\u0627\u0644\u0638", "az z" # الظ
272
- sub boundary + "\u0627\u0644\u0644", "al l" # الل
273
- sub boundary + "\u0627\u0644\u0646", "an n" # الن
260
+ sub boundary + "\u0627\u0644\u062a" + maybe("\u0651"), "at t" # الت
261
+ sub boundary + "\u0627\u0644\u062b" + maybe("\u0651"), "as s" # الث
262
+ sub boundary + "\u0627\u0644\u062f" + maybe("\u0651"), "ad d" # الد
263
+ sub boundary + "\u0627\u0644\u0630" + maybe("\u0651"), "az z" # الذ
264
+ sub boundary + "\u0627\u0644\u0631" + maybe("\u0651"), "ar r" # الر
265
+ sub boundary + "\u0627\u0644\u0632" + maybe("\u0651"), "az z" # الز
266
+ sub boundary + "\u0627\u0644\u0633" + maybe("\u0651"), "as s" # الس
267
+ sub boundary + "\u0627\u0644\u0634" + maybe("\u0651"), "ash sh" # الش
268
+ sub boundary + "\u0627\u0644\u0635" + maybe("\u0651"), "as s" # الص
269
+ sub boundary + "\u0627\u0644\u0636" + maybe("\u0651"), "az z" # الض
270
+ sub boundary + "\u0627\u0644\u0637" + maybe("\u0651"), "at t" # الط
271
+ sub boundary + "\u0627\u0644\u0638" + maybe("\u0651"), "az z" # الظ
272
+ sub boundary + "\u0627\u0644\u0644" + maybe("\u0651"), "al l" # الل
273
+ sub boundary + "\u0627\u0644\u0646" + maybe("\u0651"), "an n" # الن
274
274
 
275
275
  # Farsi Vowel (Pointing)
276
276
  sub "\u0622", "a" # آ alef maddeh
@@ -4,12 +4,12 @@ metadata {
4
4
  language: iso-639-2:hin
5
5
  source_script: Deva
6
6
  destination_script: Latn
7
- name: IC STANDARDS FOR TRANSLITERATION OF HINDI AND URDU PERSONAL NAMES
7
+ name: Intelligence Community (IC) Standard for the Transliteration of Hindi and Urdu Personal Names (2004)
8
8
  url: https://github.com/interscript/interscript-private-references/blob/master/odni/Hindi_and_Urdu_IC_Standard.doc
9
9
  creation_date: 2004
10
10
  description: |
11
11
  IC STANDARDS FOR TRANSLITERATION OF HINDI AND URDU PERSONAL NAMES
12
-
12
+
13
13
  notes:
14
14
  - |
15
15
  Long/Short Vowels: Long and short vowels are not distinguished in the system:
@@ -69,7 +69,7 @@ stage {
69
69
 
70
70
  # CHARACTERS
71
71
  parallel {
72
-
72
+
73
73
  #Independent vowel characters
74
74
  sub "अ", "a"
75
75
  sub "आ", "a"
@@ -84,7 +84,7 @@ stage {
84
84
  sub "ओ", "o"
85
85
  sub "ऑ", "au"
86
86
  sub "औ", "au"
87
-
87
+
88
88
  #Dependent Vowels
89
89
  sub "ा", "a"
90
90
  sub "ि", "i"
@@ -98,10 +98,10 @@ stage {
98
98
  sub "ो", "o"
99
99
  sub "ौ", "au"
100
100
  sub "ॉ", "au"
101
-
102
-
101
+
102
+
103
103
  # Consonants
104
-
104
+
105
105
  # Gutturals
106
106
  sub "क", "k"
107
107
  sub "क्ष", "ksha"
@@ -112,7 +112,7 @@ stage {
112
112
  sub "ग़", "gh"
113
113
  sub "घ", "gh"
114
114
  sub "ङ", "n"
115
-
115
+
116
116
  # Palatals
117
117
  sub "च", "ch"
118
118
  sub "छ", "ch"
@@ -121,7 +121,7 @@ stage {
121
121
  sub "झ", "gya"
122
122
  sub "झ", "jh"
123
123
  sub "ञ", "n"
124
-
124
+
125
125
  # Cerebrals
126
126
  sub "ट", "t"
127
127
  sub "ठ", "th"
@@ -130,14 +130,14 @@ stage {
130
130
  sub "ढ़", "rh"
131
131
  sub "ढ", "dh"
132
132
  sub "ण", "n"
133
-
133
+
134
134
  # Dentals
135
135
  sub "त", "t"
136
136
  sub "थ", "th"
137
137
  sub "द", "d"
138
138
  sub "ध", "dh"
139
139
  sub "न", "n"
140
-
140
+
141
141
  # Labials
142
142
  sub "प", "p"
143
143
  sub "फ़", "f"
@@ -145,34 +145,34 @@ stage {
145
145
  sub "ब", "b"
146
146
  sub "भ", "bh"
147
147
  sub "म", "m"
148
-
148
+
149
149
  # Semivowels
150
150
  sub "य", "y"
151
151
  sub "र", "r"
152
152
  sub "ल", "l"
153
153
  sub "व", "v"
154
-
154
+
155
155
  # Sibilants
156
156
  sub "श", "sh"
157
157
  sub "ष", "sh"
158
158
  sub "स", "s"
159
-
160
-
159
+
160
+
161
161
  # Aspirate
162
162
  sub "ह", "h"
163
-
163
+
164
164
  # Anusvāra
165
165
  sub "ं", "n"
166
-
166
+
167
167
  # Anunāsika
168
168
  sub "ँ", "n"
169
-
169
+
170
170
  # halanta
171
171
  sub "्", ""
172
-
172
+
173
173
  # bisharga
174
174
  sub "ः", "h"
175
-
175
+
176
176
  sub "़", ""
177
177
  }
178
178
 
@@ -4,8 +4,7 @@ metadata {
4
4
  language: iso-639-2:hin
5
5
  source_script: Deva
6
6
  destination_script: Latn
7
- name: Office of the Director Of National Intelligence Hindi Urdu Personal Names 2015 System, ICS-630-01 Annex F
8
-
7
+ name: Romanization of Hindi Urdu Personal Names (2015), ICS-630-01 Annex F
9
8
  #url:
10
9
  creation_date: 2015
11
10
  confirmation_date: 2015
@@ -16,7 +15,7 @@ metadata {
16
15
  forensic information. Rather, it is to provide an IC standard Romanized (English)
17
16
  transliteration from standard Hindi and Urdu that can then be linked to forensic
18
17
  information in ways that will help identify the referent of the name.
19
-
18
+
20
19
  There are typically a number of ways that names can be Romanized from either
21
20
  Devanagari (Hindi) or modified Arabic (Urdu) scripts. Ambiguities can result from the
22
21
  Romanization of Hindi and Urdu names for several reasons, including the fact that some
@@ -31,7 +30,7 @@ metadata {
31
30
  And, as in the Arabic source, names containing the Arabic definite article ‘al’ (‘ul’) show
32
31
  anticipatory assimilation in pronunciation (e.g., Shams al Din > Shamsuddin);
33
32
  transliterations may either reflect spelling or pronunciation in such cases.
34
-
33
+
35
34
  Because Hindi and Urdu overlap so extensively, it is desirable to correlate Hindi and
36
35
  Urdu transliterations as much as possible. In the area of names, this can become
37
36
  problematic when the Urdu spelling accurately reflects original Arabic spelling while the
@@ -40,7 +39,7 @@ metadata {
40
39
  either Urdu or Hindi (e.g., letter sin versus letter sad) while maintaining Arabic/Urdu
41
40
  spelling distinctions like Hindi also maintains (e.g., qaf as in Qutubbin versus kaf)).
42
41
  However, this is not always possible (see Hindi va versus Urdu wau).
43
-
42
+
44
43
  In cases where an individual’s name has already been transliterated, that is to be indicated
45
44
  – as found – in parentheses immediately following its rendition in the transliteration
46
45
  standard (e.g., Muhammad Khulud (Mohamed Khulood)). In addition, if the original
@@ -48,14 +47,14 @@ metadata {
48
47
  parentheses following the name, if possible, following best practices of the issuing
49
48
  organization and taking into consideration information system capabilities. This
50
49
  convention is designed to ensure that vital forensic information is not lost.
51
-
50
+
52
51
  For names of persons who are known to not be part of the Hindi- or Urdu-speaking
53
52
  community, use the relevant IC transliteration standard for names from that language
54
53
  (e.g., Mikhail, Yitzhak). A translator’s note may be used to clarify the known origin of
55
54
  the person. Spell names of individuals from languages that are written in Roman letters as
56
55
  they are spelled in those languages (e.g., George Clooney, Jorge Garcia, Georges
57
56
  Pompidou).
58
-
57
+
59
58
  In the case of active senior government officials in the on-line CIA World Factbook and
60
59
  the on-line directory of Chiefs of State and Cabinet Members of Foreign Governments,
61
60
  the spellings given in these on-line reference works should be used in place of the IC
@@ -64,7 +63,7 @@ metadata {
64
63
  government official), the IC Standard spelling should appear first, with the spelling, if
65
64
  known, as it previously appeared in those resources listed within parentheses at the first
66
65
  usage.
67
-
66
+
68
67
  The primary goal of this system is to produce a consistent Romanized transcription of the
69
68
  name that is readable to the non-specialist. The system uses the 26 letters of the standard
70
69
  (English) Roman alphabet. Some ambiguities in the Romanized form will occur without
@@ -72,16 +71,16 @@ metadata {
72
71
  information about the individual is provided, the referent will be clearly identified.
73
72
  Additionally, this system will be used in conjunction with on-line tools, name dictionaries
74
73
  and lists containing conventional spellings of names of well-known individuals
75
-
74
+
76
75
  notes:
77
-
76
+
78
77
  - |
79
78
  Long/Short Vowels: Long and short vowels are not distinguished in the system:
80
79
  The borrowed Arabic name Samir could represent two distinct names, one with a
81
80
  long /a/ (Saamir) and one with a long /i/ (Samiir). One solution would be to use
82
81
  /ee/ to stand for the long /i/, as is often done (Sameer). The IC Standard will not
83
82
  distinguish between these.
84
-
83
+
85
84
  - |
86
85
  No distinction is made between: retroflex and non-retroflex consonants; and
87
86
  nasalized vowels and vowels followed by /n/.
@@ -151,9 +150,9 @@ stage {
151
150
 
152
151
  # CHARACTERS
153
152
  parallel {
154
-
153
+
155
154
  # I. Vowels and Diphthongs (see Note 1)
156
-
155
+
157
156
  sub "अ", "a"
158
157
  sub "आ", "a"
159
158
  sub "इ", "i"
@@ -165,7 +164,7 @@ stage {
165
164
  sub "ऐ", "ai"
166
165
  sub "ऑ", "o"
167
166
  sub "ओ", "au"
168
-
167
+
169
168
  # II. Consonants (see Note 2)
170
169
  # Gutturals
171
170
  sub "क", "k"
@@ -177,7 +176,7 @@ stage {
177
176
  sub "घ", "gh"
178
177
  sub "ग़", "gh"
179
178
  sub "ङ", "n"
180
-
179
+
181
180
  # Palatals
182
181
  sub "च", "ch"
183
182
  sub "छ", "ch"
@@ -185,7 +184,7 @@ stage {
185
184
  sub "झ", "jh"
186
185
  sub "ज़", "z"
187
186
  sub "ञ", "n"
188
-
187
+
189
188
  # Cerebrals
190
189
  sub "ट", "t"
191
190
  sub "ठ", "th"
@@ -194,14 +193,14 @@ stage {
194
193
  sub "ढ", "dh"
195
194
  sub "ढ़", "rh"
196
195
  sub "ण", "n"
197
-
196
+
198
197
  # Dentals
199
198
  sub "त", "t"
200
199
  sub "थ", "th"
201
200
  sub "द", "d"
202
201
  sub "ध", "dh"
203
202
  sub "न", "n"
204
-
203
+
205
204
  # Labials
206
205
  sub "प", "p"
207
206
  sub "फ", "ph"
@@ -209,33 +208,33 @@ stage {
209
208
  sub "ब", "b"
210
209
  sub "भ", "bh"
211
210
  sub "म", "m"
212
-
211
+
213
212
  # Semivowels
214
213
  sub "य", "y"
215
214
  sub "र", "r"
216
215
  sub "ल", "l"
217
216
  sub "व", "v"
218
-
217
+
219
218
  # Sibilants
220
219
  sub "श", "sh"
221
220
  sub "ष", "sh"
222
221
  sub "स", "s"
223
-
222
+
224
223
  # Aspirate
225
224
  sub "ह", "h"
226
-
225
+
227
226
  # Anusvāra
228
227
  sub "ं", "n"
229
-
228
+
230
229
  # Bisarga
231
230
  sub "ः ", "h"
232
-
231
+
233
232
  # Anunāsika
234
233
  sub "ँ", "n"
235
-
234
+
236
235
  sub "़", ""
237
236
  sub "्", ""
238
-
237
+
239
238
  # Medials # Needed for connecting constants
240
239
  sub "ा", "a"
241
240
  sub "ि", "i"