interscript-maps 2.0.5
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +7 -0
- data/README.adoc +28 -0
- data/interscript-maps.gemspec +28 -0
- data/interscript-maps.yaml +235 -0
- data/libs/posix.iml +11 -0
- data/libs/unicode.iml +13 -0
- data/libs/var-Cyrl.iml +7 -0
- data/libs/var-kor.iml +17 -0
- data/maps-staging/royin-tha-Thai-Latn-1939-generic.imp +98 -0
- data/maps-staging/royin-tha-Thai-Latn-1968.imp +156 -0
- data/maps-staging/royin-tha-Thai-Latn-1999-chained.imp +161 -0
- data/maps-staging/royin-tha-Thai-Latn-1999.imp +78 -0
- data/maps-staging/var-tha-Thai-Thai-phonemic.imp +53 -0
- data/maps-staging/var-tha-Thai-Zsym-ipa.imp +273 -0
- data/maps/acadsin-zho-Hani-Latn-2002.imp +27515 -0
- data/maps/alalc-amh-Ethi-Latn-1997.imp +392 -0
- data/maps/alalc-amh-Ethi-Latn-2011.imp +85 -0
- data/maps/alalc-ara-Arab-Latn-1997.imp +1171 -0
- data/maps/alalc-asm-Deva-Latn-1997.imp +214 -0
- data/maps/alalc-asm-Deva-Latn-2012.imp +53 -0
- data/maps/alalc-aze-Arab-Latn-1997.imp +321 -0
- data/maps/alalc-aze-Cyrl-Latn-1997.imp +101 -0
- data/maps/alalc-bel-Cyrl-Latn-1997.imp +118 -0
- data/maps/alalc-ben-Beng-Latn-1997.imp +225 -0
- data/maps/alalc-ben-Beng-Latn-2017.imp +135 -0
- data/maps/alalc-bul-Cyrl-Latn-1997.imp +110 -0
- data/maps/alalc-div-Thaa-Latn-1997.imp +171 -0
- data/maps/alalc-ell-Grek-Latn-1997.imp +381 -0
- data/maps/alalc-ell-Grek-Latn-2010.imp +382 -0
- data/maps/alalc-guj-Gujr-Latn-1997.imp +223 -0
- data/maps/alalc-guj-Gujr-Latn-2011.imp +57 -0
- data/maps/alalc-hin-Deva-Latn-1997.imp +248 -0
- data/maps/alalc-hin-Deva-Latn-2011.imp +63 -0
- data/maps/alalc-kan-Kana-Latn-1997.imp +233 -0
- data/maps/alalc-kan-Kana-Latn-2011.imp +58 -0
- data/maps/alalc-kat-Geok-Latn-1997.imp +109 -0
- data/maps/alalc-kat-Geor-Latn-1997.imp +104 -0
- data/maps/alalc-kor-Hang-Latn-1997.imp +68 -0
- data/maps/alalc-mal-Mlym-Latn-1997.imp +260 -0
- data/maps/alalc-mal-Mlym-Latn-2012.imp +65 -0
- data/maps/alalc-mar-Deva-Latn-1997.imp +178 -0
- data/maps/alalc-mar-Deva-Latn-2011.imp +51 -0
- data/maps/alalc-mkd-Cyrl-Latn-1997.imp +125 -0
- data/maps/alalc-mkd-Cyrl-Latn-2013.imp +113 -0
- data/maps/alalc-mon-Cyrl-Latn-1997.imp +161 -0
- data/maps/alalc-ori-Orya-Latn-1997.imp +234 -0
- data/maps/alalc-ori-Orya-Latn-2011.imp +59 -0
- data/maps/alalc-pan-Guru-Latn-1997.imp +241 -0
- data/maps/alalc-pan-Guru-Latn-2011.imp +71 -0
- data/maps/alalc-per-Arab-Latn-1997.imp +318 -0
- data/maps/alalc-pli-Deva-Latn-2012.imp +140 -0
- data/maps/alalc-pra-Deva-Latn-2012.imp +52 -0
- data/maps/alalc-rus-Cyrl-Latn-1997.imp +165 -0
- data/maps/alalc-rus-Cyrl-Latn-2012.imp +107 -0
- data/maps/alalc-san-Deva-Latn-2012.imp +207 -0
- data/maps/alalc-sin-Sinh-Latn-1997.imp +246 -0
- data/maps/alalc-sin-Sinh-Latn-2011.imp +63 -0
- data/maps/alalc-srp-Cyrl-Latn-1997.imp +124 -0
- data/maps/alalc-srp-Cyrl-Latn-2013.imp +115 -0
- data/maps/alalc-tam-Taml-Latn-1997.imp +52 -0
- data/maps/alalc-tam-Taml-Latn-2011.imp +49 -0
- data/maps/alalc-tel-Telu-Latn-1997.imp +237 -0
- data/maps/alalc-tel-Telu-Latn-2011.imp +58 -0
- data/maps/alalc-ukr-Cyrl-Latn-1997.imp +123 -0
- data/maps/alalc-ukr-Cyrl-Latn-2011.imp +32 -0
- data/maps/apcbg-bul-Cyrl-Latn-1995.imp +194 -0
- data/maps/az-aze-Cyrl-Latn-1939.imp +105 -0
- data/maps/az-aze-Cyrl-Latn-1958.imp +50 -0
- data/maps/bas-rus-Cyrl-Latn-2017-bss.imp +160 -0
- data/maps/bas-rus-Cyrl-Latn-2017-oss.imp +165 -0
- data/maps/bgn-jpn-Hrkt-Latn-1962.imp +288 -0
- data/maps/bgn-kor-Hang-Latn-1943.imp +31 -0
- data/maps/bgn-kor-Kore-Latn-1943.imp +33 -0
- data/maps/bgna-bul-Cyrl-Latn-2006.imp +119 -0
- data/maps/bgna-bul-Cyrl-Latn-2009.imp +119 -0
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +393 -0
- data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +472 -0
- data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +125 -0
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +111 -0
- data/maps/bgnpcgn-bak-Cyrl-Latn-2007.imp +169 -0
- data/maps/bgnpcgn-bal-Arab-Latn-2008.imp +296 -0
- data/maps/bgnpcgn-bel-Cyrl-Latn-1979.imp +200 -0
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +137 -0
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +38 -0
- data/maps/bgnpcgn-che-Cyrl-Latn-2008.imp +176 -0
- data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +56 -0
- data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +90 -0
- data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +71 -0
- data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +443 -0
- data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +269 -0
- data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +41 -0
- data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +28 -0
- data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +111 -0
- data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +42 -0
- data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +32 -0
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +191 -0
- data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +116 -0
- data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +43 -0
- data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +193 -0
- data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +170 -0
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +177 -0
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +40 -0
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +41 -0
- data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +240 -0
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +132 -0
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +174 -0
- data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +168 -0
- data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +208 -0
- data/maps/bgnpcgn-per-Arab-Latn-1958.imp +312 -0
- data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +552 -0
- data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +445 -0
- data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +289 -0
- data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +165 -0
- data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +133 -0
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +195 -0
- data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +48 -0
- data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +55 -0
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +146 -0
- data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +185 -0
- data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +188 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +136 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +88 -0
- data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +333 -0
- data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +145 -0
- data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +74 -0
- data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +7463 -0
- data/maps/bis-asm-Beng-Latn-13194-1991.imp +154 -0
- data/maps/bis-ben-Beng-Latn-13194-1991.imp +151 -0
- data/maps/bis-dev-Deva-Latn-13194-1991.imp +178 -0
- data/maps/bis-guj-Gujr-Latn-13194-1991.imp +172 -0
- data/maps/bis-kan-Kana-Latn-13194-1991.imp +166 -0
- data/maps/bis-mlm-Mlym-Latn-13194-1991.imp +170 -0
- data/maps/bis-ori-Orya-Latn-13194-1991.imp +168 -0
- data/maps/bis-pnj-Guru-Latn-13194-1991.imp +169 -0
- data/maps/bis-tel-Telu-Latn-13194-1991.imp +165 -0
- data/maps/bis-tml-Taml-Latn-13194-1991.imp +149 -0
- data/maps/by-bel-Cyrl-Latn-1998.imp +123 -0
- data/maps/by-bel-Cyrl-Latn-2007.imp +77 -0
- data/maps/din-grc-Grek-Latn-31634-2011-t1.imp +627 -0
- data/maps/din-hin-Deva-Latn-33904-2018.imp +101 -0
- data/maps/din-kat-Geor-Latn-32707-2010.imp +103 -0
- data/maps/din-mar-Deva-Latn-33904-2018.imp +83 -0
- data/maps/din-nep-Deva-Latn-33904-2018.imp +110 -0
- data/maps/din-pli-Deva-Latn-33904-2018.imp +72 -0
- data/maps/din-pra-Deva-Latn-33904-2018.imp +66 -0
- data/maps/din-san-Deva-Latn-33904-2018.imp +294 -0
- data/maps/din-tam-Taml-Latn-33903-2016.imp +187 -0
- data/maps/dos-nep-Deva-Latn-1997.imp +47 -0
- data/maps/elot-ell-Grek-Latn-743-1982-tl.imp +399 -0
- data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +397 -0
- data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +34 -0
- data/maps/elot-ell-Grek-Latn-743-2001-ts.imp +178 -0
- data/maps/ggg-kat-Geor-Latn-2002.imp +75 -0
- data/maps/gki-bel-Cyrl-Latn-1992.imp +44 -0
- data/maps/gki-bel-Cyrl-Latn-2000.imp +159 -0
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +179 -0
- data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.imp +132 -0
- data/maps/hk-yue-Hani-Latn-1888.imp +29201 -0
- data/maps/icao-bel-Cyrl-Latn-9303.imp +136 -0
- data/maps/icao-bul-Cyrl-Latn-9303.imp +127 -0
- data/maps/icao-fas-Arab-Latn-9303.imp +112 -0
- data/maps/icao-heb-Hebr-Latn-9303.imp +160 -0
- data/maps/icao-mkd-Cyrl-Latn-9303.imp +126 -0
- data/maps/icao-rus-Cyrl-Latn-9303.imp +126 -0
- data/maps/icao-srp-Cyrl-Latn-9303.imp +126 -0
- data/maps/icao-ukr-Cyrl-Latn-9303.imp +127 -0
- data/maps/iso-ara-Arab-Latn-233-1984.imp +301 -0
- data/maps/iso-asm-Beng-Latn-15919-2001.imp +73 -0
- data/maps/iso-ben-Beng-Latn-15919-2001.imp +171 -0
- data/maps/iso-ell-Grek-Latn-843-1997-t1.imp +365 -0
- data/maps/iso-ell-Grek-Latn-843-1997-t2.imp +43 -0
- data/maps/iso-guj-Gujr-Latn-15919-2001.imp +214 -0
- data/maps/iso-hin-Deva-Latn-15919-2001.imp +73 -0
- data/maps/iso-inc-Deva-Latn-15919-2001.imp +61 -0
- data/maps/iso-jpn-Hrkt-Latn-3602-1989.imp +59 -0
- data/maps/iso-kan-Kana-Latn-15919-2001.imp +212 -0
- data/maps/iso-kat-Geor-Latn-9984-1996.imp +103 -0
- data/maps/iso-kor-Hang-Latn-1996-method1.imp +140 -0
- data/maps/iso-kor-Hang-Latn-1996-method2.imp +132 -0
- data/maps/iso-mal-Mlym-Latn-15919-2001.imp +276 -0
- data/maps/iso-mar-Deva-Latn-15919-2001.imp +68 -0
- data/maps/iso-nep-Deva-Latn-15919-2001.imp +75 -0
- data/maps/iso-ori-Orya-Latn-15919-2001.imp +188 -0
- data/maps/iso-pan-Guru-Latn-15919-2001.imp +217 -0
- data/maps/iso-pli-Beng-Latn-15919-2001.imp +66 -0
- data/maps/iso-pli-Deva-Latn-15919-2001.imp +68 -0
- data/maps/iso-pli-Sinh-Latn-15919-2001.imp +211 -0
- data/maps/iso-pli-Thai-Latn-15919-2001.imp +47 -0
- data/maps/iso-pra-Deva-Latn-15919-2001.imp +60 -0
- data/maps/iso-prs-Arab-Latn-233-3-1999.imp +352 -0
- data/maps/iso-rus-Cyrl-Latn-9-1995.imp +279 -0
- data/maps/iso-san-Deva-Latn-15919-2001.imp +215 -0
- data/maps/iso-tam-Taml-Latn-15919-2001.imp +153 -0
- data/maps/iso-tel-Telu-Latn-15919-2001.imp +214 -0
- data/maps/iso-tha-Thai-Latn-11940-1998.imp +114 -0
- data/maps/kp-kor-Hang-Latn-2002.imp +540 -0
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +29005 -0
- data/maps/masm-mon-Cyrl-Latn-5217-2012.imp +136 -0
- data/maps/masm-mon-Latn-Cyrl-5217-2012.imp +162 -0
- data/maps/mext-jpn-Hrkt-Latn-1954.imp +403 -0
- data/maps/moct-kor-Hang-Latn-2000.imp +475 -0
- data/maps/mofa-jpn-Hrkt-Latn-1989.imp +484 -0
- data/maps/mv-div-Thaa-Latn-1987.imp +144 -0
- data/maps/mvd-bel-Cyrl-Latn-2008.imp +224 -0
- data/maps/mvd-bel-Cyrl-Latn-2010.imp +64 -0
- data/maps/mvd-rus-Cyrl-Latn-2008.imp +110 -0
- data/maps/mvd-rus-Cyrl-Latn-2010.imp +40 -0
- data/maps/odni-ara-Arab-Latn-2004.imp +106 -0
- data/maps/odni-ara-Arab-Latn-2015.imp +281 -0
- data/maps/odni-aze-Cyrl-Latn-2015.imp +158 -0
- data/maps/odni-bel-Cyrl-Latn-2015.imp +138 -0
- data/maps/odni-bul-Cyrl-Latn-2005.imp +90 -0
- data/maps/odni-bul-Cyrl-Latn-2015.imp +103 -0
- data/maps/odni-che-Cyrl-Latn-2015.imp +165 -0
- data/maps/odni-fas-Arab-Latn-2004.imp +268 -0
- data/maps/odni-fas-Arab-Latn-2015.imp +398 -0
- data/maps/odni-hin-Deva-Latn-2004.imp +180 -0
- data/maps/odni-hin-Deva-Latn-2015.imp +256 -0
- data/maps/odni-kat-Geor-Latn-2015.imp +76 -0
- data/maps/odni-kaz-Cyrl-Latn-2015.imp +164 -0
- data/maps/odni-kir-Cyrl-Latn-2015.imp +149 -0
- data/maps/odni-kor-Hang-Latn-2015.imp +307 -0
- data/maps/odni-mkd-Cyrl-Latn-2005.imp +28 -0
- data/maps/odni-mkd-Cyrl-Latn-2015.imp +124 -0
- data/maps/odni-prs-Arab-Latn-2004.imp +120 -0
- data/maps/odni-prs-Arab-Latn-2015.imp +225 -0
- data/maps/odni-pus-Arab-Latn-2011.imp +327 -0
- data/maps/odni-rus-Cyrl-Latn-2015.imp +79 -0
- data/maps/odni-srp-Cyrl-Latn-2005.imp +35 -0
- data/maps/odni-srp-Cyrl-Latn-2015.imp +130 -0
- data/maps/odni-tat-Cyrl-Latn-2015.imp +157 -0
- data/maps/odni-tgk-Cyrl-Latn-2015.imp +161 -0
- data/maps/odni-tuk-Cyrl-Latn-2015.imp +159 -0
- data/maps/odni-uig-Cyrl-Latn-2015.imp +151 -0
- data/maps/odni-ukr-Cyrl-Latn-2015.imp +136 -0
- data/maps/odni-urd-Arab-Latn-2015.imp +220 -0
- data/maps/odni-uzb-Cyrl-Latn-2015.imp +165 -0
- data/maps/sac-zho-Hans-Latn-1979.imp +20940 -0
- data/maps/sasm-mon-Mong-Latn-general-1978.imp +294 -0
- data/maps/sasm-mon-Mong-Latn-phonetic-1978.imp +261 -0
- data/maps/ses-ara-Arab-Latn-1930.imp +225 -0
- data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.imp +171 -0
- data/maps/ua-ukr-Cyrl-Latn-1996.imp +149 -0
- data/maps/ua-ukr-Cyrl-Latn-2007.imp +69 -0
- data/maps/ua-ukr-Cyrl-Latn-2010.imp +128 -0
- data/maps/un-amh-Ethi-Latn-2016.imp +483 -0
- data/maps/un-ara-Arab-Latn-1971.imp +137 -0
- data/maps/un-ara-Arab-Latn-1972.imp +155 -0
- data/maps/un-ara-Arab-Latn-2017.imp +375 -0
- data/maps/un-asm-Beng-Latn-1972.imp +188 -0
- data/maps/un-bel-Cyrl-Latn-2007.imp +78 -0
- data/maps/un-ben-Beng-Latn-2016.imp +516 -0
- data/maps/un-ell-Grek-Latn-1987-phonetic.imp +437 -0
- data/maps/un-ell-Grek-Latn-1987-tl.imp +27 -0
- data/maps/un-ell-Grek-Latn-1987-ts.imp +269 -0
- data/maps/un-guj-Gujr-Latn-1972.imp +196 -0
- data/maps/un-hin-Deva-Latn-2016.imp +356 -0
- data/maps/un-kan-Kana-Latn-2016.imp +214 -0
- data/maps/un-mal-Mlym-Latn-1972.imp +215 -0
- data/maps/un-mar-Deva-Latn-2016.imp +96 -0
- data/maps/un-mon-Mong-Latn-general-2013.imp +170 -0
- data/maps/un-mon-Mong-Latn-phonetic-2013.imp +170 -0
- data/maps/un-nep-Deva-Latn-1972.imp +295 -0
- data/maps/un-nep-Deva-Latn-2013.imp +62 -0
- data/maps/un-ori-Orya-Latn-1972.imp +208 -0
- data/maps/un-pan-Guru-Latn-1972.imp +321 -0
- data/maps/un-prs-Arab-Latn-1967.imp +214 -0
- data/maps/un-rus-Cyrl-Latn-1987.imp +96 -0
- data/maps/un-sin-Sinh-Latn-1972.imp +193 -0
- data/maps/un-tam-Taml-Latn-1972.imp +173 -0
- data/maps/un-tel-Telu-Latn-1972.imp +229 -0
- data/maps/un-ukr-Cyrl-Latn-1998.imp +58 -0
- data/maps/un-ukr-Cyrl-Latn-2012.imp +95 -0
- data/maps/un-urd-Arab-Latn-1972.imp +290 -0
- data/maps/var-amh-Ethi-Latn-eae-2003.imp +414 -0
- data/maps/var-gez-Ethi-Latn-eae-2003.imp +54 -0
- data/maps/var-hin-Deva-Latn-hunterian-1872.imp +212 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1886.imp +399 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1954.imp +382 -0
- data/maps/var-kor-Hang-Hang-jamo.imp +11196 -0
- data/maps/var-kor-Hang-Latn-mr-1939.imp +574 -0
- data/maps/var-kor-Kore-Hang-2013.imp +59764 -0
- data/maps/var-kor-Kore-Latn-mr-1939.imp +36 -0
- data/maps/var-mar-Deva-Latn-hunterian-1872.imp +39 -0
- data/maps/var-mon-Mong-Latn-1930.imp +101 -0
- data/maps/var-mon-Mong-Latn-lessing.imp +181 -0
- data/maps/var-mon-Mong-Latn-vpmc.imp +182 -0
- data/maps/var-pra-Deva-Latn-iast-1912.imp +36 -0
- data/maps/var-san-Deva-Latn-iast-1912.imp +147 -0
- data/maps/var-zho-Hani-Latn-wd-1979.imp +27549 -0
- metadata +335 -0
|
@@ -0,0 +1,327 @@
|
|
|
1
|
+
metadata {
|
|
2
|
+
authority_id: odni
|
|
3
|
+
id: 2011
|
|
4
|
+
language: iso-639-3:pus
|
|
5
|
+
source_script: Arab
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: ODNI Pashto Personal Names 2011 System
|
|
8
|
+
url: https://github.com/interscript/interscript-private-references/blob/master/odni/Pashto%20June%202011.pdf
|
|
9
|
+
creation_date: 2011
|
|
10
|
+
confirmation_date: 2011-06
|
|
11
|
+
description: |
|
|
12
|
+
Pashto is a language characterized by its variability. The
|
|
13
|
+
challenges of reaching a universally acceptable
|
|
14
|
+
transliteration standard for personal names are posed both
|
|
15
|
+
by the dialect spread trending roughly from the southwest
|
|
16
|
+
to the northeast parts of its geographic area, and also by
|
|
17
|
+
the competing influences of Dari and Urdu. Given the lack
|
|
18
|
+
of any dominant standard on some points, it has been
|
|
19
|
+
considered necessary to define a certain degree of
|
|
20
|
+
flexibility within this standardization system in order to
|
|
21
|
+
enable it to capture the variability of the language it
|
|
22
|
+
seeks to reflect. A great effort has also been made to
|
|
23
|
+
research and reflect common usage in the Pashto-speaking
|
|
24
|
+
areas of Pakistan and Afghanistan, and to define rules
|
|
25
|
+
which capture these trends to the best extent possible.
|
|
26
|
+
However, a respect for the norms of usage has also been
|
|
27
|
+
balanced with the need for consistency and intelligibility.
|
|
28
|
+
Therefore, there are cases where a less common spelling
|
|
29
|
+
will be the preferred usage under the guidance of this
|
|
30
|
+
system. Lastly, specific names that cannot be incorporated
|
|
31
|
+
gracefully into the rules described below are included with
|
|
32
|
+
case-by-case preferred spellings in a list near the end of
|
|
33
|
+
this document.
|
|
34
|
+
|
|
35
|
+
notes:
|
|
36
|
+
# Special rules: Consonants
|
|
37
|
+
- Pashto letter ge (ږ) The two common renderings for this
|
|
38
|
+
letter are 'zh' and 'g.' The preferred option will be
|
|
39
|
+
'zh' (consistent with the choice of southern 'sh' for ښ).
|
|
40
|
+
However, when referring to communities that consistently
|
|
41
|
+
render the name with a 'g' as opposed to a 'zh,' then 'g'
|
|
42
|
+
will be the preferred option. In these cases, the inclusion
|
|
43
|
+
of a variant spelling with 'zh' is strongly encouraged.
|
|
44
|
+
|
|
45
|
+
- Double consonants Double consonants represented by the
|
|
46
|
+
tashdid (shaddah) are shown in most cases regardless of
|
|
47
|
+
whether they are clearly enunciated in speech. Examples
|
|
48
|
+
Muhammad Hassan, Izzatullah. However, consonants
|
|
49
|
+
represented by digraphs are not doubled. Example Mubashir (
|
|
50
|
+
not Mubashshir). Special care should be taken when
|
|
51
|
+
possible to discriminate between doubled and
|
|
52
|
+
non-doubled letters in names that are otherwise
|
|
53
|
+
indistinguishable in their transliterated forms
|
|
54
|
+
Hasan (حسن) vs. Hassan (حسان)
|
|
55
|
+
|
|
56
|
+
- Digraphs No distinction is made between digraphs such as 'sh'
|
|
57
|
+
and single contiguous letters such as 's' followed by 'h.'
|
|
58
|
+
|
|
59
|
+
# Special rules: Vowels
|
|
60
|
+
- Short vowels zair and pesh The preferred options for the
|
|
61
|
+
short vowels represented by the zair and pesh will be 'i'
|
|
62
|
+
and 'u.' However, in cases where there is a mixed Dari and
|
|
63
|
+
Pashto environment, then the use of 'e' and 'o' is accepted
|
|
64
|
+
in consideration of Dari norms.
|
|
65
|
+
|
|
66
|
+
- Long/short vowels Long and short vowels are not
|
|
67
|
+
distinguished in the system (with the exception of
|
|
68
|
+
certain spellings driven by Dari influence as discussed
|
|
69
|
+
above). In this and other systems, the borrowed
|
|
70
|
+
Arabic name Salim could represent two distinct names, one
|
|
71
|
+
with a long /a/ (Saalim - سالم) and one with a
|
|
72
|
+
long /i/ (Saliim - سلیم). This is known as a collision.
|
|
73
|
+
This and many other prevailing standardization
|
|
74
|
+
systems do not distinguish between these types of
|
|
75
|
+
collisions. However, in cases like these, it is
|
|
76
|
+
recommended that a vigorous effort be made to include
|
|
77
|
+
variant spellings in order to eliminate ambiguity
|
|
78
|
+
as to which name is intended, as in the following examples
|
|
79
|
+
Hamid (var. Hameed) – حمید
|
|
80
|
+
Hamid (var. Hamed) – حامد
|
|
81
|
+
|
|
82
|
+
- Izafat The linking vowel of Persian origin known as the
|
|
83
|
+
izafat will be written with a hyphen and then 'e'
|
|
84
|
+
and then a following space. Example Koh-e Nur ("mountain
|
|
85
|
+
of light"). There will be no special
|
|
86
|
+
accommodation for when the initial word ends in a vowel.
|
|
87
|
+
|
|
88
|
+
# Special rules: Arabic
|
|
89
|
+
- The Arabic article al ( ال ) The Arabic article will be
|
|
90
|
+
written with a lowercase 'a' and followed by a hyphen, with
|
|
91
|
+
the obvious exception that an uppercase 'a' should be used
|
|
92
|
+
where required by English orthographic conventions, e.g.,
|
|
93
|
+
at the beginning of a sentence. Example Karim al-Afghani
|
|
94
|
+
|
|
95
|
+
- Genitive constructions Multi-part Arabic names that follow
|
|
96
|
+
the Arabic genitive construction will be written with a
|
|
97
|
+
lowercase ul joined to the last part of the name by a
|
|
98
|
+
hyphen. Arabic sun letter assimilation generally will not
|
|
99
|
+
be shown.
|
|
100
|
+
# Genitive construction exceptions
|
|
101
|
+
- In deference to widespread usage, the name Abd will be
|
|
102
|
+
combined with the genitive article ul,
|
|
103
|
+
and the rest of the name will be written separately (
|
|
104
|
+
specifically, one of the ninety-nine
|
|
105
|
+
"names of God"). Examples Abdul Haq, Abdul Rahman
|
|
106
|
+
- Names incorporating "--ullah" will be written as a single
|
|
107
|
+
unit. Examples Abdullah, Rahmatullah
|
|
108
|
+
- Names incorporating "--din" will be written as a single
|
|
109
|
+
unit with sun letter assimilation
|
|
110
|
+
shown, causing ul to change to ud. This type of name is the
|
|
111
|
+
only case in which sun letter assimilation will be shown.
|
|
112
|
+
Examples Jamaluddin, Shamsuddin
|
|
113
|
+
- Note, no effort will be made to force names into the
|
|
114
|
+
genitive construction if they are not
|
|
115
|
+
linked by the article. For example, both names Fazl ul-
|
|
116
|
+
Rahman and Fazl Rahman would be
|
|
117
|
+
acceptable, depending on whether the article was included
|
|
118
|
+
in the individual's name.
|
|
119
|
+
|
|
120
|
+
- Consonant clusters Traditional Arabic names ending in a
|
|
121
|
+
final consonant cluster will be spelled with the
|
|
122
|
+
consonant cluster intact. Although most native Pashto
|
|
123
|
+
speakers will break up the cluster in conversational
|
|
124
|
+
speech, general usage in the written transliteration of
|
|
125
|
+
names still favors the preservation of the consonant
|
|
126
|
+
cluster in print.
|
|
127
|
+
This type of name should not be confused with Arabic names whose orthography includes a zabar (short
|
|
128
|
+
'a' vowel) prior to the final consonant. -- NOT DONE
|
|
129
|
+
|
|
130
|
+
# Special rules: Multiple-part Pashto names
|
|
131
|
+
- TODO
|
|
132
|
+
|
|
133
|
+
# Special rules: Glides versus consonants
|
|
134
|
+
- The unwritten phonetic "glides," also known as semi-
|
|
135
|
+
consonants (sounding similar to /y/ and /w/), will
|
|
136
|
+
generally not be shown between two vowels.
|
|
137
|
+
Examples Rauf, Said (سعيد)
|
|
138
|
+
|
|
139
|
+
- Care should be taken to distinguish the above rule from
|
|
140
|
+
cases in which wao or ya are a written part of the name and
|
|
141
|
+
function as true consonants, including cases where they are
|
|
142
|
+
doubled. Examples Fayiz ( فایز ), Fayyaz ( فیّاض )
|
|
143
|
+
|
|
144
|
+
- A common form where ya will be shown in its role as a
|
|
145
|
+
consonant is with the Arabic nisba (suffix showing origin,
|
|
146
|
+
relation, etc.) appended to names that end in a vowel.
|
|
147
|
+
Examples Ziayi, Shafiyi, Mirzayi, Paktiayi
|
|
148
|
+
|
|
149
|
+
# Specific rules: Exceptions
|
|
150
|
+
- TODO
|
|
151
|
+
In spite of best intentions, the unbending application of
|
|
152
|
+
rules in any transliteration system is likely to produce
|
|
153
|
+
some forms that fly in the face of accepted use. Therefore,
|
|
154
|
+
the following names will be spelled as follows, in spite of
|
|
155
|
+
minor variance with the rules described above.
|
|
156
|
+
Aurangzeb (not Awrangzeb)
|
|
157
|
+
Eid (not Id)
|
|
158
|
+
Faizad (not Faizzad)
|
|
159
|
+
Javed (not Jawed)
|
|
160
|
+
Parvez (not Parwez)
|
|
161
|
+
Qureshi (not Quraishi)
|
|
162
|
+
Saad (not Sad)
|
|
163
|
+
Sherpao (not Sherpaw)
|
|
164
|
+
|
|
165
|
+
- The following names do not constitute exceptions to the
|
|
166
|
+
rules of this standard, but they are names that pose
|
|
167
|
+
significant challenges to standardization and are therefore
|
|
168
|
+
listed here to ensure consensus
|
|
169
|
+
Bahadur (not Bahadar, Bahader)
|
|
170
|
+
Feroz (not Firoz, Fairuz, etc.)
|
|
171
|
+
Firdaws (not Firdos)
|
|
172
|
+
Husain (not Hussain)
|
|
173
|
+
Isfandyar (not Asfandyar)
|
|
174
|
+
Ismail (not Ismael)
|
|
175
|
+
Khushhal (not Khushal)
|
|
176
|
+
Niamat (not Nimat)
|
|
177
|
+
Numan (not Nauman)
|
|
178
|
+
Raza (not Reza)
|
|
179
|
+
Sherzad (not Shirzad)
|
|
180
|
+
Tor Jan (not Tur Jan)
|
|
181
|
+
Uwais (not Awais)
|
|
182
|
+
|
|
183
|
+
# Special rules: Titles
|
|
184
|
+
- We treat the spelling of commonly used titles differently
|
|
185
|
+
from the handling of names, given that titles are subject
|
|
186
|
+
to norms of English as they are accepted into the English
|
|
187
|
+
language. Though not specifically covered by the scope of
|
|
188
|
+
this transliteration standard, the following spellings are
|
|
189
|
+
recommended for the sake of consistency
|
|
190
|
+
Akhund
|
|
191
|
+
Amir
|
|
192
|
+
Commander (not Commandan)
|
|
193
|
+
Hafiz
|
|
194
|
+
Haji
|
|
195
|
+
Mawlana
|
|
196
|
+
Mawlawi
|
|
197
|
+
Mullah
|
|
198
|
+
Qari
|
|
199
|
+
Qazi
|
|
200
|
+
Sahib
|
|
201
|
+
Sheikh
|
|
202
|
+
Syed ( سیّد )
|
|
203
|
+
Ustad
|
|
204
|
+
}
|
|
205
|
+
|
|
206
|
+
tests {
|
|
207
|
+
test "حَسّان", "Hassan"
|
|
208
|
+
test "حَسَن", "Hasan"
|
|
209
|
+
test "صَفّار", "Saffar"
|
|
210
|
+
test "صَفَر", "Safar"
|
|
211
|
+
# collision
|
|
212
|
+
test "حَمِيد", "Hamid"
|
|
213
|
+
# collision
|
|
214
|
+
test "حامِد", "Hamid"
|
|
215
|
+
test "كَرِيم الأَفغَانِي", "Karim al-Afghani"
|
|
216
|
+
test "عَبداللَّه", "Abdullah"
|
|
217
|
+
test "جَمَال الدين", "Jamaluddin"
|
|
218
|
+
test "شَمسُ الدين", "Shamsuddin"
|
|
219
|
+
test "فَيَّاض", "Fayyaz"
|
|
220
|
+
test "فايِز", "Fayiz"
|
|
221
|
+
test "ا", "A"
|
|
222
|
+
test "رَؤوف", "Rauf"
|
|
223
|
+
test "سَعِيد", "Said"
|
|
224
|
+
test "قَيُّوم", "Qayyum"
|
|
225
|
+
}
|
|
226
|
+
|
|
227
|
+
stage {
|
|
228
|
+
# CHARACTERS
|
|
229
|
+
parallel {
|
|
230
|
+
|
|
231
|
+
sub "\u0650", "i" # ِ kasra
|
|
232
|
+
sub "\u064f", "u" # ُ damma
|
|
233
|
+
|
|
234
|
+
sub "\u0650" + boundary, "-e" # ِ kasra
|
|
235
|
+
|
|
236
|
+
sub "\u0652", "" # ْ sokoon
|
|
237
|
+
sub "\u0659", "ê"
|
|
238
|
+
|
|
239
|
+
# Sun letters
|
|
240
|
+
sub maybe("\u064f") + maybe(space) + "\u0627\u0644\u062f" + any("\u064a\u0649") + "\u0646", "uddin" # الدين
|
|
241
|
+
|
|
242
|
+
sub "\u0626", "êy" # ئ
|
|
243
|
+
|
|
244
|
+
sub "\u0628", "b" # ب
|
|
245
|
+
sub "\u067E", "p" # پ
|
|
246
|
+
sub any("\u062a\u067C\u0637"), "t" # ت/ټ/ط
|
|
247
|
+
sub "\u062c", "j" # ج
|
|
248
|
+
sub "\u0686", "ch" # چ
|
|
249
|
+
sub "\u0681", "dz" # ځ
|
|
250
|
+
sub "\u0685", "ts" # څ
|
|
251
|
+
sub any("\u062d\u0647"), "h" # ح/ه
|
|
252
|
+
sub "\u062e", "kh" # خ
|
|
253
|
+
sub any("\u062f\u0689"), "d" # د/ډ
|
|
254
|
+
sub any("\u0631\u0693"), "r" # ر/ړ
|
|
255
|
+
sub any("\u0630\u0632\u0636\u0638"), "z" # ذ/ز/ض/ظ
|
|
256
|
+
sub any("\u0696\u0698"), "zh" # ژ/ږ
|
|
257
|
+
sub any("\u062B\u0633\u0635"), "s" # س/ث/ص
|
|
258
|
+
sub any("\u0634\u069A"), "sh" # ښ/ش
|
|
259
|
+
sub any("\u0621\u0639"), "" # ع/ء
|
|
260
|
+
sub "\u063a", "gh" # غ
|
|
261
|
+
sub "\u0641", "f" # ف
|
|
262
|
+
sub "\u0642", "q" # ق
|
|
263
|
+
sub "\u0643", "k" # ك
|
|
264
|
+
sub "\u06A9", "k" # ک
|
|
265
|
+
sub any("\u06AF\u06AB"), "g" # گ/ګ
|
|
266
|
+
|
|
267
|
+
sub "\u0644", "l" # ل
|
|
268
|
+
sub "\u0645", "m" # م
|
|
269
|
+
sub any("\u0646\u06BC"), "n" # ن/ڼ
|
|
270
|
+
sub "\u0648", "w" # و
|
|
271
|
+
sub "\u064a", "y" # ي
|
|
272
|
+
sub "\u0649", "y" # ي
|
|
273
|
+
|
|
274
|
+
sub "\u064e" + maybe("\u0627"), "a" # َ fatha
|
|
275
|
+
sub "\u0650", any("ie")
|
|
276
|
+
sub "\u064f", any("uo") # ُ damma
|
|
277
|
+
sub "\u0622", "a" # آ
|
|
278
|
+
sub "\u0627", "a" # ا
|
|
279
|
+
sub "\u0648", "o" # و
|
|
280
|
+
sub "\u064e\u0648\u0652", "aw" # ـَوْ
|
|
281
|
+
sub "\u064f\u0648", "u" # ـُو
|
|
282
|
+
sub "\u064e\u064a", "ai" # ـي
|
|
283
|
+
sub "\u0650" + any("\u064a\u0649"), "i"
|
|
284
|
+
sub "\u06D0", "e" # ې
|
|
285
|
+
sub "\u06CD", "ey" # ۍ
|
|
286
|
+
sub "\u06CC", "a" # ی
|
|
287
|
+
sub "\u064e\u06CC" + any("\u0647\u0627"), "aya" # َيا / َيه
|
|
288
|
+
sub "\u0650\u06CC" + any("\u0647\u0627"), "ia" # ِيا /ِيه
|
|
289
|
+
sub "\u0652\u06CC\u0627", "ya" # ْيا
|
|
290
|
+
sub any("\u06D0\u06D2") + boundary, "ey" # ے / ې
|
|
291
|
+
sub "\u0648\u064A" + boundary, "oy" # وي
|
|
292
|
+
sub "\u064f\u0648\u064A" + boundary, "uy" # ُوي
|
|
293
|
+
sub "\u0623", "" # أ
|
|
294
|
+
|
|
295
|
+
# Double consonants
|
|
296
|
+
sub "\u0628\u0651", "bb" # ب
|
|
297
|
+
sub "\u067E\u0651", "pp" # پ
|
|
298
|
+
sub any("\u062a\u067C\u0637") + "\u0651", "tt" # ت/ټ/ط
|
|
299
|
+
sub "\u062c\u0651", "jj" # ج
|
|
300
|
+
sub any("\u062d\u0647") + "\u0651", "hh" # ح/ه
|
|
301
|
+
sub any("\u062f\u0689") + "\u0651", "dd" # د/ډ
|
|
302
|
+
sub any("\u0631\u0693") + "\u0651", "rr" # ر/ړ
|
|
303
|
+
sub any("\u0630\u0632\u0636\u0638") + "\u0651", "zz" # ذ/ز/ض/ظ
|
|
304
|
+
sub any("\u062B\u0633\u0635") + "\u0651", "ss" # س/ث/ص
|
|
305
|
+
sub "\u0641\u0651", "ff" # ف
|
|
306
|
+
sub "\u0642\u0651", "qq" # ق
|
|
307
|
+
sub "\u0643\u0651", "kk" # ك
|
|
308
|
+
sub "\u06A9\u0651", "kk" # ک
|
|
309
|
+
sub any("\u06AF\u06AB") + "\u0651", "gg" # گ/ګ
|
|
310
|
+
sub "\u0644\u0651", "ll" # ل
|
|
311
|
+
sub "\u0645\u0651", "mm" # م
|
|
312
|
+
sub any("\u0646\u06BC") + "\u0651", "nn" # ن/ڼ
|
|
313
|
+
sub "\u0648\u0651", "ww" # و
|
|
314
|
+
sub "\u064a\u0651", "yy" # ي
|
|
315
|
+
sub "\u0649\u0651", "yy" # ي
|
|
316
|
+
|
|
317
|
+
sub boundary + "\u0627\u0644", "al-", before: space # ال
|
|
318
|
+
sub maybe(space) + "\u0627\u0644\u0644\u0651\u064e\u0647", "ullah"
|
|
319
|
+
|
|
320
|
+
sub "\u0624\u0648", "u"
|
|
321
|
+
}
|
|
322
|
+
|
|
323
|
+
# POSTRULES
|
|
324
|
+
sub any("\u0061".."\uFFFF"), upcase, before: boundary, not_before: boundary + any("‘’'")
|
|
325
|
+
# don't capitalize the definite article in the middle of a sentence
|
|
326
|
+
sub " Al-", " al-" # الن
|
|
327
|
+
}
|
|
@@ -0,0 +1,79 @@
|
|
|
1
|
+
metadata {
|
|
2
|
+
authority_id: odni
|
|
3
|
+
id: 2015
|
|
4
|
+
language: iso-639-2:rus
|
|
5
|
+
source_script: Cyrl
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: Office of the Director Of National Intelligence Russian Personal Names 2015, ICS-630-01 Annex K
|
|
8
|
+
|
|
9
|
+
# url:
|
|
10
|
+
source: ICS-630-01 Annex K
|
|
11
|
+
creation_date: 2015
|
|
12
|
+
confirmation_date: 2015
|
|
13
|
+
description: |
|
|
14
|
+
This system, adapted from the Board of Geographic Names (BGN) Romanization system for Russian
|
|
15
|
+
(1947), is the Intelligence Community (IC) standard for the transliteration of Russian names that will be
|
|
16
|
+
applied to all final written reports and products for IC consumers. It is not intended to eliminate variations
|
|
17
|
+
of a name that can contribute forensic information. Rather, it is to provide an IC standard Romanized
|
|
18
|
+
(English) transliteration from Russian that can then be linked to forensic information in ways that will
|
|
19
|
+
help identify the referent of the name.
|
|
20
|
+
|
|
21
|
+
In cases where an individual’s name has already been transliterated in a variant spelling, the IC Standard
|
|
22
|
+
spelling should appear first, followed by the variant spelling(s) in parentheses at the first usage. E.g.,
|
|
23
|
+
Sergey Nikolayevich Tyurin (Serguei Nicolaivitch Tiourine). In addition, if the original Cyrillic spelling
|
|
24
|
+
is known, that spelling should also appear in parentheses following the name, if possible, following best
|
|
25
|
+
practices of the issuing organization and taking into consideration information system capabilities. This
|
|
26
|
+
convention is designed to ensure that vital forensic information is not lost.
|
|
27
|
+
|
|
28
|
+
For non-Russian names, use the relevant IC transliteration standard for names from that language. A
|
|
29
|
+
translator’s note may be used to clarify the known origin of the person. Spell names of individuals from
|
|
30
|
+
languages that are written in Roman letters as they are spelled in those languages (e.g., George Clooney,
|
|
31
|
+
Jorge Garcia, Georges Pompidou).
|
|
32
|
+
|
|
33
|
+
In the case of active senior government officials in the on-line CIA World Factbook and the on-line
|
|
34
|
+
directory of Chiefs of State and Cabinet Members of Foreign Governments, the spellings given in these
|
|
35
|
+
on-line reference works should be used in place of the IC Standard. For any individual who has at one
|
|
36
|
+
time been listed in the Factbook or Chiefs of State directory but who no longer appears in those resources
|
|
37
|
+
(i.e. is no longer a government official), the IC Standard spelling should appear first, with the spelling, if
|
|
38
|
+
known, as it previously appeared in those resources listed within parentheses at the first usage.
|
|
39
|
+
|
|
40
|
+
The primary goal is to produce a consistent Romanized transcription of names that is specifically readable
|
|
41
|
+
to the English-speaking non-specialist. The system uses the 26 letters of the standard (English) Roman
|
|
42
|
+
alphabet. Some ambiguities in the Romanized form will occur without the use of diacritics. However,
|
|
43
|
+
within the context of a report, where additional information about the individual is provided, the referent
|
|
44
|
+
will be clearly identified. This system will be used in conjunction with on-line tools, name dictionaries,
|
|
45
|
+
and lists containing conventional spellings of names of well-known individuals.
|
|
46
|
+
|
|
47
|
+
notes:
|
|
48
|
+
}
|
|
49
|
+
|
|
50
|
+
tests {
|
|
51
|
+
test "Ирина Ивановна Никитина", "Irina Ivanovna Nikitina"
|
|
52
|
+
test "Николай Римский-Корсаков", "Nikolay Rimskiy-Korsakov"
|
|
53
|
+
test "Михаил Тимофеевич Калашников", "Mikhail Timofeyevich Kalashnikov"
|
|
54
|
+
test "Корж Василий Захарович", "Korzh Vasiliy Zakharovich"
|
|
55
|
+
test "Циолковский Константин Эдуардович", "Tsiolkovskiy Konstantin Eduardovich"
|
|
56
|
+
test "Лобачевский Николай Иванович", "Lobachevskiy Nikolay Ivanovich"
|
|
57
|
+
test "Пушкин Александр Сергеевич", "Pushkin Aleksandr Sergeyevich"
|
|
58
|
+
test "Гоголь Николай Васильевич", "Gogol Nikolay Vasilyevich"
|
|
59
|
+
test "Ломоносов Михаил Васильевич", "Lomonosov Mikhail Vasilyevich"
|
|
60
|
+
}
|
|
61
|
+
|
|
62
|
+
dependency "bgnpcgn-rus-Cyrl-Latn-1947", as: cyrllatn
|
|
63
|
+
|
|
64
|
+
|
|
65
|
+
stage {
|
|
66
|
+
# CHARACTERS
|
|
67
|
+
#parallel {
|
|
68
|
+
# sub "\u042a", "" # Ъ
|
|
69
|
+
# sub "\u042c", "" # Ь
|
|
70
|
+
|
|
71
|
+
|
|
72
|
+
# sub "\u044a", "" # ъ
|
|
73
|
+
# sub "\u044c", "" # ь
|
|
74
|
+
#}
|
|
75
|
+
|
|
76
|
+
run map.cyrllatn.stage.main
|
|
77
|
+
|
|
78
|
+
sub "’", none # remove every ’ left in the output; presumably emitted for ь/ъ by the dependency stage — TODO confirm
|
|
79
|
+
}
|
|
@@ -0,0 +1,35 @@
|
|
|
1
|
+
metadata {
|
|
2
|
+
authority_id: odni
|
|
3
|
+
id: 2005
|
|
4
|
+
language: iso-639-2:srp
|
|
5
|
+
source_script: Cyrl
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: Office of the Director Of National Intelligence Serbian Personal Names 2004 System
|
|
8
|
+
creation_date: 2005
|
|
9
|
+
confirmation_date: 2005
|
|
10
|
+
description: |
|
|
11
|
+
Office of the Director Of National Intelligence Serbian Personal Names 2004 System
|
|
12
|
+
|
|
13
|
+
notes:
|
|
14
|
+
}
|
|
15
|
+
|
|
16
|
+
tests {
|
|
17
|
+
test "Гојко Митић", "Gojko Mitic"
|
|
18
|
+
test "Горња Ваганица", "Gornja Vaganica"
|
|
19
|
+
test "Довиђења", "Dovidjenja"
|
|
20
|
+
test "Ћао! Здраво!", "Cao! Zdravo!"
|
|
21
|
+
test "Кључ", "Kljuc"
|
|
22
|
+
test "Цигарете", "Cigarete"
|
|
23
|
+
test "Пролеће", "Prolece"
|
|
24
|
+
test "Понедељак", "Ponedeljak"
|
|
25
|
+
test "Шљива", "Sljiva" # covers Ш → S and љ → lj; replaces a duplicate of the "Горња Ваганица" case above
|
|
26
|
+
}
|
|
27
|
+
|
|
28
|
+
dependency "odni-srp-Cyrl-Latn-2015", as: cyrllatn
|
|
29
|
+
|
|
30
|
+
stage {
|
|
31
|
+
|
|
32
|
+
run map.cyrllatn.stage.main
|
|
33
|
+
|
|
34
|
+
}
|
|
35
|
+
|
|
@@ -0,0 +1,130 @@
|
|
|
1
|
+
metadata {
|
|
2
|
+
authority_id: odni
|
|
3
|
+
id: 2015
|
|
4
|
+
language: iso-639-2:srp
|
|
5
|
+
source_script: Cyrl
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: Office of the Director Of National Intelligence Serbian Personal Names 2015, ICS-630-01 Annex L
|
|
8
|
+
|
|
9
|
+
# url:
|
|
10
|
+
source: ICS-630-01 Annex L
|
|
11
|
+
creation_date: 2015
|
|
12
|
+
confirmation_date: 2015
|
|
13
|
+
description: |
|
|
14
|
+
This system is the Intelligence Community (IC) standard for the transliteration of Serbian names
|
|
15
|
+
written in Cyrillic that will be applied to all final written reports and products for IC consumers. It
|
|
16
|
+
is not intended to eliminate variations of a name that can contribute forensic information. Rather,
|
|
17
|
+
it is to provide an IC standard Romanized (English) transliteration from Serbian that can then be
|
|
18
|
+
linked to forensic information in ways that will help identify the referent of the name.
|
|
19
|
+
|
|
20
|
+
In cases where an individual’s name has already been transliterated in a variant spelling, the IC
|
|
21
|
+
Standard spelling should appear first, followed by the variant spelling(s) in parentheses at the first
|
|
22
|
+
usage. In addition, if the original Cyrillic spelling is known, that spelling should also appear in
|
|
23
|
+
parentheses following the name, if possible, following best practices of the issuing organization
|
|
24
|
+
and taking into consideration information system capabilities. This convention is designed to
|
|
25
|
+
ensure that vital forensic information is not lost.
|
|
26
|
+
|
|
27
|
+
For names of persons who are known to not be part of the Serbian-speaking community, use the
|
|
28
|
+
relevant IC transliteration standard for names from that language (e.g., Mikhail, Yitzhak). A
|
|
29
|
+
translator’s note may be used to clarify the known origin of the person. Spell names of
|
|
30
|
+
individuals from languages that are written in Roman letters as they are spelled in those
|
|
31
|
+
languages (e.g., George Clooney, Jorge Garcia, Georges Pompidou).
|
|
32
|
+
|
|
33
|
+
In the case of active senior government officials in the on-line CIA World Factbook and the on-line directory of Chiefs of State and Cabinet Members of Foreign Governments, the spellings
|
|
34
|
+
given in these on-line reference works should be used in place of the IC Standard. For any
|
|
35
|
+
individual who has at one time been listed in the Factbook or Chiefs of State directory but who no
|
|
36
|
+
longer appears in those resources (i.e. is no longer a government official), the IC Standard
|
|
37
|
+
spelling should appear first, with the spelling, if known, as it previously appeared in those
|
|
38
|
+
resources listed within parentheses at the first usage.
|
|
39
|
+
|
|
40
|
+
The primary goal is to produce a consistent Romanized transcription of names that is specifically
|
|
41
|
+
readable to the English-speaking non-specialist. The system uses the 26 letters of the standard
|
|
42
|
+
(English) Roman alphabet. Some ambiguities in the Romanized form will occur without the use
|
|
43
|
+
of diacritics. However, within the context of a report, where additional information about the
|
|
44
|
+
individual is provided, the referent will be clearly identified. This system will be used in
|
|
45
|
+
conjunction with on-line tools, name dictionaries, and lists containing conventional spellings of
|
|
46
|
+
names of well-known individuals.
|
|
47
|
+
|
|
48
|
+
notes:
|
|
49
|
+
}
|
|
50
|
+
|
|
51
|
+
tests {
|
|
52
|
+
test "Гојко Митић", "Gojko Mitic"
|
|
53
|
+
test "Горња Ваганица", "Gornja Vaganica"
|
|
54
|
+
test "Довиђења", "Dovidjenja"
|
|
55
|
+
test "Ћао! Здраво!", "Cao! Zdravo!"
|
|
56
|
+
test "Кључ", "Kljuc"
|
|
57
|
+
test "Цигарете", "Cigarete"
|
|
58
|
+
test "Пролеће", "Prolece"
|
|
59
|
+
test "Понедељак", "Ponedeljak"
|
|
60
|
+
}
|
|
61
|
+
|
|
62
|
+
stage {
|
|
63
|
+
|
|
64
|
+
# CHARACTERS
|
|
65
|
+
parallel {
|
|
66
|
+
sub "\u0410", "A" # А
|
|
67
|
+
sub "\u0411", "B" # Б
|
|
68
|
+
sub "\u0412", "V" # В
|
|
69
|
+
sub "\u0413", "G" # Г
|
|
70
|
+
sub "\u0414", "D" # Д
|
|
71
|
+
sub "\u0402", "Dj" # Ђ
|
|
72
|
+
sub "\u0415", "E" # Е
|
|
73
|
+
sub "\u0416", "Z" # Ж
|
|
74
|
+
sub "\u0417", "Z" # З
|
|
75
|
+
sub "\u0418", "I" # И
|
|
76
|
+
sub "\u0408", "J" # Ј
|
|
77
|
+
sub "\u041A", "K" # К
|
|
78
|
+
sub "\u041B", "L" # Л
|
|
79
|
+
sub "\u0409", "Lj" # Љ
|
|
80
|
+
sub "\u041C", "M" # М
|
|
81
|
+
sub "\u041D", "N" # Н
|
|
82
|
+
sub "\u040A", "Nj" # Њ
|
|
83
|
+
sub "\u041E", "O" # О
|
|
84
|
+
sub "\u041F", "P" # П
|
|
85
|
+
sub "\u0420", "R" # Р
|
|
86
|
+
sub "\u0421", "S" # С
|
|
87
|
+
sub "\u0422", "T" # Т
|
|
88
|
+
sub "\u040B", "C" # Ћ
|
|
89
|
+
sub "\u0423", "U" # У
|
|
90
|
+
sub "\u0424", "F" # Ф
|
|
91
|
+
sub "\u0425", "H" # Х
|
|
92
|
+
sub "\u0426", "C" # Ц
|
|
93
|
+
sub "\u0427", "C" # Ч
|
|
94
|
+
sub "\u040F", "Dz" # Џ
|
|
95
|
+
sub "\u0428", "S" # Ш
|
|
96
|
+
|
|
97
|
+
sub "\u0430", "a" # а
|
|
98
|
+
sub "\u0431", "b" # б
|
|
99
|
+
sub "\u0432", "v" # в
|
|
100
|
+
sub "\u0433", "g" # г
|
|
101
|
+
sub "\u0434", "d" # д
|
|
102
|
+
sub "\u0452", "dj" # ђ
|
|
103
|
+
sub "\u0435", "e" # е
|
|
104
|
+
sub "\u0436", "z" # ж
|
|
105
|
+
sub "\u0437", "z" # з
|
|
106
|
+
sub "\u0438", "i" # и
|
|
107
|
+
sub "\u0458", "j" # ј
|
|
108
|
+
sub "\u043A", "k" # к
|
|
109
|
+
sub "\u043B", "l" # л
|
|
110
|
+
sub "\u0459", "lj" # љ
|
|
111
|
+
sub "\u043C", "m" # м
|
|
112
|
+
sub "\u043D", "n" # н
|
|
113
|
+
sub "\u045A", "nj" # њ
|
|
114
|
+
sub "\u043E", "o" # о
|
|
115
|
+
sub "\u043F", "p" # п
|
|
116
|
+
sub "\u0440", "r" # р
|
|
117
|
+
sub "\u0441", "s" # с
|
|
118
|
+
sub "\u0442", "t" # т
|
|
119
|
+
sub "\u045B", "c" # ћ
|
|
120
|
+
sub "\u0443", "u" # у
|
|
121
|
+
sub "\u0444", "f" # ф
|
|
122
|
+
sub "\u0445", "h" # х
|
|
123
|
+
sub "\u0446", "c" # ц
|
|
124
|
+
sub "\u0447", "c" # ч
|
|
125
|
+
sub "\u045F", "dz" # џ
|
|
126
|
+
sub "\u0448", "s" # ш
|
|
127
|
+
}
|
|
128
|
+
|
|
129
|
+
}
|
|
130
|
+
|