interscript 0.1.6 → 0.1.7
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/lib/interscript.rb +10 -6
- data/lib/interscript/fs.rb +0 -2
- data/lib/interscript/mapping.rb +1 -1
- data/lib/interscript/opal.rb +38 -8
- data/lib/interscript/opal/entrypoint.rb +12 -0
- data/lib/interscript/opal/map_translate.rb +7 -0
- data/lib/interscript/version.rb +1 -1
- data/maps/acadsin-zho-Hani-Latn-2002.yaml +5 -1
- data/maps/alalc-amh-Ethi-Latn-1997.yaml +5 -1
- data/maps/alalc-amh-Ethi-Latn-2011.yaml +1 -1
- data/maps/alalc-ara-Arab-Latn-1997.yaml +5 -1
- data/maps/alalc-asm-Deva-Latn-1997.yaml +9 -3
- data/maps/alalc-asm-Deva-Latn-2012.yaml +40 -0
- data/maps/alalc-aze-Cyrl-Latn-1997.yaml +5 -1
- data/maps/alalc-bel-Cyrl-Latn-1997.yaml +5 -1
- data/maps/alalc-ben-Beng-Latn-2017.yaml +1 -1
- data/maps/alalc-bul-Cyrl-Latn-1997.yaml +5 -1
- data/maps/alalc-ell-Grek-Latn-1997.yaml +5 -1
- data/maps/alalc-ell-Grek-Latn-2010.yaml +1 -2
- data/maps/alalc-guj-Gujr-Latn-1997.yaml +266 -0
- data/maps/alalc-guj-Gujr-Latn-2011.yaml +64 -0
- data/maps/alalc-hin-Deva-Latn-1997.yaml +211 -0
- data/maps/alalc-hin-Deva-Latn-2011.yaml +47 -0
- data/maps/alalc-kat-Geok-Latn-1997.yaml +1 -1
- data/maps/alalc-kat-Geor-Latn-1997.yaml +5 -1
- data/maps/alalc-kor-Hang-Latn-1997.yaml +5 -1
- data/maps/alalc-mal-Mlym-Latn-1997.yaml +303 -0
- data/maps/alalc-mal-Mlym-Latn-2012.yaml +73 -0
- data/maps/alalc-mar-Deva-Latn-1997.yaml +21 -2
- data/maps/alalc-mar-Deva-Latn-2011.yaml +45 -0
- data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +1 -1
- data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +1 -1
- data/maps/alalc-mon-Cyrl-Latn-1997.yaml +220 -0
- data/maps/{alalc-pan-Deva-Latn-1997.yaml → alalc-pan-Guru-Latn-1997.yaml} +23 -4
- data/maps/alalc-pan-Guru-Latn-2011.yaml +78 -0
- data/maps/alalc-per-Arab-Latn-1997.yaml +375 -0
- data/maps/alalc-pli-Deva-Latn-2012.yaml +144 -0
- data/maps/alalc-pra-Deva-Latn-2012.yaml +47 -0
- data/maps/alalc-rus-Cyrl-Latn-1997.yaml +5 -1
- data/maps/alalc-rus-Cyrl-Latn-2012.yaml +1 -1
- data/maps/alalc-san-Deva-Latn-2012.yaml +172 -0
- data/maps/alalc-sin-Sinh-Latn-1997.yaml +292 -0
- data/maps/alalc-sin-Sinh-Latn-2011.yaml +71 -0
- data/maps/alalc-srp-Cyrl-Latn-1997.yaml +5 -1
- data/maps/alalc-srp-Cyrl-Latn-2013.yaml +1 -1
- data/maps/alalc-tam-Taml-Latn-1997.yaml +62 -0
- data/maps/alalc-tam-Taml-Latn-2011.yaml +58 -0
- data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +5 -1
- data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +1 -1
- data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +1 -1
- data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +1 -1
- data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +1 -1
- data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +1 -1
- data/maps/bgn-kor-Hang-Latn-1943.yaml +7 -3
- data/maps/bgn-kor-Kore-Latn-1943.yaml +3 -3
- data/maps/bgna-bul-Cyrl-Latn-2006.yaml +1 -1
- data/maps/bgna-bul-Cyrl-Latn-2009.yaml +1 -1
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +5 -1
- data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +5 -1
- data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +1 -1
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +2 -2
- data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +6 -2
- data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +5 -1
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +5 -1
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +5 -1
- data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +184 -0
- data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +5 -1
- data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +5 -1
- data/maps/{bgnpcgn-per-Arab-Latn-1956.yaml → bgnpcgn-fas-Arab-Latn-1956.yaml} +5 -1
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +1 -1
- data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +5 -1
- data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +1 -1
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +1 -1
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +1 -1
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +1 -1
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +5 -1
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +1 -1
- data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +223 -0
- data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +31 -1
- data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +336 -0
- data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +639 -0
- data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +459 -0
- data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +168 -0
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +5 -1
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +5 -1
- data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +220 -0
- data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +240 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +5 -1
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +3 -92
- data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +127 -0
- data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +82 -0
- data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +1 -1
- data/maps/bis-asm-Beng-Latn-13194-1991.yaml +1 -1
- data/maps/bis-ben-Beng-Latn-13194-1991.yaml +1 -1
- data/maps/bis-dev-Deva-Latn-13194-1991.yaml +1 -1
- data/maps/{bis-gjr-Gujr-Latn-13194-1991.yaml → bis-guj-Gujr-Latn-13194-1991.yaml} +17 -2
- data/maps/bis-knd-Knda-Latn-13194-1991.yaml +1 -1
- data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +1 -1
- data/maps/bis-ori-Orya-Latn-13194-1991.yaml +1 -1
- data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +1 -1
- data/maps/bis-tel-Telu-Latn-13194-1991.yaml +1 -1
- data/maps/bis-tml-Taml-Latn-13194-1991.yaml +1 -1
- data/maps/by-bel-Cyrl-Latn-1998.yaml +5 -1
- data/maps/by-bel-Cyrl-Latn-2007.yaml +1 -1
- data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +899 -0
- data/maps/din-hin-Deva-Latn-33904-2018.yaml +100 -0
- data/maps/din-kat-Geor-Latn-32707-2010.yaml +145 -0
- data/maps/din-mar-Deva-Latn-33904-2018.yaml +84 -0
- data/maps/din-nep-Deva-Latn-33904-2018.yaml +119 -0
- data/maps/din-pli-Deva-Latn-33904-2018.yaml +75 -0
- data/maps/din-pra-Deva-Latn-33904-2018.yaml +63 -0
- data/maps/din-san-Deva-Latn-33904-2018.yaml +338 -0
- data/maps/din-tam-Taml-Latn-33903-2016.yaml +213 -0
- data/maps/dos-nep-Deva-Latn-1997.yaml +15 -1
- data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +3 -3
- data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +2 -2
- data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +2 -2
- data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +2 -2
- data/maps/ggg-kat-Geor-Latn-2002.yaml +5 -1
- data/maps/gki-bel-Cyrl-Latn-1992.yaml +1 -1
- data/maps/gki-bel-Cyrl-Latn-2000.yaml +1 -1
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +7 -3
- data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +157 -0
- data/maps/hk-yue-Hani-Latn-1888.yaml +1 -1
- data/maps/icao-bel-Cyrl-Latn-9303.yaml +1 -1
- data/maps/icao-bul-Cyrl-Latn-9303.yaml +1 -1
- data/maps/{icao-per-Arab-Latn-9303.yaml → icao-fas-Arab-Latn-9303.yaml} +1 -1
- data/maps/icao-heb-Hebr-Latn-9303.yaml +1 -1
- data/maps/icao-mkd-Cyrl-Latn-9303.yaml +1 -1
- data/maps/icao-rus-Cyrl-Latn-9303.yaml +1 -1
- data/maps/icao-srp-Cyrl-Latn-9303.yaml +1 -1
- data/maps/icao-ukr-Cyrl-Latn-9303.yaml +1 -1
- data/maps/iso-ara-Arab-Latn-233-1984.yaml +1 -1
- data/maps/iso-asm-Beng-Latn-15919-2001.yaml +75 -0
- data/maps/iso-ben-Beng-Latn-15919-2001.yaml +175 -0
- data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +8 -4
- data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +8 -4
- data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +220 -0
- data/maps/iso-hin-Deva-Latn-15919-2001.yaml +87 -0
- data/maps/iso-inc-Deva-Latn-15919-2001.yaml +61 -0
- data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +10 -6
- data/maps/iso-kan-Knda-Latn-15919-2001.yaml +220 -0
- data/maps/iso-kat-Geor-Latn-9984-1996.yaml +145 -0
- data/maps/iso-kor-Hang-Latn-1996-method1.yaml +240 -0
- data/maps/iso-kor-Hang-Latn-1996-method2.yaml +226 -0
- data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +281 -0
- data/maps/iso-mar-Deva-Latn-15919-2001.yaml +75 -0
- data/maps/iso-nep-Deva-Latn-15919-2001.yaml +87 -0
- data/maps/iso-ori-Orya-Latn-15919-2001.yaml +193 -0
- data/maps/iso-pan-Guru-Latn-15919-2001.yaml +222 -0
- data/maps/iso-pli-Beng-Latn-15919-2001.yaml +73 -0
- data/maps/iso-pli-Deva-Latn-15919-2001.yaml +74 -0
- data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +219 -0
- data/maps/iso-pli-Thai-Latn-15919-2001.yaml +55 -0
- data/maps/iso-pra-Deva-Latn-15919-2001.yaml +59 -0
- data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +366 -0
- data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +3 -3
- data/maps/iso-san-Deva-Latn-15919-2001.yaml +220 -0
- data/maps/iso-tam-Taml-Latn-15919-2001.yaml +159 -0
- data/maps/iso-tel-Telu-Latn-15919-2001.yaml +220 -0
- data/maps/iso-tha-Thai-Latn-11940-1998.yaml +1 -1
- data/maps/kp-kor-Hang-Latn-2002.yaml +25 -17
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +1 -1
- data/maps/mext-jpn-Hrkt-Latn-1954.yaml +1 -1
- data/maps/mns-mon-Cyrl-Latn-5217-2012.yaml +163 -0
- data/maps/mns-mon-Latn-Cyrl-5217-2012.yaml +200 -0
- data/maps/moct-kor-Hang-Latn-2000.yaml +6 -2
- data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +1 -1
- data/maps/mvd-bel-Cyrl-Latn-2008.yaml +2 -2
- data/maps/mvd-bel-Cyrl-Latn-2010.yaml +3 -3
- data/maps/mvd-rus-Cyrl-Latn-2008.yaml +2 -2
- data/maps/mvd-rus-Cyrl-Latn-2010.yaml +2 -2
- data/maps/odni-ara-Arab-Latn-2015.yaml +425 -0
- data/maps/odni-aze-Cyrl-Latn-2015.yaml +1 -1
- data/maps/odni-bel-Cyrl-Latn-2015.yaml +1 -1
- data/maps/odni-bul-Cyrl-Latn-2015.yaml +2 -2
- data/maps/odni-che-Cyrl-Latn-2015.yaml +169 -0
- data/maps/odni-fas-Arab-Latn-2015.yaml +406 -0
- data/maps/odni-hin-Deva-Latn-2015.yaml +1 -1
- data/maps/odni-kat-Geor-Latn-2015.yaml +1 -1
- data/maps/odni-kaz-Cyrl-Latn-2015.yaml +1 -1
- data/maps/odni-kir-Cyrl-Latn-2015.yaml +1 -1
- data/maps/odni-kor-Hang-Latn-2015.yaml +375 -0
- data/maps/odni-mkd-Cyrl-Latn-2015.yaml +1 -1
- data/maps/odni-per-Arab-Latn-2015.yaml +228 -0
- data/maps/odni-rus-Cyrl-Latn-2015.yaml +1 -1
- data/maps/odni-srp-Cyrl-Latn-2015.yaml +1 -1
- data/maps/odni-tat-Cyrl-Latn-2015.yaml +1 -1
- data/maps/odni-tgk-Cyrl-Latn-2015.yaml +1 -1
- data/maps/odni-uig-Cyrl-Latn-2015.yaml +1 -1
- data/maps/odni-ukr-Cyrl-Latn-2015.yaml +1 -1
- data/maps/odni-urd-Arab-Latn-2015.yaml +1 -1
- data/maps/odni-uzb-Cyrl-Latn-2015.yaml +1 -1
- data/maps/royin-tha-Thai-Latn-1939-generic.yaml +1 -1
- data/maps/royin-tha-Thai-Latn-1968.yaml +5 -1
- data/maps/royin-tha-Thai-Latn-1999-chained.yaml +1 -1
- data/maps/royin-tha-Thai-Latn-1999.yaml +5 -1
- data/maps/sac-zho-Hans-Latn-1979.yaml +5 -1
- data/maps/sasm-mon-Mong-Latn-general-1978.yaml +389 -0
- data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +354 -0
- data/maps/ses-ara-Arab-Latn-1930.yaml +5 -1
- data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +1 -1
- data/maps/ua-ukr-Cyrl-Latn-1996.yaml +6 -2
- data/maps/ua-ukr-Cyrl-Latn-2007.yaml +75 -0
- data/maps/ua-ukr-Cyrl-Latn-2010.yaml +192 -0
- data/maps/{ungegn-amh-Ethi-Latn-2016.yaml → un-amh-Ethi-Latn-2016.yaml} +51 -24
- data/maps/un-ara-Arab-Latn-1971.yaml +1 -1
- data/maps/un-ara-Arab-Latn-1972.yaml +1 -1
- data/maps/un-ara-Arab-Latn-2017.yaml +1 -1
- data/maps/un-bel-Cyrl-Latn-2007.yaml +1 -1
- data/maps/un-ben-Beng-Latn-2016.yaml +1 -1
- data/maps/{un-ell-Grek-Latn-phonetic-1987.yaml → un-ell-Grek-Latn-1987-phonetic.yaml} +2 -2
- data/maps/un-ell-Grek-Latn-1987-tl.yaml +2 -2
- data/maps/un-ell-Grek-Latn-1987-ts.yaml +3 -3
- data/maps/un-hin-Deva-Latn-2016.yaml +222 -0
- data/maps/un-mar-Deva-Latn-2016.yaml +91 -0
- data/maps/un-mon-Mong-Latn-general-2013.yaml +264 -0
- data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +264 -0
- data/maps/un-nep-Deva-Latn-1972.yaml +204 -17
- data/maps/un-nep-Deva-Latn-2013.yaml +74 -0
- data/maps/un-rus-Cyrl-Latn-1987.yaml +1 -1
- data/maps/un-ukr-Cyrl-Latn-1998.yaml +35 -12
- data/maps/un-ukr-Cyrl-Latn-2012.yaml +162 -0
- data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +221 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +1 -1
- data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +1 -1
- data/maps/{nil-kor-Hang-Hang-jamo.yaml → var-kor-Hang-Hang-jamo.yaml} +1 -1
- data/maps/var-kor-Hang-Latn-mr-1939.yaml +2 -2
- data/maps/var-kor-Kore-Hang-2013.yaml +1 -1
- data/maps/var-kor-Kore-Latn-mr-1939.yaml +1 -1
- data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +43 -0
- data/maps/var-mon-Mong-Latn-1930.yaml +102 -0
- data/maps/var-mon-Mong-Latn-lessing.yaml +272 -0
- data/maps/var-mon-Mong-Latn-vpmc.yaml +274 -0
- data/maps/var-pra-Deva-Latn-iast-1912.yaml +30 -0
- data/maps/var-san-Deva-Latn-iast-1912.yaml +149 -0
- data/maps/var-tha-Thai-Thai-phonemic.yaml +1 -1
- data/maps/var-tha-Thai-Zsym-ipa.yaml +1 -1
- data/maps/{var-zho-Hani-Latn-1979.yaml → var-zho-Hani-Latn-wd-1979.yaml} +6 -2
- data/spec/interscript/filenames_spec.rb +384 -0
- data/spec/interscript_spec.rb +7 -4
- metadata +105 -26
- data/bin/interscript +0 -41
- data/bin/rspec +0 -29
- data/bin/setup +0 -8
- data/lib/__pycache__/g2pwrapper.cpython-38.pyc +0 -0
- data/lib/interscript-opal.rb +0 -2
- data/lib/interscript/opal_map_translate.rb +0 -12
- data/maps/alalc-hin-Deva-Latn-2020.yaml +0 -159
- data/maps/un-mon-Mong-Latn-2013.yaml +0 -99
|
@@ -0,0 +1,71 @@
|
|
|
1
|
+
---
|
|
2
|
+
authority_id: alalc
|
|
3
|
+
id: 2011
|
|
4
|
+
language: iso-639-2:sin
|
|
5
|
+
source_script: Sinh
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: Sinhalese Romanization, 2011
|
|
8
|
+
alias:
|
|
9
|
+
ogc11122:
|
|
10
|
+
code: sin_Sinh2Latn_ALA_2011
|
|
11
|
+
description: Sinhalese ALA-Library of Congress 2011 System
|
|
12
|
+
url: https://www.loc.gov/catdir/cpso/romanization/sinhales.pdf
|
|
13
|
+
creation_date: 2011
|
|
14
|
+
description: |
|
|
15
|
+
ALA-LC Romanization table for Sinhalese
|
|
16
|
+
|
|
17
|
+
|
|
18
|
+
notes:
|
|
19
|
+
|
|
20
|
+
- Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
|
|
21
|
+
vowels following a consonant can be found in grammars; no distinction between the two is
|
|
22
|
+
made in transliteration.
|
|
23
|
+
|
|
24
|
+
- |
|
|
25
|
+
The vowel a is implicit after all consonants and consonant clusters and is supplied in
|
|
26
|
+
transliteration, with the following exceptions:
|
|
27
|
+
|
|
28
|
+
a) when another vowel is indicated by its appropriate sign; and
|
|
29
|
+
b) when the absence of any vowel is indicated by the sign ් called virāma.
|
|
30
|
+
|
|
31
|
+
- |
|
|
32
|
+
Exceptions: Anusvāra is transliterated by:
|
|
33
|
+
|
|
34
|
+
a) ṅ before gutturals,
|
|
35
|
+
b) ñ before palatals,
|
|
36
|
+
c) ṇ before cerebrals,
|
|
37
|
+
d) n before dentals, and
|
|
38
|
+
e) m before labials.
|
|
39
|
+
|
|
40
|
+
- |
|
|
41
|
+
Exceptions:
|
|
42
|
+
a) when saññaka represents a nasal, it is romanized according to the rule for anusvāra.
|
|
43
|
+
b) when saññaka is combined with an aspirated consonant, the combination is romanized as a non-aspirated, followed by an aspirated consonant.
|
|
44
|
+
|
|
45
|
+
|
|
46
|
+
tests:
|
|
47
|
+
- source: "හිටපු අග්රාමාත්ය රනිල් වික්රමසිංහ අප්රේල් 21 ප්රහාරය සම්බන්ධයෙන් විමර්ශනය කරන ජනාධිපති පරීක්ෂණ කොමිසම හමුවේ දෙවෙනි දිනටත් සාක්ෂි ලබාදීමට පැමිණෙයි"
|
|
48
|
+
expected: "hiṭapu agrāmātya ranil vikramasiṃha aprēl 21 prahāraya sambanandhayen vimarśanaya karana janādhipati parīkṣaṇa komisama hamuvē deveni dinaṭat sākṣi labādīmaṭa pămiṇeyi"
|
|
49
|
+
- source: "පෑලියගොඩ මත්ස්ය තොග වෙළෙදපොළට පිවිසෙන පිවිසුම් මාර්ගය පුළුල් කර සංවර්ධනයට පියවර - මහාමාර්ග අමාත්ය ජොන්ස්ටන් ප්රනාන්දු"
|
|
50
|
+
expected: "pâliyagoḍa matsya toga veḷedapoḷaṭa pivisena pivisum māraṅgaya puḷul kara saṃvarandhanayaṭa piyavara - mahāmāraṅga amātya jonsaṇṭan pranānandu"
|
|
51
|
+
- source: "මව්බිමටත් රට වැසියන්ටත් ආශිර්වාද කරමින් විශේෂ ආගමික වැඩසටහන් මාලාවක්"
|
|
52
|
+
expected: "mavbimaṭat raṭa văsiyanaṇṭat āśirvāda karamin viśēṣa āgamika văḍasaṭahan mālāvak"
|
|
53
|
+
- source: "මිනුවන්ගොඩ කොරෝනා පොකුරින් තවත් ආසාදිතයින් 49 දෙනකු හඳුනා ගෙන"
|
|
54
|
+
expected: "minuvanaṅgoḍa korōnā pokurin tavat āsāditayin 49 denaku handunā gena"
|
|
55
|
+
- source: "ඉරණවිල වෙරළේ නාඳුනන ධීවර යාත්රා දෙකක්"
|
|
56
|
+
expected: "iraṇavila veraḷē nāndunana dhīvara yātarā dekak"
|
|
57
|
+
- source: "මඩකලපුව මංගලාරාමේ හාමුදුරුවන්ට මරණ තර්ජන - ආරක්ෂාවත් අඩුකරලා"
|
|
58
|
+
expected: "maḍakalapuva maṃgalārāmē hāmuduruvanaṇṭa maraṇa tarañjana - ārakṣāvat aḍukaralā"
|
|
59
|
+
- source: "හොරට කහ කුඩු හැදූ දෙදෙනෙක් බඩුත් එක්ක දැලේ"
|
|
60
|
+
expected: "horaṭa kaha kuḍu hădū dedenek baḍut ekaṅka dălē"
|
|
61
|
+
- source: "ඉංගිරියේ ජලභීතිකාව වැළඳුනු නරියෙකු තෙදිනක මෙහෙයුමකින් අල්ලා ගනී"
|
|
62
|
+
expected: "iṃgiriyē jalabhītikāva văḷandunu nariyeku tedinaka meheyumakin allā ganī"
|
|
63
|
+
- source: "බෞද්ධ දර්ශනයට අනුව අපි උපයන ධනය බුද්ධිමත් ලෙස විසර්ජනය කරන්නේ කෙසේ ද?"
|
|
64
|
+
expected: "baudandha darśanayaṭa anuva api upayana dhanaya budandhimat lesa visarañjanaya karanannē kesē da?"
|
|
65
|
+
- source: "ඉන්දීය ජාතිකයන් සමග එක්වන මන්නාරමේ ධීවරයන්ට අනතුරු අගවයි"
|
|
66
|
+
expected: "inandīya jātikayan samaga ekvana manannāramē dhīvarayanaṇṭa anaturu agavayi"
|
|
67
|
+
- source: "තේ නැවත වගාවට පෙර පස පුනරුත්ථාපනයට කෙටි මග"
|
|
68
|
+
expected: "tē năvata vagāvaṭa pera pasa punarutanthāpanayaṭa keṭi maga"
|
|
69
|
+
|
|
70
|
+
map:
|
|
71
|
+
inherit: 'alalc-sin-Sinh-Latn-1997'
|
|
@@ -1,10 +1,14 @@
|
|
|
1
1
|
---
|
|
2
2
|
authority_id: alalc
|
|
3
3
|
id: 1997
|
|
4
|
-
language: srp
|
|
4
|
+
language: iso-639-2:srp
|
|
5
5
|
source_script: Cyrl
|
|
6
6
|
destination_script: Latn
|
|
7
7
|
name: Serbian and Macedonian Romanization, ALA-LC 1997 System
|
|
8
|
+
alias:
|
|
9
|
+
ogc11122:
|
|
10
|
+
code: srp_Cyrl2Latn_ALA_1997
|
|
11
|
+
description: Serbian and Macedonian ALA-Library of Congress 1997 System
|
|
8
12
|
url: http://catdir.loc.gov/catdir/cpso/romanization/serbian.pdf
|
|
9
13
|
creation_date: 1997
|
|
10
14
|
description: ALA-LC Romanization table for Serbian and Macedonian.
|
|
@@ -0,0 +1,62 @@
|
|
|
1
|
+
---
|
|
2
|
+
authority_id: alalc
|
|
3
|
+
id: 1997
|
|
4
|
+
language: iso-639-2:tam
|
|
5
|
+
source_script: Taml
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: Tamil Romanization, 1997
|
|
8
|
+
alias:
|
|
9
|
+
ogc11122:
|
|
10
|
+
code: tam_Taml2Latn_ALA_1997
|
|
11
|
+
description: Tamil ALA-Library of Congress 1997 System
|
|
12
|
+
url: http://catdir.loc.gov/catdir/cpso/romanization/tamil.pdf
|
|
13
|
+
creation_date: 1997
|
|
14
|
+
description: |
|
|
15
|
+
ALA-LC Romanization table for Tamil
|
|
16
|
+
|
|
17
|
+
notes:
|
|
18
|
+
|
|
19
|
+
- Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
|
|
20
|
+
vowels following a consonant can be found in grammars; no distinction between the two is
|
|
21
|
+
made in transliteration.
|
|
22
|
+
|
|
23
|
+
- |
|
|
24
|
+
The vowel a is implicit after all consonants and consonant clusters and is supplied in
|
|
25
|
+
transliteration, with the following exceptions:
|
|
26
|
+
|
|
27
|
+
a) when another vowel is indicated by its appropriate sign; and
|
|
28
|
+
b) when the absence of any vowel is indicated by the superscript dot ( ் ) called puḷḷi.
|
|
29
|
+
|
|
30
|
+
- This letter has the same form as the vowel sign for ā appearing after a consonant. Where ambiguity arises, it is written.
|
|
31
|
+
|
|
32
|
+
tests:
|
|
33
|
+
- source: "அழிந்து போன நகரத்தில் , தொலைந்து போன நான்"
|
|
34
|
+
expected: "aḻintu pōṉa nakarattil , tolaintu pōṉa nāṉ"
|
|
35
|
+
- source: "முதன் முதலாக - மை ஃபர்ஸ்ட் சோலோ ட்ராவல்"
|
|
36
|
+
expected: "mutaṉ mutalāka - mai ḵaparsṭ cōlō ṭrāval"
|
|
37
|
+
- source: "வாழ்க்கையில் அவன் போன முதல் சோலோ டிரிப் அது தான்."
|
|
38
|
+
expected: "vāḻkkaiyil avaṉ pōṉa mutal cōlō ṭirip atu tāṉ."
|
|
39
|
+
- source: "ஸ்கூல் ப்ரெண்ட் கார்த்திக் வீட்டுக்கு போய்ட்டு"
|
|
40
|
+
expected: "skūl preṇṭ kārttik vīṭṭukku pōyṭṭu"
|
|
41
|
+
- source: "நாசா வெளியிட்ட வெடிக்கும் நட்சத்திரத்தின் வீடியோ"
|
|
42
|
+
expected: "nācā veḷiyiṭṭa veṭikkum naṭcattirattiṉ vīṭiyō"
|
|
43
|
+
- source: "நாசா வெளியிட்ட வெடிக்கும் நட்சத்திரத்தின் வீடியோ"
|
|
44
|
+
expected: "nācā veḷiyiṭṭa veṭikkum naṭcattirattiṉ vīṭiyō"
|
|
45
|
+
- source: "டார்பிடோவை ஏவ உதவும் சூப்பர்சானிக் ஏவுகணையான ஸ்மார்ட் சோதனை வெற்றி"
|
|
46
|
+
expected: "ṭārpiṭōvai ēva utavum cūpparcāṉik ēvukaṇaiyāṉa smārṭ cōtaṉai veṟṟi"
|
|
47
|
+
- source: "இந்த ஆண்டு மருத்துவத்துக்கான நோபல் பரிசு பெறுபவர்களின் பெயர்கள் அறிவிப்பு"
|
|
48
|
+
expected: "inta āṇṭu maruttuvattukkāṉa nōpal paricu peṟupavarkaḷiṉ peyarkaḷ aṟivippu"
|
|
49
|
+
- source: "மல்லையா விவகாரம்: பிரிட்டன் அரசின் நடவடிக்கைகள் தங்களுக்கு தெரியவில்லை - மத்திய அரசு தகவல்"
|
|
50
|
+
expected: "mallaiyā vivakāram: piriṭṭaṉ araciṉ naṭavaṭikkaikaḷ taṅkaḷukku teriyavillai - mattiya aracu takaval"
|
|
51
|
+
- source: "ஆலோசனைக்குப் பிறகு தேனியில் இருந்து சென்னை புறப்பட்டார் துணை முதலமைச்சர் பன்னீர்செல்வம்"
|
|
52
|
+
expected: "ālōcaṉaikkup piṟaku tēṉiyil iruntu ceṉṉai puṟappaṭṭār tuṇai mutalamaiccar paṉṉīrcelvam"
|
|
53
|
+
- source: "இன்று தான் பேரன் பிறந்தநாள் முடிந்து ஃப்ரீ ஆகி இருக்கிறேன்"
|
|
54
|
+
expected: "iṉṟu tāṉ pēraṉ piṟantanāḷ muṭintu ḵaprī āki irukkiṟēṉ"
|
|
55
|
+
|
|
56
|
+
map:
|
|
57
|
+
|
|
58
|
+
inherit: 'din-tam-Taml-Latn-33903-2016'
|
|
59
|
+
|
|
60
|
+
characters:
|
|
61
|
+
|
|
62
|
+
'ஃ': 'ḵa'
|
|
@@ -0,0 +1,58 @@
|
|
|
1
|
+
---
|
|
2
|
+
authority_id: alalc
|
|
3
|
+
id: 2011
|
|
4
|
+
language: iso-639-2:tam
|
|
5
|
+
source_script: Taml
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: Tamil Romanization, 2011
|
|
8
|
+
alias:
|
|
9
|
+
ogc11122:
|
|
10
|
+
code: tam_Taml2Latn_ALA_2011
|
|
11
|
+
description: Tamil ALA-Library of Congress 2011 System
|
|
12
|
+
url: https://www.loc.gov/catdir/cpso/romanization/tamil.pdf
|
|
13
|
+
creation_date: 2011
|
|
14
|
+
description: |
|
|
15
|
+
ALA-LC Romanization table for Tamil
|
|
16
|
+
|
|
17
|
+
notes:
|
|
18
|
+
|
|
19
|
+
- Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
|
|
20
|
+
vowels following a consonant can be found in grammars; no distinction between the two is
|
|
21
|
+
made in transliteration.
|
|
22
|
+
|
|
23
|
+
- |
|
|
24
|
+
The vowel a is implicit after all consonants and consonant clusters and is supplied in
|
|
25
|
+
transliteration, with the following exceptions:
|
|
26
|
+
|
|
27
|
+
a) when another vowel is indicated by its appropriate sign; and
|
|
28
|
+
b) when the absence of any vowel is indicated by the superscript dot ( ் ) called puḷḷi.
|
|
29
|
+
|
|
30
|
+
- This letter has the same form as the vowel sign for ā appearing after a consonant. Where ambiguity arises, it is written.
|
|
31
|
+
|
|
32
|
+
tests:
|
|
33
|
+
- source: "மலையாள நடிகர் சங்கத்திலிருந்து நடிகை பார்வதி திடீர் விலகல்."
|
|
34
|
+
expected: "malaiyāḷa naṭikar caṅkattiliruntu naṭikai pārvati tiṭīr vilakal."
|
|
35
|
+
- source: "சச்சின் டெண்டுல்கரை அலுவலக உதவியாளராக நியமிப்பீர்களா?"
|
|
36
|
+
expected: "cacciṉ ṭeṇṭulkarai aluvalaka utaviyāḷarāka niyamippīrkaḷā?"
|
|
37
|
+
- source: "அமீரகத்தில் தொலைநோக்கி இல்லாமல் நாளை பார்க்கலாம்"
|
|
38
|
+
expected: "amīrakattil tolainōkki illāmal nāḷai pārkkalām"
|
|
39
|
+
- source: "லடாக் யூனியன் பிரதேசம் இந்தியா சட்டவிரோதமாக நிறுவிய ஒரு பகுதி- சீனா மீண்டும் பிடிவாதம்"
|
|
40
|
+
expected: "laṭāk yūṉiyaṉ piratēcam intiyā caṭṭavirōtamāka niṟuviya oru pakuti- cīṉā mīṇṭum piṭivātam"
|
|
41
|
+
- source: "பாலியல் குற்றங்களில் ஈடுபடுவோருக்கு மரண தண்டனை புதிய சட்டம்"
|
|
42
|
+
expected: "pāliyal kuṟṟaṅkaḷil īṭupaṭuvōrukku maraṇa taṇṭaṉai putiya caṭṭam"
|
|
43
|
+
- source: "புதுடெல்லி"
|
|
44
|
+
expected: "putuṭelli"
|
|
45
|
+
- source: "அப்படி விளம்பரத்தில என்ன இருக்கு...?"
|
|
46
|
+
expected: "appaṭi viḷamparattila eṉṉa irukku...?"
|
|
47
|
+
- source: "பூமிக்கும், செவ்வாய் கிரகத்துக்கும் இடையிலான அதிகபட்ச தூரம் ௪௦ கோடியே ௧௩ லட்சம் கி.மீ தொலைவு ஆகும்."
|
|
48
|
+
expected: "pūmikkum, cevvāy kirakattukkum iṭaiyilāṉa atikapaṭca tūram 40 kōṭiyē 13 laṭcam ki.mī tolaivu ākum."
|
|
49
|
+
- source: "அமீரகத்தில் செவ்வாய் கிரகம் குறித்த ஆய்வில் ஈடுபடுவோர் மற்றும் வானியல் நிபுணர்களுக்கு இது ஒரு நல்ல வாய்ப்பாக அமையும்."
|
|
50
|
+
expected: "amīrakattil cevvāy kirakam kuṟitta āyvil īṭupaṭuvōr maṟṟum vāṉiyal nipuṇarkaḷukku itu oru nalla vāyppāka amaiyum."
|
|
51
|
+
- source: "நள்ளிரவு நேரமாக இருந்தால் நமது தலைக்கு மேலே காணலாம். காலை நேரத்தில் மேற்கு மற்றும் தென்மேற்கு திசையில் செவ்வாய் கிரகத்தை பார்க்கலாம்."
|
|
52
|
+
expected: "naḷḷiravu nēramāka iruntāl namatu talaikku mēlē kāṇalām. kālai nērattil mēṟku maṟṟum teṉmēṟku ticaiyil cevvāy kirakattai pārkkalām."
|
|
53
|
+
- source: "வெறும் கண்ணால் பார்க்கும்போது புள்ளியாக ஆரஞ்சு நிறத்தில் பிரகாசமாக தெரியும்."
|
|
54
|
+
expected: "veṟum kaṇṇāl pārkkumpōtu puḷḷiyāka ārañcu niṟattil pirakācamāka teriyum."
|
|
55
|
+
|
|
56
|
+
map:
|
|
57
|
+
|
|
58
|
+
inherit: 'alalc-tam-Taml-Latn-1997'
|
|
@@ -1,10 +1,14 @@
|
|
|
1
1
|
---
|
|
2
2
|
authority_id: alalc
|
|
3
3
|
id: 1997
|
|
4
|
-
language: ukr
|
|
4
|
+
language: iso-639-2:ukr
|
|
5
5
|
source_script: Cyrl
|
|
6
6
|
destination_script: Latn
|
|
7
7
|
name: ALA-LC Romanization System 1997
|
|
8
|
+
alias:
|
|
9
|
+
ogc11122:
|
|
10
|
+
code: ukr_Cyrl2Latn_ALA_1997
|
|
11
|
+
description: Ukrainian ALA-Library of Congress 1997 System
|
|
8
12
|
url: http://catdir.loc.gov/catdir/cpso/romanization/ukrainia.pdf
|
|
9
13
|
creation_date: 1997
|
|
10
14
|
description: |
|
|
@@ -1,10 +1,14 @@
|
|
|
1
1
|
---
|
|
2
2
|
authority_id: bgn
|
|
3
3
|
id: 1943
|
|
4
|
-
language: kor
|
|
4
|
+
language: iso-639-2:kor
|
|
5
5
|
source_script: Hang
|
|
6
6
|
destination_script: Latn
|
|
7
7
|
name: BGN Agreement -- Korean McCune-Reischauer System (1943)
|
|
8
|
+
alias:
|
|
9
|
+
ogc11122:
|
|
10
|
+
code: kor_Hang2Latn_MR_1939
|
|
11
|
+
description: Korean McCune-Reischauer System, 1943 US Board on Geographic Names (BGN) Agreement
|
|
8
12
|
url:
|
|
9
13
|
creation_date: 1943
|
|
10
14
|
adoption_date:
|
|
@@ -13,8 +17,8 @@ description:
|
|
|
13
17
|
notes:
|
|
14
18
|
|
|
15
19
|
tests:
|
|
16
|
-
- source:
|
|
17
|
-
expected: "
|
|
20
|
+
- source: 서울
|
|
21
|
+
expected: "Sŏul"
|
|
18
22
|
- source: 평양
|
|
19
23
|
expected: "P’yŏngyang"
|
|
20
24
|
- source: 부산
|
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
---
|
|
2
2
|
authority_id: bgn
|
|
3
3
|
id: 1943
|
|
4
|
-
language: kor
|
|
4
|
+
language: iso-639-2:kor
|
|
5
5
|
source_script: Kore
|
|
6
6
|
destination_script: Latn
|
|
7
7
|
name: BGN Agreement -- Korean McCune-Reischauer System (1943)
|
|
@@ -13,8 +13,8 @@ description:
|
|
|
13
13
|
notes:
|
|
14
14
|
|
|
15
15
|
tests:
|
|
16
|
-
- source:
|
|
17
|
-
expected: "
|
|
16
|
+
- source: 서울
|
|
17
|
+
expected: "Sŏul"
|
|
18
18
|
- source: 平壤
|
|
19
19
|
expected: "P’yŏngyang"
|
|
20
20
|
- source: 釜山
|
|
@@ -1,10 +1,14 @@
|
|
|
1
1
|
---
|
|
2
2
|
authority_id: bgnpcgn
|
|
3
3
|
id: 1967
|
|
4
|
-
language: amh
|
|
4
|
+
language: iso-639-2:amh
|
|
5
5
|
source_script: Ethi
|
|
6
6
|
destination_script: Latn
|
|
7
7
|
name: BGN/PCGN Romanization System -- Amharic (1967)
|
|
8
|
+
alias:
|
|
9
|
+
ogc11122:
|
|
10
|
+
code: amh_Ethi2Latn_BGN_1967
|
|
11
|
+
description: Amharic US Board on Geographic Names (BGN)/Permanent Committee on Geographical Names for British Official Use (PCGN) 1967 System
|
|
8
12
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/693663/ROMANIZATION_OF_AMHARIC.pdf
|
|
9
13
|
creation_date: 1967
|
|
10
14
|
description: |
|
|
@@ -1,10 +1,14 @@
|
|
|
1
1
|
---
|
|
2
2
|
authority_id: bgnpcgn
|
|
3
3
|
id: 1956
|
|
4
|
-
language: ara
|
|
4
|
+
language: iso-639-2:ara
|
|
5
5
|
source_script: Arab
|
|
6
6
|
destination_script: Latn
|
|
7
7
|
name: ROMANIZATION OF ARABIC -- BGN/PCGN 1956 System
|
|
8
|
+
alias:
|
|
9
|
+
ogc11122:
|
|
10
|
+
code: ara_Arab2Latn_BGN_1956
|
|
11
|
+
description: Arabic US Board on Geographic Names(BGN)/Permanent Committee on Geographical Names for British Official Use(PCGN) 1956 System
|
|
8
12
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/858000/ROMANIZATION_OF_ARABIC.pdf
|
|
9
13
|
creation_date: 1956
|
|
10
14
|
confirmation date: 2019-12
|
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
---
|
|
2
2
|
authority_id: bgnpcgn
|
|
3
3
|
id: 1993
|
|
4
|
-
language: aze
|
|
4
|
+
language: iso-639-2:aze
|
|
5
5
|
source_script: Cyrl
|
|
6
6
|
destination_script: Latn
|
|
7
7
|
name: AZERBAIJANI TABLE OF CORRESPONDENCES CYRILLIC-ROMAN -- BGN/PCGN 1993 Agreement
|
|
@@ -56,7 +56,7 @@ map:
|
|
|
56
56
|
'\u041C' : 'M'
|
|
57
57
|
'\u041D' : 'N'
|
|
58
58
|
'\u041E' : 'O'
|
|
59
|
-
'\u04E8' : '
|
|
59
|
+
'\u04E8' : 'Ö'
|
|
60
60
|
'\u041F' : 'P'
|
|
61
61
|
'\u0420' : 'R'
|
|
62
62
|
'\u0421' : 'S'
|
|
@@ -1,10 +1,14 @@
|
|
|
1
1
|
---
|
|
2
2
|
authority_id: bgnpcgn
|
|
3
3
|
id: 2007
|
|
4
|
-
language: rus
|
|
4
|
+
language: iso-639-2:bak
|
|
5
5
|
source_script: Cyrl
|
|
6
6
|
destination_script: Latn
|
|
7
7
|
name: BASHKIR TABLE OF CORRESPONDENCES CYRILLIC-ROMAN BGN/PCGN 2007 Agreement
|
|
8
|
+
alias:
|
|
9
|
+
ogc11122:
|
|
10
|
+
code: bak_Cyrl2Latn_BGN_2007
|
|
11
|
+
description: Bashkir 2007 BGN/PCGN Cyrillic-Latin Table of Correspondences
|
|
8
12
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/829203/TABLE_OF_CORRESPONDENCES__FOR_BASHKIR.pdf
|
|
9
13
|
creation_date: 2007
|
|
10
14
|
confirmation_date: 2019
|
|
@@ -117,7 +121,7 @@ map:
|
|
|
117
121
|
'\u041D': 'N' # Н
|
|
118
122
|
'\u04A2': 'Ñ' # Ң
|
|
119
123
|
'\u041E': 'O' # О
|
|
120
|
-
'\u04E8': "
|
|
124
|
+
'\u04E8': "Ö" # Ө
|
|
121
125
|
'\u041F': 'P' # П
|
|
122
126
|
'\u0420': 'R' # Р
|
|
123
127
|
'\u0421': 'S' # С
|
|
@@ -1,10 +1,14 @@
|
|
|
1
1
|
---
|
|
2
2
|
authority_id: bgnpcgn
|
|
3
3
|
id: 1979
|
|
4
|
-
language: bel
|
|
4
|
+
language: iso-639-2:bel
|
|
5
5
|
source_script: Cyrl
|
|
6
6
|
destination_script: Latn
|
|
7
7
|
name: United States Board on Geographic Names Foreign Names Committee Staff, 1994. Romanization Systems and Roman-Script Spelling Conventions, p. 23.
|
|
8
|
+
alias:
|
|
9
|
+
ogc11122:
|
|
10
|
+
code: bel_Cyrl2Latn_BGN_1979
|
|
11
|
+
description: Byelorussian US Board on Geographic Names(BGN)/Permanent Committee on Geographical Names for British Official Use(PCGN) 1979 System
|
|
8
12
|
url: https://assets.publishing.service.gov.uk/government/uploads/system/uploads/attachment_data/file/811510/ROMANIZATION_OF_BELARUSIAN.pdf
|
|
9
13
|
creation_date: 1979
|
|
10
14
|
description: |
|