interscript 0.1.6 → 0.1.7
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/lib/interscript.rb +10 -6
- data/lib/interscript/fs.rb +0 -2
- data/lib/interscript/mapping.rb +1 -1
- data/lib/interscript/opal.rb +38 -8
- data/lib/interscript/opal/entrypoint.rb +12 -0
- data/lib/interscript/opal/map_translate.rb +7 -0
- data/lib/interscript/version.rb +1 -1
- data/maps/acadsin-zho-Hani-Latn-2002.yaml +5 -1
- data/maps/alalc-amh-Ethi-Latn-1997.yaml +5 -1
- data/maps/alalc-amh-Ethi-Latn-2011.yaml +1 -1
- data/maps/alalc-ara-Arab-Latn-1997.yaml +5 -1
- data/maps/alalc-asm-Deva-Latn-1997.yaml +9 -3
- data/maps/alalc-asm-Deva-Latn-2012.yaml +40 -0
- data/maps/alalc-aze-Cyrl-Latn-1997.yaml +5 -1
- data/maps/alalc-bel-Cyrl-Latn-1997.yaml +5 -1
- data/maps/alalc-ben-Beng-Latn-2017.yaml +1 -1
- data/maps/alalc-bul-Cyrl-Latn-1997.yaml +5 -1
- data/maps/alalc-ell-Grek-Latn-1997.yaml +5 -1
- data/maps/alalc-ell-Grek-Latn-2010.yaml +1 -2
- data/maps/alalc-guj-Gujr-Latn-1997.yaml +266 -0
- data/maps/alalc-guj-Gujr-Latn-2011.yaml +64 -0
- data/maps/alalc-hin-Deva-Latn-1997.yaml +211 -0
- data/maps/alalc-hin-Deva-Latn-2011.yaml +47 -0
- data/maps/alalc-kat-Geok-Latn-1997.yaml +1 -1
- data/maps/alalc-kat-Geor-Latn-1997.yaml +5 -1
- data/maps/alalc-kor-Hang-Latn-1997.yaml +5 -1
- data/maps/alalc-mal-Mlym-Latn-1997.yaml +303 -0
- data/maps/alalc-mal-Mlym-Latn-2012.yaml +73 -0
- data/maps/alalc-mar-Deva-Latn-1997.yaml +21 -2
- data/maps/alalc-mar-Deva-Latn-2011.yaml +45 -0
- data/maps/alalc-mkd-Cyrl-Latn-1997.yaml +1 -1
- data/maps/alalc-mkd-Cyrl-Latn-2013.yaml +1 -1
- data/maps/alalc-mon-Cyrl-Latn-1997.yaml +220 -0
- data/maps/{alalc-pan-Deva-Latn-1997.yaml → alalc-pan-Guru-Latn-1997.yaml} +23 -4
- data/maps/alalc-pan-Guru-Latn-2011.yaml +78 -0
- data/maps/alalc-per-Arab-Latn-1997.yaml +375 -0
- data/maps/alalc-pli-Deva-Latn-2012.yaml +144 -0
- data/maps/alalc-pra-Deva-Latn-2012.yaml +47 -0
- data/maps/alalc-rus-Cyrl-Latn-1997.yaml +5 -1
- data/maps/alalc-rus-Cyrl-Latn-2012.yaml +1 -1
- data/maps/alalc-san-Deva-Latn-2012.yaml +172 -0
- data/maps/alalc-sin-Sinh-Latn-1997.yaml +292 -0
- data/maps/alalc-sin-Sinh-Latn-2011.yaml +71 -0
- data/maps/alalc-srp-Cyrl-Latn-1997.yaml +5 -1
- data/maps/alalc-srp-Cyrl-Latn-2013.yaml +1 -1
- data/maps/alalc-tam-Taml-Latn-1997.yaml +62 -0
- data/maps/alalc-tam-Taml-Latn-2011.yaml +58 -0
- data/maps/alalc-ukr-Cyrl-Latn-1997.yaml +5 -1
- data/maps/alalc-ukr-Cyrl-Latn-2011.yaml +1 -1
- data/maps/apcbg-bul-Cyrl-Latn-1995.yaml +1 -1
- data/maps/bas-rus-Cyrl-Latn-2017-bss.yaml +1 -1
- data/maps/bas-rus-Cyrl-Latn-2017-oss.yaml +1 -1
- data/maps/bgn-jpn-Hrkt-Latn-1962.yaml +1 -1
- data/maps/bgn-kor-Hang-Latn-1943.yaml +7 -3
- data/maps/bgn-kor-Kore-Latn-1943.yaml +3 -3
- data/maps/bgna-bul-Cyrl-Latn-2006.yaml +1 -1
- data/maps/bgna-bul-Cyrl-Latn-2009.yaml +1 -1
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.yaml +5 -1
- data/maps/bgnpcgn-ara-Arab-Latn-1956.yaml +5 -1
- data/maps/bgnpcgn-arm-Armn-Latn-1981.yaml +1 -1
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.yaml +2 -2
- data/maps/bgnpcgn-bak-Cyrl-Latn-2007.yaml +6 -2
- data/maps/bgnpcgn-bel-Cyrl-Latn-1979.yaml +5 -1
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.yaml +5 -1
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.yaml +5 -1
- data/maps/bgnpcgn-che-Cyrl-Latn-2008.yaml +184 -0
- data/maps/bgnpcgn-ell-Grek-Latn-1962.yaml +5 -1
- data/maps/bgnpcgn-ell-Grek-Latn-1996.yaml +5 -1
- data/maps/{bgnpcgn-per-Arab-Latn-1956.yaml → bgnpcgn-fas-Arab-Latn-1956.yaml} +5 -1
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.yaml +1 -1
- data/maps/bgnpcgn-kat-Geor-Latn-1981.yaml +5 -1
- data/maps/bgnpcgn-kat-Geor-Latn-2009.yaml +1 -1
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.yaml +1 -1
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.yaml +1 -1
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.yaml +1 -1
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.yaml +5 -1
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.yaml +1 -1
- data/maps/bgnpcgn-mon-Cyrl-Latn-1964.yaml +223 -0
- data/maps/bgnpcgn-nep-Deva-Latn-2011.yaml +31 -1
- data/maps/bgnpcgn-per-Arab-Latn-1958.yaml +336 -0
- data/maps/bgnpcgn-prs-Arab-Latn-2007.yaml +639 -0
- data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.yaml +459 -0
- data/maps/bgnpcgn-rue-Cyrl-Latn-2016.yaml +168 -0
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.yaml +5 -1
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.yaml +5 -1
- data/maps/bgnpcgn-tat-Cyrl-Latn-2007.yaml +220 -0
- data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.yaml +240 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.yaml +5 -1
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.yaml +3 -92
- data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.yaml +127 -0
- data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.yaml +82 -0
- data/maps/bgnpcgn-zho-Hans-Latn-1979.yaml +1 -1
- data/maps/bis-asm-Beng-Latn-13194-1991.yaml +1 -1
- data/maps/bis-ben-Beng-Latn-13194-1991.yaml +1 -1
- data/maps/bis-dev-Deva-Latn-13194-1991.yaml +1 -1
- data/maps/{bis-gjr-Gujr-Latn-13194-1991.yaml → bis-guj-Gujr-Latn-13194-1991.yaml} +17 -2
- data/maps/bis-knd-Knda-Latn-13194-1991.yaml +1 -1
- data/maps/bis-mlm-Mlym-Latn-13194-1991.yaml +1 -1
- data/maps/bis-ori-Orya-Latn-13194-1991.yaml +1 -1
- data/maps/bis-pnj-Guru-Latn-13194-1991.yaml +1 -1
- data/maps/bis-tel-Telu-Latn-13194-1991.yaml +1 -1
- data/maps/bis-tml-Taml-Latn-13194-1991.yaml +1 -1
- data/maps/by-bel-Cyrl-Latn-1998.yaml +5 -1
- data/maps/by-bel-Cyrl-Latn-2007.yaml +1 -1
- data/maps/din-grc-Grek-Latn-31634-2011-t1.yaml +899 -0
- data/maps/din-hin-Deva-Latn-33904-2018.yaml +100 -0
- data/maps/din-kat-Geor-Latn-32707-2010.yaml +145 -0
- data/maps/din-mar-Deva-Latn-33904-2018.yaml +84 -0
- data/maps/din-nep-Deva-Latn-33904-2018.yaml +119 -0
- data/maps/din-pli-Deva-Latn-33904-2018.yaml +75 -0
- data/maps/din-pra-Deva-Latn-33904-2018.yaml +63 -0
- data/maps/din-san-Deva-Latn-33904-2018.yaml +338 -0
- data/maps/din-tam-Taml-Latn-33903-2016.yaml +213 -0
- data/maps/dos-nep-Deva-Latn-1997.yaml +15 -1
- data/maps/elot-ell-Grek-Latn-743-1982-tl.yaml +3 -3
- data/maps/elot-ell-Grek-Latn-743-1982-ts.yaml +2 -2
- data/maps/elot-ell-Grek-Latn-743-2001-tl.yaml +2 -2
- data/maps/elot-ell-Grek-Latn-743-2001-ts.yaml +2 -2
- data/maps/ggg-kat-Geor-Latn-2002.yaml +5 -1
- data/maps/gki-bel-Cyrl-Latn-1992.yaml +1 -1
- data/maps/gki-bel-Cyrl-Latn-2000.yaml +1 -1
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.yaml +7 -3
- data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.yaml +157 -0
- data/maps/hk-yue-Hani-Latn-1888.yaml +1 -1
- data/maps/icao-bel-Cyrl-Latn-9303.yaml +1 -1
- data/maps/icao-bul-Cyrl-Latn-9303.yaml +1 -1
- data/maps/{icao-per-Arab-Latn-9303.yaml → icao-fas-Arab-Latn-9303.yaml} +1 -1
- data/maps/icao-heb-Hebr-Latn-9303.yaml +1 -1
- data/maps/icao-mkd-Cyrl-Latn-9303.yaml +1 -1
- data/maps/icao-rus-Cyrl-Latn-9303.yaml +1 -1
- data/maps/icao-srp-Cyrl-Latn-9303.yaml +1 -1
- data/maps/icao-ukr-Cyrl-Latn-9303.yaml +1 -1
- data/maps/iso-ara-Arab-Latn-233-1984.yaml +1 -1
- data/maps/iso-asm-Beng-Latn-15919-2001.yaml +75 -0
- data/maps/iso-ben-Beng-Latn-15919-2001.yaml +175 -0
- data/maps/iso-ell-Grek-Latn-843-1997-t1.yaml +8 -4
- data/maps/iso-ell-Grek-Latn-843-1997-t2.yaml +8 -4
- data/maps/iso-guj-Gujr-Latn-15919-2001.yaml +220 -0
- data/maps/iso-hin-Deva-Latn-15919-2001.yaml +87 -0
- data/maps/iso-inc-Deva-Latn-15919-2001.yaml +61 -0
- data/maps/iso-jpn-Hrkt-Latn-3602-1989.yaml +10 -6
- data/maps/iso-kan-Knda-Latn-15919-2001.yaml +220 -0
- data/maps/iso-kat-Geor-Latn-9984-1996.yaml +145 -0
- data/maps/iso-kor-Hang-Latn-1996-method1.yaml +240 -0
- data/maps/iso-kor-Hang-Latn-1996-method2.yaml +226 -0
- data/maps/iso-mal-Mlym-Latn-15919-2001.yaml +281 -0
- data/maps/iso-mar-Deva-Latn-15919-2001.yaml +75 -0
- data/maps/iso-nep-Deva-Latn-15919-2001.yaml +87 -0
- data/maps/iso-ori-Orya-Latn-15919-2001.yaml +193 -0
- data/maps/iso-pan-Guru-Latn-15919-2001.yaml +222 -0
- data/maps/iso-pli-Beng-Latn-15919-2001.yaml +73 -0
- data/maps/iso-pli-Deva-Latn-15919-2001.yaml +74 -0
- data/maps/iso-pli-Sinh-Latn-15919-2001.yaml +219 -0
- data/maps/iso-pli-Thai-Latn-15919-2001.yaml +55 -0
- data/maps/iso-pra-Deva-Latn-15919-2001.yaml +59 -0
- data/maps/iso-prs-Arab-Latn-233-3-1999.yaml +366 -0
- data/maps/iso-rus-Cyrl-Latn-9-1995.yaml +3 -3
- data/maps/iso-san-Deva-Latn-15919-2001.yaml +220 -0
- data/maps/iso-tam-Taml-Latn-15919-2001.yaml +159 -0
- data/maps/iso-tel-Telu-Latn-15919-2001.yaml +220 -0
- data/maps/iso-tha-Thai-Latn-11940-1998.yaml +1 -1
- data/maps/kp-kor-Hang-Latn-2002.yaml +25 -17
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.yaml +1 -1
- data/maps/mext-jpn-Hrkt-Latn-1954.yaml +1 -1
- data/maps/mns-mon-Cyrl-Latn-5217-2012.yaml +163 -0
- data/maps/mns-mon-Latn-Cyrl-5217-2012.yaml +200 -0
- data/maps/moct-kor-Hang-Latn-2000.yaml +6 -2
- data/maps/mofa-jpn-Hrkt-Latn-1989.yaml +1 -1
- data/maps/mvd-bel-Cyrl-Latn-2008.yaml +2 -2
- data/maps/mvd-bel-Cyrl-Latn-2010.yaml +3 -3
- data/maps/mvd-rus-Cyrl-Latn-2008.yaml +2 -2
- data/maps/mvd-rus-Cyrl-Latn-2010.yaml +2 -2
- data/maps/odni-ara-Arab-Latn-2015.yaml +425 -0
- data/maps/odni-aze-Cyrl-Latn-2015.yaml +1 -1
- data/maps/odni-bel-Cyrl-Latn-2015.yaml +1 -1
- data/maps/odni-bul-Cyrl-Latn-2015.yaml +2 -2
- data/maps/odni-che-Cyrl-Latn-2015.yaml +169 -0
- data/maps/odni-fas-Arab-Latn-2015.yaml +406 -0
- data/maps/odni-hin-Deva-Latn-2015.yaml +1 -1
- data/maps/odni-kat-Geor-Latn-2015.yaml +1 -1
- data/maps/odni-kaz-Cyrl-Latn-2015.yaml +1 -1
- data/maps/odni-kir-Cyrl-Latn-2015.yaml +1 -1
- data/maps/odni-kor-Hang-Latn-2015.yaml +375 -0
- data/maps/odni-mkd-Cyrl-Latn-2015.yaml +1 -1
- data/maps/odni-per-Arab-Latn-2015.yaml +228 -0
- data/maps/odni-rus-Cyrl-Latn-2015.yaml +1 -1
- data/maps/odni-srp-Cyrl-Latn-2015.yaml +1 -1
- data/maps/odni-tat-Cyrl-Latn-2015.yaml +1 -1
- data/maps/odni-tgk-Cyrl-Latn-2015.yaml +1 -1
- data/maps/odni-uig-Cyrl-Latn-2015.yaml +1 -1
- data/maps/odni-ukr-Cyrl-Latn-2015.yaml +1 -1
- data/maps/odni-urd-Arab-Latn-2015.yaml +1 -1
- data/maps/odni-uzb-Cyrl-Latn-2015.yaml +1 -1
- data/maps/royin-tha-Thai-Latn-1939-generic.yaml +1 -1
- data/maps/royin-tha-Thai-Latn-1968.yaml +5 -1
- data/maps/royin-tha-Thai-Latn-1999-chained.yaml +1 -1
- data/maps/royin-tha-Thai-Latn-1999.yaml +5 -1
- data/maps/sac-zho-Hans-Latn-1979.yaml +5 -1
- data/maps/sasm-mon-Mong-Latn-general-1978.yaml +389 -0
- data/maps/sasm-mon-Mong-Latn-phonetic-1978.yaml +354 -0
- data/maps/ses-ara-Arab-Latn-1930.yaml +5 -1
- data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.yaml +1 -1
- data/maps/ua-ukr-Cyrl-Latn-1996.yaml +6 -2
- data/maps/ua-ukr-Cyrl-Latn-2007.yaml +75 -0
- data/maps/ua-ukr-Cyrl-Latn-2010.yaml +192 -0
- data/maps/{ungegn-amh-Ethi-Latn-2016.yaml → un-amh-Ethi-Latn-2016.yaml} +51 -24
- data/maps/un-ara-Arab-Latn-1971.yaml +1 -1
- data/maps/un-ara-Arab-Latn-1972.yaml +1 -1
- data/maps/un-ara-Arab-Latn-2017.yaml +1 -1
- data/maps/un-bel-Cyrl-Latn-2007.yaml +1 -1
- data/maps/un-ben-Beng-Latn-2016.yaml +1 -1
- data/maps/{un-ell-Grek-Latn-phonetic-1987.yaml → un-ell-Grek-Latn-1987-phonetic.yaml} +2 -2
- data/maps/un-ell-Grek-Latn-1987-tl.yaml +2 -2
- data/maps/un-ell-Grek-Latn-1987-ts.yaml +3 -3
- data/maps/un-hin-Deva-Latn-2016.yaml +222 -0
- data/maps/un-mar-Deva-Latn-2016.yaml +91 -0
- data/maps/un-mon-Mong-Latn-general-2013.yaml +264 -0
- data/maps/un-mon-Mong-Latn-phonetic-2013.yaml +264 -0
- data/maps/un-nep-Deva-Latn-1972.yaml +204 -17
- data/maps/un-nep-Deva-Latn-2013.yaml +74 -0
- data/maps/un-rus-Cyrl-Latn-1987.yaml +1 -1
- data/maps/un-ukr-Cyrl-Latn-1998.yaml +35 -12
- data/maps/un-ukr-Cyrl-Latn-2012.yaml +162 -0
- data/maps/var-hin-Deva-Latn-hunterian-1872.yaml +221 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1886.yaml +1 -1
- data/maps/var-jpn-Hrkt-Latn-hepburn-1954.yaml +1 -1
- data/maps/{nil-kor-Hang-Hang-jamo.yaml → var-kor-Hang-Hang-jamo.yaml} +1 -1
- data/maps/var-kor-Hang-Latn-mr-1939.yaml +2 -2
- data/maps/var-kor-Kore-Hang-2013.yaml +1 -1
- data/maps/var-kor-Kore-Latn-mr-1939.yaml +1 -1
- data/maps/var-mar-Deva-Latn-hunterian-1872.yaml +43 -0
- data/maps/var-mon-Mong-Latn-1930.yaml +102 -0
- data/maps/var-mon-Mong-Latn-lessing.yaml +272 -0
- data/maps/var-mon-Mong-Latn-vpmc.yaml +274 -0
- data/maps/var-pra-Deva-Latn-iast-1912.yaml +30 -0
- data/maps/var-san-Deva-Latn-iast-1912.yaml +149 -0
- data/maps/var-tha-Thai-Thai-phonemic.yaml +1 -1
- data/maps/var-tha-Thai-Zsym-ipa.yaml +1 -1
- data/maps/{var-zho-Hani-Latn-1979.yaml → var-zho-Hani-Latn-wd-1979.yaml} +6 -2
- data/spec/interscript/filenames_spec.rb +384 -0
- data/spec/interscript_spec.rb +7 -4
- metadata +105 -26
- data/bin/interscript +0 -41
- data/bin/rspec +0 -29
- data/bin/setup +0 -8
- data/lib/__pycache__/g2pwrapper.cpython-38.pyc +0 -0
- data/lib/interscript-opal.rb +0 -2
- data/lib/interscript/opal_map_translate.rb +0 -12
- data/maps/alalc-hin-Deva-Latn-2020.yaml +0 -159
- data/maps/un-mon-Mong-Latn-2013.yaml +0 -99
|
@@ -0,0 +1,64 @@
|
|
|
1
|
+
---
|
|
2
|
+
authority_id: alalc
|
|
3
|
+
id: 2011
|
|
4
|
+
language: iso-639-2:guj
|
|
5
|
+
source_script: Gujr
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: Gujarati Romanization, 2011
|
|
8
|
+
alias:
|
|
9
|
+
ogc11122:
|
|
10
|
+
code: guj_Gujr2Latn_ALA_2011
|
|
11
|
+
description: Gujarati ALA-Library of Congress 2011 System
|
|
12
|
+
url: https://www.loc.gov/catdir/cpso/romanization/gujarati.pdf
|
|
13
|
+
creation_date: 2011
|
|
14
|
+
description: |
|
|
15
|
+
ALA-LC Romanization table for Gujarati
|
|
16
|
+
|
|
17
|
+
notes:
|
|
18
|
+
|
|
19
|
+
- Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
|
|
20
|
+
vowels following a consonant can be found in grammars; no distinction between the two is
|
|
21
|
+
made in transliteration.
|
|
22
|
+
|
|
23
|
+
- |
|
|
24
|
+
The vowel a is implicit after all consonants and consonant clusters and is supplied in
|
|
25
|
+
transliteration, with the following exceptions:
|
|
26
|
+
a) when another vowel is indicated by its appropriate sign and
|
|
27
|
+
b) when the absence of any vowel is indicated by the subscript symbol ( ્ ) called halanta or
|
|
28
|
+
virāma.
|
|
29
|
+
|
|
30
|
+
- |
|
|
31
|
+
Exception: Anusvāra is transliterated by:
|
|
32
|
+
a) ṅ before gutturals,
|
|
33
|
+
b) ñ before palatals,
|
|
34
|
+
c) ṇ before cerebrals,
|
|
35
|
+
d) n before dentals, and
|
|
36
|
+
e) m before labials.
|
|
37
|
+
|
|
38
|
+
- When doubled, avagraha is transliterated by two apostrophes ( ’’ ).
|
|
39
|
+
|
|
40
|
+
tests:
|
|
41
|
+
- source: "મોર્ગન અને રસેલ ફ્લોપ રહ્યા"
|
|
42
|
+
expected: "mȏrgana anȇ rasȇla phlȏpa rahyā"
|
|
43
|
+
- source: "રોયલ ચેલેન્જર્સ બેંગલોરના કેપ્ટન વિરાટ કોહલીએ કોલકાતા નાઈટ રાઈડર્સ સામે શારજાહ ખાતે ટોસ જીતીને બેટિંગ લીધી છે."
|
|
44
|
+
expected: "rȏyala cȇlȇnjarsa bȇṅgalȏranā kȇpṭana virāṭa kȏhalīȇ kȏlakātā nāīṭa rāīḍarsa sāmȇ śārajāha khātȇ ṭȏsa jītīnȇ bȇṭiṅga līdhī chȇ."
|
|
45
|
+
- source: "અમદાવાદમાં ભણી ચૂકેલા શ્રીકાંત દાતાર પ્રતિષ્ઠિત હાર્વર્ડ બિઝનેસ સ્કૂલના ડીન બન્યા"
|
|
46
|
+
expected: "amadāvādamāṃ bhaṇī cūkȇlā śrīkānta dātāra pratishṭhita hārvarḍa bijhanȇsa skūlanā ḍīna banyā"
|
|
47
|
+
- source: "ઓગસ્ટ મહિનામાં મેન્યુફેક્ચરિંગ સેક્ટરનું ઉત્પાદન ગગડ્યુ"
|
|
48
|
+
expected: "ȏgasṭa mahināmāṃ mȇnyuphȇkcariṅga sȇkṭaranuṃ utpādana gagaḍyu"
|
|
49
|
+
- source: "૯૦ વર્ષમાં બે કરોડમાંથી પોણાબે લાખ કરોડ થઈ ગઈ ટાટા ગ્રુપમાં મિસ્ત્રી પરિવારની શેર્સ વેલ્યુ, જૂના સંબંધો અંત ભણી, જાણો કોને શું મળશે, કોણ શું ગુમાવશે?"
|
|
50
|
+
expected: "90 varshamāṃ bȇ karȏḍamānthī pȏṇābȇ lākha karȏḍa thaī gaī ṭāṭā grupamāṃ mistrī parivāranī śȇrsa vȇlyu, jūnā sambandhȏ anta bhaṇī, jāṇȏ kȏnȇ śuṃ maḷaśȇ, kȏṇa śuṃ gumāvaśȇ?"
|
|
51
|
+
- source: "મુંબઈના એક સ્ટોક બ્રોકરે જણાવ્યું કે ટાટા પોતાના શેર બહાર જતા રોકવા માટે SP ગ્રુપ સાથે સમજૂતી કરી શકે છે."
|
|
52
|
+
expected: "mumbaīnā ȇka sṭȏka brȏkarȇ jaṇāvyuṃ kȇ ṭāṭā pȏtānā śȇra bahāra jatā rȏkavā māṭȇ SP grupa sāthȇ samajūtī karī śakȇ chȇ."
|
|
53
|
+
- source: "કોલકાતા નાઈટ રાઈડર્સનો ઓફ સ્પિનર સુનીલ નારાયણ વિવાદમાં ફસાઈ ગયો છે"
|
|
54
|
+
expected: "kȏlakātā nāīṭa rāīḍarsanȏ ȏpha spinara sunīla nārāyaṇa vivādamāṃ phasāī gayȏ chȇ"
|
|
55
|
+
- source: "ટાટા અને મિસ્ત્રી પરિવાર વચ્ચે શેર્સની આપ-લે થાય એ માટે કોઈ પારસી વ્યક્તિને મધ્યસ્થી બનાવી શકાય છે અને આ માટે રતન ટાટા પણ પ્રયત્નો કરી શકે છે"
|
|
56
|
+
expected: "ṭāṭā anȇ mistrī parivāra vaccȇ śȇrsanī āpa-lȇ thāya ȇ māṭȇ kȏī pārasī vyaktinȇ madhyasthī banāvī śakāya chȇ anȇ ā māṭȇ ratana ṭāṭā paṇa prayatnȏ karī śakȇ chȇ"
|
|
57
|
+
- source: "મેદાની અમ્પાયરોએ પંજાબ વિરુદ્ધની મેચમાં તેની બોલિંગ એક્શન બાબતે શંકા વ્યક્ત કરી હતી. ફરિયાદ પછી હવે નારાયણને વોર્નિંગ લિસ્ટમાં નાખી દેવાયો છે"
|
|
58
|
+
expected: "mȇdānī ampāyarȏȇ pañjāba viruddhanī mȇcamāṃ tȇnī bȏliṅga ȇkśana bābatȇ śaṅkā vyakta karī hatī. phariyāda pachī havȇ nārāyaṇanȇ vȏrniṅga lisṭamāṃ nākhī dȇvāyȏ chȇ"
|
|
59
|
+
- source: "મોદી સરકારના આત્મનિર્ભર ભારત અભિયાનને સફળતા, પાંચ મહિનામાં ચીન સાથેની વેપાર ખાધ અડધી થઈ ગઈ, ચાઈનિઝ સ્માર્ટફોનની હિસ્સેદારી પણ ઘટી"
|
|
60
|
+
expected: "mȏdī sarakāranā ātmanirbhara bhārata abhiyānanȇ saphaḷatā, pāñca mahināmāṃ cīna sāthȇnī vȇpāra khādha aḍadhī thaī gaī, cāīnijha smārṭaphȏnanī hissȇdārī paṇa ghaṭī"
|
|
61
|
+
|
|
62
|
+
map:
|
|
63
|
+
|
|
64
|
+
inherit: 'alalc-guj-Gujr-Latn-1997'
|
|
@@ -0,0 +1,211 @@
|
|
|
1
|
+
---
|
|
2
|
+
authority_id: alalc
|
|
3
|
+
id: 1997
|
|
4
|
+
language: iso-639-2:hin
|
|
5
|
+
source_script: Deva
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: Hindi Romanization, 1997
|
|
8
|
+
alias:
|
|
9
|
+
ogc11122:
|
|
10
|
+
code: hin_Deva2Latn_ALA_1997
|
|
11
|
+
description: Hindi ALA-Library of Congress 1997 System
|
|
12
|
+
url: http://catdir.loc.gov/catdir/cpso/romanization/hindi.pdf
|
|
13
|
+
creation_date: 1997
|
|
14
|
+
description: |
|
|
15
|
+
ALA-LC Romanization table for Hindi
|
|
16
|
+
|
|
17
|
+
notes:
|
|
18
|
+
|
|
19
|
+
- Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
|
|
20
|
+
vowels following a consonant can be found in grammars; no distinction between the two is
|
|
21
|
+
made in transliteration.
|
|
22
|
+
|
|
23
|
+
- |
|
|
24
|
+
The vowel a is implicit after all consonants and consonant clusters and is supplied in
|
|
25
|
+
transliteration, with the following exceptions:
|
|
26
|
+
|
|
27
|
+
a) when another vowel is indicated by its appropriate sign; and
|
|
28
|
+
b) when the absence of any vowel is indicated by the subscript sign ( ◌् ) called halanta or
|
|
29
|
+
virāma.
|
|
30
|
+
|
|
31
|
+
- |
|
|
32
|
+
Exception: Anusvāra is transliterated by:
|
|
33
|
+
|
|
34
|
+
a) ṅ before gutturals,
|
|
35
|
+
b) ñ before palatals,
|
|
36
|
+
c) ṇ before cerebrals,
|
|
37
|
+
d) n before dentals, and
|
|
38
|
+
e) m before labials.
|
|
39
|
+
|
|
40
|
+
- Anunāsika before guttural, palatal, cerebral, and dental occlusives is transliterated n̐. Before
|
|
41
|
+
labials, sibilants, semivowels, aspirates, vowels, and in final position it is transliterated m̐.
|
|
42
|
+
|
|
43
|
+
- When doubled, avagraha is transliterated by two apostrophes ( ’’ ).
|
|
44
|
+
|
|
45
|
+
tests:
|
|
46
|
+
- source: "हम"
|
|
47
|
+
expected: "hama"
|
|
48
|
+
- source: "मीन"
|
|
49
|
+
expected: "maīna"
|
|
50
|
+
- source: "औसत"
|
|
51
|
+
expected: "ăusata"
|
|
52
|
+
- source: "माँऽऽऽ!"
|
|
53
|
+
expected: "maān̐’’’!"
|
|
54
|
+
- source: "माँ"
|
|
55
|
+
expected: "maām̐"
|
|
56
|
+
- source: "गंभीर मरीजों के मामले में भारत दूसरे नंबर पर"
|
|
57
|
+
expected: "gaṃbhaīra maraījaoṃ kae maāmalae maeṃ bhaārata daūsarae naṃbara para"
|
|
58
|
+
- source: "कोरोना अपडेट्स"
|
|
59
|
+
expected: "kaoraonaā apaḍaeṭasa"
|
|
60
|
+
- source: "सीडीसी चीफ का बयान अहम"
|
|
61
|
+
expected: "saīḍaīsaī caīpha kaā bayaāna ahama"
|
|
62
|
+
- source: "गूगल प्ले स्टोर पर पेटीएम की वापसी"
|
|
63
|
+
expected: "gaūgala palae saṭaora para paeṭaīema kaī vaāpasaī"
|
|
64
|
+
- source: "भारत में गैंबलिंग की इजाजत नहीं"
|
|
65
|
+
expected: "bhaārata maeṃ gaaiṃbalaiṅga kaī ijaājata nahaīṃ"
|
|
66
|
+
- source: "कोरोना वैक्सीन मुद्दे पर घिरे राष्ट्रपति; जो बाइडेन बोले- मुझे और देश को वैज्ञानिकों पर भरोसा है, डोनाल्ड ट्रम्प पर नहीं"
|
|
67
|
+
expected: "kaoraonaā vaaikasaīna maudadae para ghairae raāshaṭarapatai; jao baāiḍaena baolae- maujhae ăura daeśa kao vaaijañaānaikaoṃ para bharaosaā haai, ḍaonaālaḍa ṭaramapa para nahaīṃ"
|
|
68
|
+
- source: "गूगल की कार्रवाई पर पेटीएम ने कहा था कि ऐप को अस्थायी तौर पर प्ले-स्टोर से हटाया गया है, आपके पैसे सुरक्षित हैं"
|
|
69
|
+
expected: "gaūgala kaī kaāraravaāī para paeṭaīema nae kahaā thaā kai aipa kao asathaāyaī taăura para palae-saṭaora sae haṭaāyaā gayaā haai, āpakae paaisae saurakashaita haaiṃ"
|
|
70
|
+
- source: "२५६८७५४४६४४६१६११"
|
|
71
|
+
expected: "2568754464461611"
|
|
72
|
+
|
|
73
|
+
map:
|
|
74
|
+
|
|
75
|
+
rules:
|
|
76
|
+
# note[3]
|
|
77
|
+
- pattern: \u0902(?=[कक़खख़गग़घङ])
|
|
78
|
+
result: ṅ
|
|
79
|
+
- pattern: \u0902(?=[चछजज़झञ])
|
|
80
|
+
result: ñ
|
|
81
|
+
- pattern: \u0902(?=[टट़ठडड़ढढ़ण])
|
|
82
|
+
result: ṇ
|
|
83
|
+
- pattern: \u0902(?=[तथदधन])
|
|
84
|
+
result: n
|
|
85
|
+
# note[4]
|
|
86
|
+
- pattern: (?<=)\u0901(?=\b)
|
|
87
|
+
result: "m̐"
|
|
88
|
+
|
|
89
|
+
characters:
|
|
90
|
+
|
|
91
|
+
# I. Vowels and Diphthongs (see Note 1)
|
|
92
|
+
|
|
93
|
+
'अ': 'a'
|
|
94
|
+
'आ': 'ā'
|
|
95
|
+
'इ': 'i'
|
|
96
|
+
'ई': 'ī'
|
|
97
|
+
'उ': 'u'
|
|
98
|
+
'ऊ': 'ū'
|
|
99
|
+
'ऋ': 'ṛ'
|
|
100
|
+
'ॠ': 'ṝ'
|
|
101
|
+
'ऌ': 'ḷ'
|
|
102
|
+
'ॳ': 'ĕ'
|
|
103
|
+
'ए': 'e'
|
|
104
|
+
'ॲ': 'ê'
|
|
105
|
+
'अै': 'ăi'
|
|
106
|
+
'ऐ': 'ai'
|
|
107
|
+
'ऒ': 'ŏ'
|
|
108
|
+
'ओ': 'o'
|
|
109
|
+
'ऑ': 'ô'
|
|
110
|
+
'औ': 'ău'
|
|
111
|
+
|
|
112
|
+
# II. Consonants (see Note 2)
|
|
113
|
+
# Gutturals
|
|
114
|
+
'क': 'ka'
|
|
115
|
+
'क़': 'qa'
|
|
116
|
+
'ख': 'kha'
|
|
117
|
+
'ख़': 'kha'
|
|
118
|
+
'ग': 'ga'
|
|
119
|
+
'ग़': 'gha'
|
|
120
|
+
'घ': 'gha'
|
|
121
|
+
'ङ': 'ṅa'
|
|
122
|
+
|
|
123
|
+
# Palatals
|
|
124
|
+
'च': 'ca'
|
|
125
|
+
'छ': 'cha'
|
|
126
|
+
'ज': 'ja'
|
|
127
|
+
'ज़': 'ja'
|
|
128
|
+
'झ': 'jha'
|
|
129
|
+
'ञ': 'ña'
|
|
130
|
+
|
|
131
|
+
# Cerebrals
|
|
132
|
+
'ट': 'ṭa'
|
|
133
|
+
'ट़': 't̤a'
|
|
134
|
+
'ठ': 'ṭha'
|
|
135
|
+
'ड': 'ḍa'
|
|
136
|
+
'ड़': 'ṛa'
|
|
137
|
+
'ढ': 'ḍha'
|
|
138
|
+
'ढ़': 'ṛha'
|
|
139
|
+
'ण': 'ṇa'
|
|
140
|
+
|
|
141
|
+
# Dentals
|
|
142
|
+
'त': 'ta'
|
|
143
|
+
'थ': 'tha'
|
|
144
|
+
'द': 'da'
|
|
145
|
+
'ध': 'dha'
|
|
146
|
+
'न': 'na'
|
|
147
|
+
|
|
148
|
+
# Labials
|
|
149
|
+
'प': 'pa'
|
|
150
|
+
'फ': 'pha'
|
|
151
|
+
'फ़': 'pha'
|
|
152
|
+
'ब': 'ba'
|
|
153
|
+
'भ': 'bha'
|
|
154
|
+
'म': 'ma'
|
|
155
|
+
|
|
156
|
+
# Semivowels
|
|
157
|
+
'य': 'ya'
|
|
158
|
+
'र': 'ra'
|
|
159
|
+
'ल': 'la'
|
|
160
|
+
'व': 'va'
|
|
161
|
+
|
|
162
|
+
# Sibilants
|
|
163
|
+
'श': 'śa'
|
|
164
|
+
'ष': 'sha'
|
|
165
|
+
'स': 'sa'
|
|
166
|
+
'स़': 's̤a'
|
|
167
|
+
|
|
168
|
+
# Aspirate
|
|
169
|
+
'ह': 'ha'
|
|
170
|
+
'ह़': 'ha'
|
|
171
|
+
|
|
172
|
+
# Anusvāra
|
|
173
|
+
'ं': 'ṃ'
|
|
174
|
+
|
|
175
|
+
# Visarga
|
|
176
|
+
'ः ': 'ḥ'
|
|
177
|
+
|
|
178
|
+
# Anunāsika
|
|
179
|
+
'ँ': 'n̐' # ँ : n̐, m̐
|
|
180
|
+
|
|
181
|
+
# Avagraha
|
|
182
|
+
'ऽ': '’' # (apostrophe)
|
|
183
|
+
|
|
184
|
+
# Medials # Needed for connecting consonants
|
|
185
|
+
'ा': "ā"
|
|
186
|
+
'ॉ': "ô"
|
|
187
|
+
'ि': "i"
|
|
188
|
+
'ी': "ī"
|
|
189
|
+
'ु': "u"
|
|
190
|
+
'ू': "ū"
|
|
191
|
+
'ृ': "ṛ"
|
|
192
|
+
'ॄ': "ṝ"
|
|
193
|
+
'े': "e"
|
|
194
|
+
'ॊ': "ŏ"
|
|
195
|
+
'ौ': "ău"
|
|
196
|
+
'ै': "ai"
|
|
197
|
+
'ो': "o"
|
|
198
|
+
'्': ""
|
|
199
|
+
|
|
200
|
+
# digits
|
|
201
|
+
|
|
202
|
+
'०': '0'
|
|
203
|
+
'१': '1'
|
|
204
|
+
'२': '2'
|
|
205
|
+
'३': '3'
|
|
206
|
+
'४': '4'
|
|
207
|
+
'५': '5'
|
|
208
|
+
'६': '6'
|
|
209
|
+
'७': '7'
|
|
210
|
+
'८': '8'
|
|
211
|
+
'९': '9'
|
|
@@ -0,0 +1,47 @@
|
|
|
1
|
+
---
|
|
2
|
+
authority_id: alalc
|
|
3
|
+
id: 2011
|
|
4
|
+
language: iso-639-2:hin
|
|
5
|
+
source_script: Deva
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: Hindi Romanization, 2011
|
|
8
|
+
url: https://www.loc.gov/catdir/cpso/romanization/hindi.pdf
|
|
9
|
+
creation_date: 1997
|
|
10
|
+
description: |
|
|
11
|
+
ALA-LC Romanization table for Hindi
|
|
12
|
+
|
|
13
|
+
notes:
|
|
14
|
+
|
|
15
|
+
- Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
|
|
16
|
+
vowels following a consonant can be found in grammars; no distinction between the two is
|
|
17
|
+
made in transliteration.
|
|
18
|
+
|
|
19
|
+
- |
|
|
20
|
+
The vowel a is implicit after all consonants and consonant clusters and is supplied in
|
|
21
|
+
transliteration, with the following exceptions:
|
|
22
|
+
|
|
23
|
+
a) when another vowel is indicated by its appropriate sign; and
|
|
24
|
+
b) when the absence of any vowel is indicated by the subscript sign ( ◌् ) called halanta or
|
|
25
|
+
virāma.
|
|
26
|
+
|
|
27
|
+
- |
|
|
28
|
+
Exception: Anusvāra is transliterated by:
|
|
29
|
+
|
|
30
|
+
a) ṅ before gutturals,
|
|
31
|
+
b) ñ before palatals,
|
|
32
|
+
c) ṇ before cerebrals,
|
|
33
|
+
d) n before dentals, and
|
|
34
|
+
e) m before labials.
|
|
35
|
+
|
|
36
|
+
- Anunāsika before guttural, palatal, cerebral, and dental occlusives is transliterated n̐. Before
|
|
37
|
+
labials, sibilants, semivowels, aspirates, vowels, and in final position it is transliterated m̐.
|
|
38
|
+
|
|
39
|
+
- When doubled, avagraha is transliterated by two apostrophes ( ’’ ).
|
|
40
|
+
|
|
41
|
+
tests:
|
|
42
|
+
- source: "इस चुनौतीपूर्ण समय में 'वर्क फ्रॉम होम’ सामान्य बन चुका है"
|
|
43
|
+
expected: "isa caunaăutaīpaūraṇa samaya maeṃ 'varaka pharaôma haoma’ saāmaānaya bana caukaā haai"
|
|
44
|
+
|
|
45
|
+
map:
|
|
46
|
+
|
|
47
|
+
inherit: "alalc-hin-Deva-Latn-1997"
|
|
@@ -1,10 +1,14 @@
|
|
|
1
1
|
---
|
|
2
2
|
authority_id: alalc
|
|
3
3
|
id: 1997
|
|
4
|
-
language: kat
|
|
4
|
+
language: iso-639-2:kat
|
|
5
5
|
source_script: Geor
|
|
6
6
|
destination_script: Latn
|
|
7
7
|
name: ALA-LC Georgian System (1997)
|
|
8
|
+
alias:
|
|
9
|
+
ogc11122:
|
|
10
|
+
code: kat_Geor2Latn_ALA_1997
|
|
11
|
+
description: Georgian ALA-Library of Congress 1997 System
|
|
8
12
|
url: https://www.loc.gov/catdir/cpso/romanization/georgian.pdf
|
|
9
13
|
creation_date: 1997
|
|
10
14
|
confirmation_date: 1997
|
|
@@ -1,10 +1,14 @@
|
|
|
1
1
|
---
|
|
2
2
|
authority_id: alalc
|
|
3
3
|
id: 1997
|
|
4
|
-
language: kor
|
|
4
|
+
language: iso-639-2:kor
|
|
5
5
|
source_script: Hang
|
|
6
6
|
destination_script: Latn
|
|
7
7
|
name: ALA-LC Romanization Table -- Korean (1997)
|
|
8
|
+
alias:
|
|
9
|
+
ogc11122:
|
|
10
|
+
code: kor_Hang2Latn_ALA_1997
|
|
11
|
+
description: Korean ALA-Library of Congress 1997 System
|
|
8
12
|
url: http://catdir.loc.gov/catdir/cpso/romanization/korean.pdf
|
|
9
13
|
creation_date: 1997
|
|
10
14
|
adoption_date:
|
|
@@ -0,0 +1,303 @@
|
|
|
1
|
+
---
|
|
2
|
+
authority_id: alalc
|
|
3
|
+
id: 1997
|
|
4
|
+
language: iso-639-2:mal
|
|
5
|
+
source_script: Mlym
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: Malayalam Romanization, 1997
|
|
8
|
+
alias:
|
|
9
|
+
ogc11122:
|
|
10
|
+
code: mal_Mlym2Latn_ALA_1997
|
|
11
|
+
description: Malayalam ALA-Library of Congress 1997 System
|
|
12
|
+
url: http://catdir.loc.gov/catdir/cpso/romanization/malayala.pdf
|
|
13
|
+
creation_date: 1997
|
|
14
|
+
description: |
|
|
15
|
+
ALA-LC Romanization table for Malayalam
|
|
16
|
+
|
|
17
|
+
|
|
18
|
+
notes:
|
|
19
|
+
|
|
20
|
+
- Only the vowel forms that appear at the beginning of a syllable are listed; the forms used for
|
|
21
|
+
vowels following a consonant can be found in grammars; no distinction between the two is
|
|
22
|
+
made in transliteration.
|
|
23
|
+
|
|
24
|
+
- When ് is used in combination with the vowel u (ഉ്), the combination is also transliterated ŭ.
|
|
25
|
+
|
|
26
|
+
- |
|
|
27
|
+
The vowel a is implicit after all consonants and consonant clusters and is supplied in transliteration, with the following exceptions:
|
|
28
|
+
a) when another vowel is indicated by its appropriate sign
|
|
29
|
+
b) when the absence of any vowel is indicated by the superscript sign ് (also used for the vowel ŭ); and
|
|
30
|
+
c) when the following modified consonantal forms are used:
|
|
31
|
+
ൿ k
|
|
32
|
+
ൻ n
|
|
33
|
+
ൾ ḷ
|
|
34
|
+
ൺ ṇ
|
|
35
|
+
ൽ l
|
|
36
|
+
ർ r
|
|
37
|
+
- When റ appears as a subscript in a cluster (റ്റ), it is transliterated ṯa.
|
|
38
|
+
|
|
39
|
+
- |
|
|
40
|
+
Exception: Anusvāra is transliterated by:
|
|
41
|
+
|
|
42
|
+
a) ṅ before gutturals,
|
|
43
|
+
b) ñ before palatals,
|
|
44
|
+
c) ṇ before cerebrals,
|
|
45
|
+
d) n before dentals, and
|
|
46
|
+
e) m before labials.
|
|
47
|
+
|
|
48
|
+
tests:
|
|
49
|
+
- source: "ചൈനയ്ക്കെതിരെ ലഡാക്കിൽ സദാസജ്ജം; യുഎസിൽനിന്ന് ൭൨,൫൦൦ സിഗ്–൧൬ റൈഫിൾ"
|
|
50
|
+
expected: "cainayŭkŭketire lad̂ākŭkil sadāsajŭjaṃ; yuesilninŭnŭ 72,500 sigŭ–16 ṟaiphiḷ"
|
|
51
|
+
- source: "സർഗഭൂമിക’യ്ക്കില്ല; ലളിതച്ചേച്ചി അങ്ങനെ പറഞ്ഞിട്ടുണ്ടാവില്ല: ആർഎൽവി രാമകൃഷ്ണൻ"
|
|
52
|
+
expected: "sargabhūmika’yŭkŭkilŭla; laḷitacŭcēcŭci aṅŭṅane paṟañŭñiṭŭṭuṇŭṭāvilŭla: ārelvi rāmakṛṣŭṇan"
|
|
53
|
+
- source: "സ്വർണക്കടത്ത്: ഫൈസൽ ഫരീദും റബിന്സും ദുബായിൽ അറസ്റ്റിലായെന്ന് എന്ഐഎ"
|
|
54
|
+
expected: "sŭvarṇakŭkaṭatŭtŭ: phaisal pharīduṃ ṟabinŭsuṃ dubāyil aṟasŭṟŭṟilāyenŭnŭ enŭaie"
|
|
55
|
+
- source: "വരുമോ ചൈനയുടെ വാക്സീൻ?; ആഗോള ഉപയോഗത്തിന് ഡബ്ല്യുഎച്ച്ഒയുമായി ചർച്ച"
|
|
56
|
+
expected: "varumō cainayuṭe vākŭsīn?; āgōḷa upayōgatŭtinŭ d̂abŭlŭyuecŭcŭoyumāyi carcŭca"
|
|
57
|
+
- source: "കുട്ടികളുടെ മാനസിക പിരിമുറുക്കം മാറ്റാൻ പരിശീലനം; ക്ലാസുമായി പോക്സോ പ്രതി"
|
|
58
|
+
expected: "kuṭŭṭikaḷuṭe mānasika pirimuṟukŭkaṃ māṟŭṟān pariśīlanaṃ; kŭlāsumāyi pōkŭsō pŭrati"
|
|
59
|
+
- source: "ആദ്യം അമിത് ഷാ, ഇപ്പോൾ മോദി; ബിജെപിയെ പുണരാൻ ജഗൻ; ആന്ധ്രയിലെ കരുനീക്കങ്ങൾ"
|
|
60
|
+
expected: "ādŭyaṃ amitŭ ṣā, ipŭpōḷ mōdi; bijepiye puṇarān jagan; ānŭdhŭrayile karunīkŭkaṅŭṅaḷ"
|
|
61
|
+
- source: "ലഹരിമരുന്ന് കേസ്: ബിനീഷ് കോടിയേരിയെ ഇഡി 6 മണിക്കൂർ ചോദ്യം ചെയ്തു"
|
|
62
|
+
expected: "laharimarunŭnŭ kēsŭ: binīṣŭ kōṭiyēriye id̂i 6 maṇikŭkūr cōdŭyaṃ ceyŭtu"
|
|
63
|
+
- source: "ഈന്തപ്പഴം വിതരണം ചെയ്തത് ശിവശങ്കര് പറഞ്ഞതു പ്രകാരം: ടി.വി അനുപമയുടെ മൊഴി"
|
|
64
|
+
expected: "īnŭtapŭpaḻaṃ vitaraṇaṃ ceyŭtatŭ śivaśaṅŭkarŭ paṟañŭñatu pŭrakāraṃ: ṭi.vi anupamayuṭe moḻi"
|
|
65
|
+
- source: "൫൦൦൦ മണിക്കൂർ കാത്തിരിക്കാൻ തയാറെന്ന് രാഹുൽ: ഒടുവിൽ വഴങ്ങി ഹരിയാന"
|
|
66
|
+
expected: "5000 maṇikŭkūr kātŭtirikŭkān tayāṟenŭnŭ rāhul: oṭuvil vaḻaṅŭṅi hariyāna"
|
|
67
|
+
- source: "കാരണം ഷോര്ട്ട്സര്ക്യൂട്ടല്ല; കത്തിയത് ഫയല് മാത്രം, സാനിറ്റൈസര് ഉള്പ്പെടെ കത്തിയില്ല"
|
|
68
|
+
expected: "kāraṇaṃ ṣōrŭṭŭṭŭsarŭkŭyūṭŭṭalŭla; katŭtiyatŭ phayalŭ mātŭraṃ, sāniṟŭṟaisarŭ uḷŭpŭpeṭe katŭtiyilŭla"
|
|
69
|
+
- source: "വിമൺ സയൻറിസ്റ്റ്സ് സ്കീം"
|
|
70
|
+
expected: "vimaṇ sayanṟisŭṟŭṟŭsŭ sŭkīṃ"
|
|
71
|
+
|
|
72
|
+
map:
|
|
73
|
+
|
|
74
|
+
rules:
|
|
75
|
+
# note[5]
|
|
76
|
+
- pattern: \u0D02(?=[കഖഗഘങ])
|
|
77
|
+
result: ṅ
|
|
78
|
+
- pattern: \u0D02(?=[ചഛജഝഞ])
|
|
79
|
+
result: ñ
|
|
80
|
+
- pattern: \u0D02(?=[ടഠഡഢണ])
|
|
81
|
+
result: ṇ
|
|
82
|
+
- pattern: \u0D02(?=[തഥദധന])
|
|
83
|
+
result: n
|
|
84
|
+
|
|
85
|
+
# note[3(a,b)]
|
|
86
|
+
- pattern: (['ക']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
87
|
+
result: 'k'
|
|
88
|
+
- pattern: (['ഖ']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
89
|
+
result: 'kh'
|
|
90
|
+
- pattern: (['ഗ']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
91
|
+
result: 'g'
|
|
92
|
+
- pattern: (['ഘ']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
93
|
+
result: 'gh'
|
|
94
|
+
- pattern: (['ങ']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
95
|
+
result: 'ṅ'
|
|
96
|
+
- pattern: (['ച']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
97
|
+
result: 'c'
|
|
98
|
+
- pattern: (['ഛ']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
99
|
+
result: 'ch'
|
|
100
|
+
- pattern: (['ജ']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
101
|
+
result: 'j'
|
|
102
|
+
- pattern: (['ഝ']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
103
|
+
result: 'jh'
|
|
104
|
+
- pattern: (['ഞ']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
105
|
+
result: 'ñ'
|
|
106
|
+
- pattern: (['ട']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
107
|
+
result: 'ṭ'
|
|
108
|
+
- pattern: (['ഠ']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
109
|
+
result: 'ṭh'
|
|
110
|
+
- pattern: (['ഡ']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
111
|
+
result: 'd̂'
|
|
112
|
+
- pattern: (['ഢ']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
113
|
+
result: 'ḍh'
|
|
114
|
+
- pattern: (['ണ']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
115
|
+
result: 'ṇ'
|
|
116
|
+
- pattern: (['ത']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
117
|
+
result: 't'
|
|
118
|
+
- pattern: (['ഥ']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
119
|
+
result: 'th'
|
|
120
|
+
- pattern: (['ദ']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
121
|
+
result: 'd'
|
|
122
|
+
- pattern: (['ധ']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
123
|
+
result: 'dh'
|
|
124
|
+
- pattern: (['ന']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
125
|
+
result: 'n'
|
|
126
|
+
- pattern: (['പ']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
127
|
+
result: 'p'
|
|
128
|
+
- pattern: (['ഫ']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
129
|
+
result: 'ph'
|
|
130
|
+
- pattern: (['ബ']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
131
|
+
result: 'b'
|
|
132
|
+
- pattern: (['ഭ']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
133
|
+
result: 'bh'
|
|
134
|
+
- pattern: (['മ']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
135
|
+
result: 'm'
|
|
136
|
+
- pattern: (['യ']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
137
|
+
result: 'y'
|
|
138
|
+
- pattern: (['ര']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
139
|
+
result: 'r'
|
|
140
|
+
- pattern: (['റ']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
141
|
+
result: 'ṟ'
|
|
142
|
+
- pattern: (['ല']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
143
|
+
result: 'l'
|
|
144
|
+
- pattern: (['ള']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
145
|
+
result: 'ḷ'
|
|
146
|
+
- pattern: (['ഴ']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
147
|
+
result: 'ḻ'
|
|
148
|
+
- pattern: (['വ']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
149
|
+
result: 'v'
|
|
150
|
+
- pattern: (['ശ']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
151
|
+
result: 'ś'
|
|
152
|
+
- pattern: (['ഷ']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
153
|
+
result: 'ṣ'
|
|
154
|
+
- pattern: (['സ']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
155
|
+
result: 's'
|
|
156
|
+
- pattern: (['ഩ']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
157
|
+
result: 'ṉ'
|
|
158
|
+
- pattern: (['ഹ']=?)(?=[\u0d3e\u0d3f\u0d40\u0d41\u0d42\u0d4d\u0d43\u0d44\u0d46\u0d47\u0d48\u0d4a\u0d4b\u0d4c\u0D62\u0D63\u0d4d])
|
|
159
|
+
result: 'h'
|
|
160
|
+
|
|
161
|
+
|
|
162
|
+
|
|
163
|
+
characters:
|
|
164
|
+
|
|
165
|
+
'അ': 'a'
|
|
166
|
+
'ആ': 'ā'
|
|
167
|
+
'ഇ': 'i'
|
|
168
|
+
'ഈ': 'ī'
|
|
169
|
+
'ഉ': 'u'
|
|
170
|
+
'ഊ': 'ū'
|
|
171
|
+
'ഋ': "ṛ"
|
|
172
|
+
'ൠ': "ṝ"
|
|
173
|
+
'ഌ': "ḷ"
|
|
174
|
+
'ൡ': "ḹ"
|
|
175
|
+
|
|
176
|
+
'എ': 'e'
|
|
177
|
+
'ഏ': 'ē'
|
|
178
|
+
'ഐ': 'ai'
|
|
179
|
+
|
|
180
|
+
'ഒ': 'o'
|
|
181
|
+
'ഓ': 'ō'
|
|
182
|
+
'ഔ': 'au'
|
|
183
|
+
|
|
184
|
+
# Consonants
|
|
185
|
+
# Gutturals
|
|
186
|
+
'ക': 'ka'
|
|
187
|
+
'ഖ': 'kha'
|
|
188
|
+
'ഗ': 'ga'
|
|
189
|
+
'ഘ': 'gha'
|
|
190
|
+
'ങ': 'ṅa'
|
|
191
|
+
|
|
192
|
+
# Palatals
|
|
193
|
+
'ച': 'ca'
|
|
194
|
+
'ഛ': 'cha'
|
|
195
|
+
'ജ': 'ja'
|
|
196
|
+
'ഝ': 'jha'
|
|
197
|
+
'ഞ': 'ña'
|
|
198
|
+
|
|
199
|
+
# Cerebrals
|
|
200
|
+
'ട': 'ṭa'
|
|
201
|
+
'ഠ': 'ṭha'
|
|
202
|
+
'ഡ': 'd̂a'
|
|
203
|
+
'ഢ': 'ḍha'
|
|
204
|
+
'ണ': 'ṇa'
|
|
205
|
+
|
|
206
|
+
# Dentals
|
|
207
|
+
'ത': 'ta'
|
|
208
|
+
'ഥ': 'tha'
|
|
209
|
+
'ദ': 'da'
|
|
210
|
+
'ധ': 'dha'
|
|
211
|
+
'ന': 'na'
|
|
212
|
+
|
|
213
|
+
# Labials
|
|
214
|
+
'പ': 'pa'
|
|
215
|
+
'ഫ': 'pha'
|
|
216
|
+
'ബ': 'ba'
|
|
217
|
+
'ഭ': 'bha'
|
|
218
|
+
'മ': 'ma'
|
|
219
|
+
|
|
220
|
+
# Semivowels
|
|
221
|
+
'യ': 'ya'
|
|
222
|
+
'ര': 'ra'
|
|
223
|
+
'റ': 'ṟa'
|
|
224
|
+
'റ്റ': 'ṯṯa' # (see Note 4)
|
|
225
|
+
'ല': 'la'
|
|
226
|
+
'ള': 'ḷa'
|
|
227
|
+
'ഴ': 'ḻa'
|
|
228
|
+
# Sibilants
|
|
229
|
+
'വ': 'va'
|
|
230
|
+
'ശ': 'śa'
|
|
231
|
+
'ഷ': 'ṣa'
|
|
232
|
+
'സ': 'sa'
|
|
233
|
+
'ഩ': 'ṉa'
|
|
234
|
+
|
|
235
|
+
|
|
236
|
+
# Aspirate
|
|
237
|
+
'ഹ': 'ha'
|
|
238
|
+
|
|
239
|
+
# Visarga
|
|
240
|
+
'ഃ': 'ḥ'
|
|
241
|
+
|
|
242
|
+
# Anusvāra
|
|
243
|
+
'ം': 'ṃ'
|
|
244
|
+
|
|
245
|
+
|
|
246
|
+
# Avagraha
|
|
247
|
+
'ഽ': '’' # (apostrophe)
|
|
248
|
+
|
|
249
|
+
# Medials # Needed for connecting consonants
|
|
250
|
+
|
|
251
|
+
'ാ': 'ā'
|
|
252
|
+
'ി': 'i'
|
|
253
|
+
'ീ': 'ī'
|
|
254
|
+
'ു': 'u'
|
|
255
|
+
'ൂ': 'ū'
|
|
256
|
+
'്': 'ŭ'
|
|
257
|
+
'ൃ': "ṛ"
|
|
258
|
+
'ൄ': "ṝ"
|
|
259
|
+
'\u0D62': "ḷ"
|
|
260
|
+
'\u0D63': "ḹ"
|
|
261
|
+
'െ': "e"
|
|
262
|
+
'േ': "ē"
|
|
263
|
+
'ൈ': "ai"
|
|
264
|
+
'ൊ': 'o'
|
|
265
|
+
'ോ': 'ō'
|
|
266
|
+
'ൌ': 'au'
|
|
267
|
+
|
|
268
|
+
'्': ''
|
|
269
|
+
'़': ''
|
|
270
|
+
'ൗ': ''
|
|
271
|
+
"": '' # no need for zero with joiner
|
|
272
|
+
"": '' # no need for zero with non joiner
|
|
273
|
+
|
|
274
|
+
|
|
275
|
+
# numbers
|
|
276
|
+
'൦': '0'
|
|
277
|
+
'൧': '1'
|
|
278
|
+
'൨': '2'
|
|
279
|
+
'൩': '3'
|
|
280
|
+
'൪': '4'
|
|
281
|
+
'൫': '5'
|
|
282
|
+
'൬': '6'
|
|
283
|
+
'൭': '7'
|
|
284
|
+
'൮': '8'
|
|
285
|
+
'൯': '9'
|
|
286
|
+
'൰': '10'
|
|
287
|
+
'൱': '100'
|
|
288
|
+
'൲': '1000'
|
|
289
|
+
|
|
290
|
+
|
|
291
|
+
# Note 3(c)
|
|
292
|
+
|
|
293
|
+
'ൿ': 'k'
|
|
294
|
+
'ൺ': 'ṇ'
|
|
295
|
+
'ൻ': 'n'
|
|
296
|
+
'ൽ': 'l'
|
|
297
|
+
'ൾ': 'ḷ'
|
|
298
|
+
'ർ': 'r'
|
|
299
|
+
'ഉ്': 'ŭ'
|
|
300
|
+
|
|
301
|
+
# extended and ancient forms
|
|
302
|
+
|
|
303
|
+
'ഺ': 'ṯa'
|