interscript-maps 2.2.1 → 2.3.0
This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/interscript-maps.gemspec +1 -1
- data/interscript-maps.yaml +26 -0
- data/maps/alalc-mal-Mlym-Latn-2012.imp +1 -1
- data/maps/bas-rus-Cyrl-Latn-2017-bss.imp +1 -1
- data/maps/bas-rus-Cyrl-Latn-2017-oss.imp +1 -1
- data/maps/bgn-jpn-Hrkt-Latn-1962.imp +1 -1
- data/maps/bgn-kor-Hang-Latn-1943.imp +1 -1
- data/maps/bgn-kor-Kore-Latn-1943.imp +1 -1
- data/maps/bgnpcgn-bak-Cyrl-Latn-2007.imp +1 -1
- data/maps/bgnpcgn-bel-Cyrl-Latn-1979.imp +4 -1
- data/maps/bgnpcgn-che-Cyrl-Latn-2008.imp +2 -1
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +1 -1
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +2 -2
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +2 -3
- data/maps/bis-asm-Beng-Latn-13194-1991.imp +1 -1
- data/maps/bis-ben-Beng-Latn-13194-1991.imp +1 -1
- data/maps/bis-dev-Deva-Latn-13194-1991.imp +1 -1
- data/maps/bis-guj-Gujr-Latn-13194-1991.imp +1 -1
- data/maps/bis-kan-Kana-Latn-13194-1991.imp +1 -1
- data/maps/bis-mlm-Mlym-Latn-13194-1991.imp +1 -1
- data/maps/bis-ori-Orya-Latn-13194-1991.imp +1 -1
- data/maps/bis-pnj-Guru-Latn-13194-1991.imp +1 -1
- data/maps/bis-tel-Telu-Latn-13194-1991.imp +1 -1
- data/maps/bis-tml-Taml-Latn-13194-1991.imp +1 -1
- data/maps/din-hin-Deva-Latn-33904-2018.imp +1 -1
- data/maps/din-kat-Geor-Latn-32707-2010.imp +12 -12
- data/maps/din-mar-Deva-Latn-33904-2018.imp +1 -1
- data/maps/din-nep-Deva-Latn-33904-2018.imp +1 -1
- data/maps/din-pli-Deva-Latn-33904-2018.imp +1 -1
- data/maps/din-pra-Deva-Latn-33904-2018.imp +1 -1
- data/maps/din-san-Deva-Latn-33904-2018.imp +1 -1
- data/maps/elot-ell-Grek-Latn-743-1982-tl.imp +1 -2
- data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +1 -1
- data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +1 -1
- data/maps/elot-ell-Grek-Latn-743-2001-ts.imp +1 -1
- data/maps/iso-ara-Arab-Latn-233-1984.imp +1 -1
- data/maps/iso-ara-Arab-Latn-233-2-1993.imp +1 -1
- data/maps/iso-asm-Beng-Latn-15919-2001.imp +1 -1
- data/maps/iso-ben-Beng-Latn-15919-2001.imp +1 -1
- data/maps/iso-ell-Grek-Latn-843-1997-t1.imp +1 -1
- data/maps/iso-ell-Grek-Latn-843-1997-t2.imp +1 -1
- data/maps/iso-guj-Gujr-Latn-15919-2001.imp +1 -1
- data/maps/iso-hin-Deva-Latn-15919-2001.imp +1 -1
- data/maps/iso-inc-Deva-Latn-15919-2001.imp +1 -1
- data/maps/iso-jpn-Hrkt-Latn-3602-1989.imp +1 -1
- data/maps/iso-kan-Kana-Latn-15919-2001.imp +1 -1
- data/maps/iso-kat-Geor-Latn-9984-1996.imp +12 -12
- data/maps/iso-kor-Hang-Latn-1996-method1.imp +1 -1
- data/maps/iso-kor-Hang-Latn-1996-method2.imp +1 -1
- data/maps/iso-mal-Mlym-Latn-15919-2001.imp +2 -2
- data/maps/iso-mar-Deva-Latn-15919-2001.imp +1 -1
- data/maps/iso-nep-Deva-Latn-15919-2001.imp +1 -1
- data/maps/iso-ori-Orya-Latn-15919-2001.imp +1 -1
- data/maps/iso-pan-Guru-Latn-15919-2001.imp +1 -1
- data/maps/iso-pli-Beng-Latn-15919-2001.imp +1 -1
- data/maps/iso-pli-Deva-Latn-15919-2001.imp +1 -1
- data/maps/iso-pli-Sinh-Latn-15919-2001.imp +1 -1
- data/maps/iso-pli-Thai-Latn-15919-2001.imp +1 -1
- data/maps/iso-pra-Deva-Latn-15919-2001.imp +1 -1
- data/maps/iso-prs-Arab-Latn-233-3-1999.imp +2 -2
- data/maps/iso-rus-Cyrl-Latn-9-1995.imp +1 -1
- data/maps/iso-san-Deva-Latn-15919-2001.imp +1 -1
- data/maps/iso-tam-Taml-Latn-15919-2001.imp +1 -1
- data/maps/iso-tel-Telu-Latn-15919-2001.imp +1 -1
- data/maps/odni-ara-Arab-Latn-2004.imp +0 -1
- data/maps/odni-ara-Arab-Latn-2015.imp +2 -2
- data/maps/odni-aze-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-bel-Cyrl-Latn-2015.imp +2 -4
- data/maps/odni-bul-Cyrl-Latn-2015.imp +1 -3
- data/maps/odni-che-Cyrl-Latn-2015.imp +1 -2
- data/maps/odni-fas-Arab-Latn-2004.imp +0 -1
- data/maps/odni-fas-Arab-Latn-2015.imp +3 -3
- data/maps/odni-hin-Deva-Latn-2004.imp +0 -1
- data/maps/odni-hin-Deva-Latn-2015.imp +2 -2
- data/maps/odni-kat-Geor-Latn-2015.imp +2 -3
- data/maps/odni-kaz-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-kir-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-kor-Hang-Latn-2015.imp +2 -2
- data/maps/odni-mkd-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-prs-Arab-Latn-2004.imp +0 -1
- data/maps/odni-prs-Arab-Latn-2015.imp +2 -2
- data/maps/odni-pus-Arab-Latn-2011.imp +1 -2
- data/maps/odni-rus-Cyrl-Latn-2015.imp +1 -3
- data/maps/odni-srp-Cyrl-Latn-2005.imp +0 -1
- data/maps/odni-srp-Cyrl-Latn-2015.imp +1 -3
- data/maps/odni-tat-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-tgk-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-tuk-Cyrl-Latn-2015.imp +1 -2
- data/maps/odni-uig-Cyrl-Latn-2015.imp +1 -1
- data/maps/odni-ukr-Cyrl-Latn-2015.imp +2 -4
- data/maps/odni-urd-Arab-Latn-2015.imp +2 -3
- data/maps/odni-uzb-Cyrl-Latn-2015.imp +1 -3
- data/maps/ses-ara-Arab-Latn-1930.imp +3 -46
- data/maps/un-ara-Arab-Latn-1971.imp +1 -1
- data/maps/un-ara-Arab-Latn-1972.imp +1 -1
- data/maps/un-ara-Arab-Latn-2017.imp +2 -2
- data/maps/un-hin-Deva-Latn-2016.imp +1 -1
- data/maps/un-kan-Kana-Latn-2016.imp +1 -1
- data/maps/un-mar-Deva-Latn-2016.imp +1 -1
- data/maps/un-nep-Deva-Latn-1972.imp +1 -1
- data/maps/un-nep-Deva-Latn-2013.imp +1 -1
- data/maps/un-ori-Orya-Latn-1972.imp +1 -1
- data/maps/un-rus-Cyrl-Latn-1987.imp +1 -1
- data/maps/un-sin-Sinh-Latn-1972.imp +15 -3
- data/maps/un-urd-Arab-Latn-1972.imp +1 -1
- data/maps/var-ara-Arab-Arab-rababa.imp +25 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1886.imp +1 -1
- data/maps/var-jpn-Hrkt-Latn-hepburn-1954.imp +1 -1
- data/maps/var-kor-Hang-Latn-mr-1939.imp +1 -1
- data/maps/var-kor-Kore-Latn-mr-1939.imp +1 -1
- data/maps/var-mar-Deva-Latn-hunterian-1872.imp +0 -1
- data/maps/var-mon-Mong-Latn-1930.imp +1 -1
- data/maps/var-mon-Mong-Latn-lessing.imp +2 -2
- data/maps/var-mon-Mong-Latn-vpmc.imp +2 -2
- data/maps/var-pra-Deva-Latn-iast-1912.imp +1 -1
- data/maps/var-san-Deva-Latn-iast-1912.imp +1 -1
- metadata +2 -1
|
@@ -0,0 +1,25 @@
|
|
|
1
|
+
metadata {
|
|
2
|
+
authority_id: var
|
|
3
|
+
id: rababa
|
|
4
|
+
language: iso-639-2:ara
|
|
5
|
+
source_script: Arab
|
|
6
|
+
destination_script: Latn
|
|
7
|
+
name: RABABA the Arabic Diacritization Library
|
|
8
|
+
url: https://github.com/interscript/rababa/
|
|
9
|
+
description: |
|
|
10
|
+
Arabic diacritization is useful for several practical business cases
|
|
11
|
+
like text to speech or Romanization of Arabic texts or scripts.
|
|
12
|
+
|
|
13
|
+
This map in particular uses the RABABA library to automatically detect
|
|
14
|
+
and add diacritics using machine learning.
|
|
15
|
+
}
|
|
16
|
+
|
|
17
|
+
tests {
|
|
18
|
+
test 'قطر' ,'قِطْرَ'
|
|
19
|
+
test 'abc', 'abc'
|
|
20
|
+
test '‘Iz. Ibrāhīm as-Sa‘danī', '‘Iz. Ibrāhīm as-Sa‘danī'
|
|
21
|
+
}
|
|
22
|
+
|
|
23
|
+
stage {
|
|
24
|
+
rababa config: "200"
|
|
25
|
+
}
|
|
@@ -48,7 +48,7 @@ metadata {
|
|
|
48
48
|
'the state' etc. Multi-letter suffixes most often start with an initial- (consonants),
|
|
49
49
|
medial- (vowels), or variant-shaped form.
|
|
50
50
|
|
|
51
|
-
# Note:
|
|
51
|
+
# Note: Provided sample of "Latin 1931-1939" in https://en.m.wikipedia.org/wiki/Mongolian_Latin_alphabet is not actual transliteration.
|
|
52
52
|
# It's kind of buggy transliteration that mixes Cyrillic and Traditional Mongolian script into Latin based on phonetic sound.
|
|
53
53
|
# There is no expected transliteration sources found for the tests.
|
|
54
54
|
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:mon
|
|
5
5
|
source_script: Mong
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: Lessing transliteration system for Uyghur-Mongolian script
|
|
8
8
|
url: https://collab.its.virginia.edu/wiki/tibetan-script/Transliteration%20Schemes%20for%20Mongolian%20Vertical%20Script.html
|
|
9
9
|
creation_date:
|
|
10
10
|
description: |
|
|
@@ -18,7 +18,7 @@ metadata {
|
|
|
18
18
|
|
|
19
19
|
notes:
|
|
20
20
|
- A separated final form of vowels a or e is common, and can appear at the end
|
|
21
|
-
of a word, word stem, or suffix. This form
|
|
21
|
+
of a word, word stem, or suffix. This form requires a final-shaped preceding
|
|
22
22
|
consonant and an inter-word gap in between. The vowels themselves appear as ᠠ,
|
|
23
23
|
and with consonants as ᠬᠠ q‑a, ᠷᠠ r‑a/r‑e, etc. This gap can be transliterated
|
|
24
24
|
with a hyphen. In digital typesetting, these forms are triggered by inserting
|
|
@@ -1,10 +1,10 @@
|
|
|
1
1
|
metadata {
|
|
2
2
|
authority_id: var
|
|
3
|
-
id:
|
|
3
|
+
id: vpmc
|
|
4
4
|
language: iso-639-2:mon
|
|
5
5
|
source_script: Mong
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name:
|
|
7
|
+
name: VPMC transliteration system for Uyghur-Mongolian script
|
|
8
8
|
url: https://collab.its.virginia.edu/wiki/tibetan-script/Transliteration%20Schemes%20for%20Mongolian%20Vertical%20Script.html
|
|
9
9
|
creation_date:
|
|
10
10
|
description: |
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:pra
|
|
5
5
|
source_script: Deva
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name: IAST Sanskrit Devanagari System
|
|
7
|
+
name: IAST Sanskrit Devanagari System (Prakrit)
|
|
8
8
|
url: https://www.ashtangayoga.info/philosophy/sanskrit-and-devanagari/transliteration/pronunciation-transliterations/
|
|
9
9
|
creation_date: 1912
|
|
10
10
|
description:
|
|
@@ -4,7 +4,7 @@ metadata {
|
|
|
4
4
|
language: iso-639-2:san
|
|
5
5
|
source_script: Deva
|
|
6
6
|
destination_script: Latn
|
|
7
|
-
name: IAST Sanskrit Devanagari System
|
|
7
|
+
name: IAST Sanskrit Devanagari System (Sanskrit)
|
|
8
8
|
url: https://www.ashtangayoga.info/philosophy/sanskrit-and-devanagari/transliteration/pronunciation-transliterations/
|
|
9
9
|
creation_date: 1912
|
|
10
10
|
description:
|
metadata
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
|
2
2
|
name: interscript-maps
|
|
3
3
|
version: !ruby/object:Gem::Version
|
|
4
|
-
version: 2.2.1
|
|
4
|
+
version: 2.3.0
|
|
5
5
|
platform: ruby
|
|
6
6
|
authors:
|
|
7
7
|
- Ribose Inc.
|
|
@@ -299,6 +299,7 @@ files:
|
|
|
299
299
|
- maps/un-ukr-Cyrl-Latn-2012.imp
|
|
300
300
|
- maps/un-urd-Arab-Latn-1972.imp
|
|
301
301
|
- maps/var-amh-Ethi-Latn-eae-2003.imp
|
|
302
|
+
- maps/var-ara-Arab-Arab-rababa.imp
|
|
302
303
|
- maps/var-gez-Ethi-Latn-eae-2003.imp
|
|
303
304
|
- maps/var-hin-Deva-Latn-hunterian-1872.imp
|
|
304
305
|
- maps/var-jpn-Hrkt-Latn-hepburn-1886.imp
|