interscript-maps 2.2.1 → 2.3.0

Sign up to get free protection for your applications and to get access to all the features.
Files changed (118)
  1. checksums.yaml +4 -4
  2. data/interscript-maps.gemspec +1 -1
  3. data/interscript-maps.yaml +26 -0
  4. data/maps/alalc-mal-Mlym-Latn-2012.imp +1 -1
  5. data/maps/bas-rus-Cyrl-Latn-2017-bss.imp +1 -1
  6. data/maps/bas-rus-Cyrl-Latn-2017-oss.imp +1 -1
  7. data/maps/bgn-jpn-Hrkt-Latn-1962.imp +1 -1
  8. data/maps/bgn-kor-Hang-Latn-1943.imp +1 -1
  9. data/maps/bgn-kor-Kore-Latn-1943.imp +1 -1
  10. data/maps/bgnpcgn-bak-Cyrl-Latn-2007.imp +1 -1
  11. data/maps/bgnpcgn-bel-Cyrl-Latn-1979.imp +4 -1
  12. data/maps/bgnpcgn-che-Cyrl-Latn-2008.imp +2 -1
  13. data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +1 -1
  14. data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +2 -2
  15. data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +2 -3
  16. data/maps/bis-asm-Beng-Latn-13194-1991.imp +1 -1
  17. data/maps/bis-ben-Beng-Latn-13194-1991.imp +1 -1
  18. data/maps/bis-dev-Deva-Latn-13194-1991.imp +1 -1
  19. data/maps/bis-guj-Gujr-Latn-13194-1991.imp +1 -1
  20. data/maps/bis-kan-Kana-Latn-13194-1991.imp +1 -1
  21. data/maps/bis-mlm-Mlym-Latn-13194-1991.imp +1 -1
  22. data/maps/bis-ori-Orya-Latn-13194-1991.imp +1 -1
  23. data/maps/bis-pnj-Guru-Latn-13194-1991.imp +1 -1
  24. data/maps/bis-tel-Telu-Latn-13194-1991.imp +1 -1
  25. data/maps/bis-tml-Taml-Latn-13194-1991.imp +1 -1
  26. data/maps/din-hin-Deva-Latn-33904-2018.imp +1 -1
  27. data/maps/din-kat-Geor-Latn-32707-2010.imp +12 -12
  28. data/maps/din-mar-Deva-Latn-33904-2018.imp +1 -1
  29. data/maps/din-nep-Deva-Latn-33904-2018.imp +1 -1
  30. data/maps/din-pli-Deva-Latn-33904-2018.imp +1 -1
  31. data/maps/din-pra-Deva-Latn-33904-2018.imp +1 -1
  32. data/maps/din-san-Deva-Latn-33904-2018.imp +1 -1
  33. data/maps/elot-ell-Grek-Latn-743-1982-tl.imp +1 -2
  34. data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +1 -1
  35. data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +1 -1
  36. data/maps/elot-ell-Grek-Latn-743-2001-ts.imp +1 -1
  37. data/maps/iso-ara-Arab-Latn-233-1984.imp +1 -1
  38. data/maps/iso-ara-Arab-Latn-233-2-1993.imp +1 -1
  39. data/maps/iso-asm-Beng-Latn-15919-2001.imp +1 -1
  40. data/maps/iso-ben-Beng-Latn-15919-2001.imp +1 -1
  41. data/maps/iso-ell-Grek-Latn-843-1997-t1.imp +1 -1
  42. data/maps/iso-ell-Grek-Latn-843-1997-t2.imp +1 -1
  43. data/maps/iso-guj-Gujr-Latn-15919-2001.imp +1 -1
  44. data/maps/iso-hin-Deva-Latn-15919-2001.imp +1 -1
  45. data/maps/iso-inc-Deva-Latn-15919-2001.imp +1 -1
  46. data/maps/iso-jpn-Hrkt-Latn-3602-1989.imp +1 -1
  47. data/maps/iso-kan-Kana-Latn-15919-2001.imp +1 -1
  48. data/maps/iso-kat-Geor-Latn-9984-1996.imp +12 -12
  49. data/maps/iso-kor-Hang-Latn-1996-method1.imp +1 -1
  50. data/maps/iso-kor-Hang-Latn-1996-method2.imp +1 -1
  51. data/maps/iso-mal-Mlym-Latn-15919-2001.imp +2 -2
  52. data/maps/iso-mar-Deva-Latn-15919-2001.imp +1 -1
  53. data/maps/iso-nep-Deva-Latn-15919-2001.imp +1 -1
  54. data/maps/iso-ori-Orya-Latn-15919-2001.imp +1 -1
  55. data/maps/iso-pan-Guru-Latn-15919-2001.imp +1 -1
  56. data/maps/iso-pli-Beng-Latn-15919-2001.imp +1 -1
  57. data/maps/iso-pli-Deva-Latn-15919-2001.imp +1 -1
  58. data/maps/iso-pli-Sinh-Latn-15919-2001.imp +1 -1
  59. data/maps/iso-pli-Thai-Latn-15919-2001.imp +1 -1
  60. data/maps/iso-pra-Deva-Latn-15919-2001.imp +1 -1
  61. data/maps/iso-prs-Arab-Latn-233-3-1999.imp +2 -2
  62. data/maps/iso-rus-Cyrl-Latn-9-1995.imp +1 -1
  63. data/maps/iso-san-Deva-Latn-15919-2001.imp +1 -1
  64. data/maps/iso-tam-Taml-Latn-15919-2001.imp +1 -1
  65. data/maps/iso-tel-Telu-Latn-15919-2001.imp +1 -1
  66. data/maps/odni-ara-Arab-Latn-2004.imp +0 -1
  67. data/maps/odni-ara-Arab-Latn-2015.imp +2 -2
  68. data/maps/odni-aze-Cyrl-Latn-2015.imp +1 -1
  69. data/maps/odni-bel-Cyrl-Latn-2015.imp +2 -4
  70. data/maps/odni-bul-Cyrl-Latn-2015.imp +1 -3
  71. data/maps/odni-che-Cyrl-Latn-2015.imp +1 -2
  72. data/maps/odni-fas-Arab-Latn-2004.imp +0 -1
  73. data/maps/odni-fas-Arab-Latn-2015.imp +3 -3
  74. data/maps/odni-hin-Deva-Latn-2004.imp +0 -1
  75. data/maps/odni-hin-Deva-Latn-2015.imp +2 -2
  76. data/maps/odni-kat-Geor-Latn-2015.imp +2 -3
  77. data/maps/odni-kaz-Cyrl-Latn-2015.imp +1 -1
  78. data/maps/odni-kir-Cyrl-Latn-2015.imp +1 -1
  79. data/maps/odni-kor-Hang-Latn-2015.imp +2 -2
  80. data/maps/odni-mkd-Cyrl-Latn-2015.imp +1 -1
  81. data/maps/odni-prs-Arab-Latn-2004.imp +0 -1
  82. data/maps/odni-prs-Arab-Latn-2015.imp +2 -2
  83. data/maps/odni-pus-Arab-Latn-2011.imp +1 -2
  84. data/maps/odni-rus-Cyrl-Latn-2015.imp +1 -3
  85. data/maps/odni-srp-Cyrl-Latn-2005.imp +0 -1
  86. data/maps/odni-srp-Cyrl-Latn-2015.imp +1 -3
  87. data/maps/odni-tat-Cyrl-Latn-2015.imp +1 -1
  88. data/maps/odni-tgk-Cyrl-Latn-2015.imp +1 -1
  89. data/maps/odni-tuk-Cyrl-Latn-2015.imp +1 -2
  90. data/maps/odni-uig-Cyrl-Latn-2015.imp +1 -1
  91. data/maps/odni-ukr-Cyrl-Latn-2015.imp +2 -4
  92. data/maps/odni-urd-Arab-Latn-2015.imp +2 -3
  93. data/maps/odni-uzb-Cyrl-Latn-2015.imp +1 -3
  94. data/maps/ses-ara-Arab-Latn-1930.imp +3 -46
  95. data/maps/un-ara-Arab-Latn-1971.imp +1 -1
  96. data/maps/un-ara-Arab-Latn-1972.imp +1 -1
  97. data/maps/un-ara-Arab-Latn-2017.imp +2 -2
  98. data/maps/un-hin-Deva-Latn-2016.imp +1 -1
  99. data/maps/un-kan-Kana-Latn-2016.imp +1 -1
  100. data/maps/un-mar-Deva-Latn-2016.imp +1 -1
  101. data/maps/un-nep-Deva-Latn-1972.imp +1 -1
  102. data/maps/un-nep-Deva-Latn-2013.imp +1 -1
  103. data/maps/un-ori-Orya-Latn-1972.imp +1 -1
  104. data/maps/un-rus-Cyrl-Latn-1987.imp +1 -1
  105. data/maps/un-sin-Sinh-Latn-1972.imp +15 -3
  106. data/maps/un-urd-Arab-Latn-1972.imp +1 -1
  107. data/maps/var-ara-Arab-Arab-rababa.imp +25 -0
  108. data/maps/var-jpn-Hrkt-Latn-hepburn-1886.imp +1 -1
  109. data/maps/var-jpn-Hrkt-Latn-hepburn-1954.imp +1 -1
  110. data/maps/var-kor-Hang-Latn-mr-1939.imp +1 -1
  111. data/maps/var-kor-Kore-Latn-mr-1939.imp +1 -1
  112. data/maps/var-mar-Deva-Latn-hunterian-1872.imp +0 -1
  113. data/maps/var-mon-Mong-Latn-1930.imp +1 -1
  114. data/maps/var-mon-Mong-Latn-lessing.imp +2 -2
  115. data/maps/var-mon-Mong-Latn-vpmc.imp +2 -2
  116. data/maps/var-pra-Deva-Latn-iast-1912.imp +1 -1
  117. data/maps/var-san-Deva-Latn-iast-1912.imp +1 -1
  118. metadata +2 -1
@@ -1,5 +1,5 @@
1
1
  metadata {
2
- authority_id: ungegn
2
+ authority_id: un
3
3
  id: 2017
4
4
  language: iso-639-2:ara
5
5
  source_script: Arab
@@ -0,0 +1,25 @@
1
+ metadata {
2
+ authority_id: var
3
+ id: rababa
4
+ language: iso-639-2:ara
5
+ source_script: Arab
6
+ destination_script: Latn
7
+ name: RABABA the Arabic Diacritization Library
8
+ url: https://github.com/interscript/rababa/
9
+ description: |
10
+ Arabic diacritization is useful for several practical business cases
11
+ like text to speech or Romanization of Arabic texts or scripts.
12
+
13
+ This map in particular uses the RABABA library to automatically detect
14
+ and add diacritics using machine learning.
15
+ }
16
+
17
+ tests {
18
+ test 'قطر' ,'قِطْرَ'
19
+ test 'abc', 'abc'
20
+ test '‘Iz. Ibrāhīm as-Sa‘danī', '‘Iz. Ibrāhīm as-Sa‘danī'
21
+ }
22
+
23
+ stage {
24
+ rababa config: "200"
25
+ }
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:jpn
5
5
  source_script: Hrkt
6
6
  destination_script: Latn
7
- name: Traditional Hepburn
7
+ name: Traditional Hepburn System
8
8
  url: http://www.ab.cyberhome.ne.jp/~kaizu/roomazi/doc/hep3.html
9
9
  creation_date: 1886
10
10
  adoption_date:
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:jpn
5
5
  source_script: Hrkt
6
6
  destination_script: Latn
7
- name: Modified Hepburn
7
+ name: Modified Hepburn System
8
8
  url:
9
9
  creation_date: 1954
10
10
  adoption_date:
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:kor
5
5
  source_script: Hang
6
6
  destination_script: Latn
7
- name: McCune-Reischauer System
7
+ name: McCune-Reischauer System (Hangul-Latin)
8
8
  url:
9
9
  creation_date: 1939
10
10
  adoption_date:
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:kor
5
5
  source_script: Hang
6
6
  destination_script: Latn
7
- name: McCune-Reischauer System
7
+ name: McCune-Reischauer System (Korean-Latin)
8
8
  url:
9
9
  creation_date: 1939
10
10
  adoption_date:
@@ -11,7 +11,6 @@ metadata {
11
11
  The Hunterian system is the national system of romanization in India.
12
12
 
13
13
  notes:
14
-
15
14
  - a, i and u are used in word-final position. The a in gaon and the u in pur are not accented.
16
15
  - ज्ञ is transliterated gy.
17
16
  - v is used before i.
@@ -48,7 +48,7 @@ metadata {
48
48
  'the state' etc. Multi-letter suffixes most often start with an initial- (consonants),
49
49
  medial- (vowels), or variant-shaped form.
50
50
 
51
- # Note: Provedid sample of "Latin 1931-1939" in https://en.m.wikipedia.org/wiki/Mongolian_Latin_alphabet is not actual transliteration.
51
+ # Note: Provided sample of "Latin 1931-1939" in https://en.m.wikipedia.org/wiki/Mongolian_Latin_alphabet is not actual transliteration.
52
52
  # It's kind of buggy transliteration that mixes Cyrillic and Traditional Mongolian script into Latin based on phonetic sound.
53
53
  # There is no expected transliteration sources found for the tests.
54
54
 
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:mon
5
5
  source_script: Mong
6
6
  destination_script: Latn
7
- name: Transliteration Systems for Uyghur-Mongolian or Vertical or Old Script
7
+ name: Lessing transliteration system for Uyghur-Mongolian script
8
8
  url: https://collab.its.virginia.edu/wiki/tibetan-script/Transliteration%20Schemes%20for%20Mongolian%20Vertical%20Script.html
9
9
  creation_date:
10
10
  description: |
@@ -18,7 +18,7 @@ metadata {
18
18
 
19
19
  notes:
20
20
  - A separated final form of vowels a or e is common, and can appear at the end
21
- of a word, word stem, or suffix. This form rexuires a final-shaped preceding
21
+ of a word, word stem, or suffix. This form requires a final-shaped preceding
22
22
  consonant and an inter-word gap in between. The vowels themselves appear as ᠎ᠠ,
23
23
  and with consonants as ‍ᠬ᠎ᠠ q‑a, ‍ᠷ᠎ᠠ r‑a/r‑e, etc. This gap can be transliterated
24
24
  with a hyphen. In digital typesetting, these forms are triggered by inserting
@@ -1,10 +1,10 @@
1
1
  metadata {
2
2
  authority_id: var
3
- id: VPMC
3
+ id: vpmc
4
4
  language: iso-639-2:mon
5
5
  source_script: Mong
6
6
  destination_script: Latn
7
- name: Transliteration Systems for Uyghur-Mongolian or Vertical or Old Script
7
+ name: VPMC transliteration system for Uyghur-Mongolian script
8
8
  url: https://collab.its.virginia.edu/wiki/tibetan-script/Transliteration%20Schemes%20for%20Mongolian%20Vertical%20Script.html
9
9
  creation_date:
10
10
  description: |
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:pra
5
5
  source_script: Deva
6
6
  destination_script: Latn
7
- name: IAST Sanskrit Devanagari System
7
+ name: IAST Sanskrit Devanagari System (Prakrit)
8
8
  url: https://www.ashtangayoga.info/philosophy/sanskrit-and-devanagari/transliteration/pronunciation-transliterations/
9
9
  creation_date: 1912
10
10
  description:
@@ -4,7 +4,7 @@ metadata {
4
4
  language: iso-639-2:san
5
5
  source_script: Deva
6
6
  destination_script: Latn
7
- name: IAST Sanskrit Devanagari System
7
+ name: IAST Sanskrit Devanagari System (Sanskrit)
8
8
  url: https://www.ashtangayoga.info/philosophy/sanskrit-and-devanagari/transliteration/pronunciation-transliterations/
9
9
  creation_date: 1912
10
10
  description:
metadata CHANGED
@@ -1,7 +1,7 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: interscript-maps
3
3
  version: !ruby/object:Gem::Version
4
- version: 2.2.1
4
+ version: 2.3.0
5
5
  platform: ruby
6
6
  authors:
7
7
  - Ribose Inc.
@@ -299,6 +299,7 @@ files:
299
299
  - maps/un-ukr-Cyrl-Latn-2012.imp
300
300
  - maps/un-urd-Arab-Latn-1972.imp
301
301
  - maps/var-amh-Ethi-Latn-eae-2003.imp
302
+ - maps/var-ara-Arab-Arab-rababa.imp
302
303
  - maps/var-gez-Ethi-Latn-eae-2003.imp
303
304
  - maps/var-hin-Deva-Latn-hunterian-1872.imp
304
305
  - maps/var-jpn-Hrkt-Latn-hepburn-1886.imp