interscript-maps 2.1.0a9 → 2.1.0b1

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: 787f7a3ee5db4f80a918eccb4946d7b6dc0b79a9b9dc0bdb7d5dbe2492418661
4
- data.tar.gz: 5394992e449ef98b9fd1013ed96c89227a2386c96a968986949749d1090720e5
3
+ metadata.gz: 8b43dc37aa94446eb83bfececb00291e1fe7ebf17c11e7f0a11969196d33f179
4
+ data.tar.gz: c919d5084e1ac1e97985e0357bacdf282611d8717ae72175e18ed7f2e74d3582
5
5
  SHA512:
6
- metadata.gz: 86ac00b08f434be0192a6dc2af179e51b4df6b688644f78a40b4671c82de6ad0672954bf156477f7be677fb96ad417dce2ca8c63e47b01e3bcdb078403b4a2ca
7
- data.tar.gz: 545f34e8f83bf57d77064b50f8089ceb5ae4a062b027f25aefe16bf208df354efc4764067cd3ab7c02b576d5c89a41797e441abeaab73fb85a4d88d6776755ed
6
+ metadata.gz: c4df63fb4c1c30c63cf11c5ea61b727001d14840f856073de1c65eaaa59153e5ba9c3918ec9ba234a3dcc4e945331b3247d8667545b0fe75c9854b75472b9f62
7
+ data.tar.gz: db7750b60fbab7dcef42d4e05fd3320a41f06c2c2ed8639aae6ddb52be547e73d0e8c7e6e59b2f7134c3e2274c695226bea148bff71989db47fd31a7c1f32da2
@@ -1,4 +1,4 @@
1
- INTERSCRIPT_MAPS_VERSION="2.1.0a9"
1
+ INTERSCRIPT_MAPS_VERSION="2.1.0b1"
2
2
 
3
3
  Gem::Specification.new do |spec|
4
4
  spec.name = "interscript-maps"
@@ -7,15 +7,16 @@ metadata {
7
7
  name: Hong Kong Government Cantonese Romanisation
8
8
  url: http://caes.hku.hk/hkjalonline/issues/download_the_file.php?f=2008_v11_1_kataoka__n__lee.pdf
9
9
  creation_date: 2020-01
10
- description:
11
- - This system is commonly used for the transliteration of place names or
12
- person's names in Hong Kong, as pronounced in Cantonese. There will be more
13
- than one legitimate transliteration for the same syllable, or sometimes even
14
- for the same character. For example, the character 仔 can be transcribed as
15
- Chai or Tsai in this system. Some of the choice is context-depenedent (e.g.
16
- the same character in the place name 灣仔 is almost always Chai, but more likely
17
- to be Tsai elsewhere). There will be more variations and unpredictabilities in
18
- person's names, and these conventions need to be hard-coded.
10
+ description: |
11
+ This system is commonly used for the transliteration of place names or
12
+ person's names in Hong Kong, as pronounced in Cantonese. There will be more
13
+ than one legitimate transliteration for the same syllable, or sometimes even
14
+ for the same character. For example, the character 仔 can be transcribed as
15
+ Chai or Tsai in this system. Some of the choice is context-dependent (e.g.
16
+ the same character in the place name 灣仔 is almost always Chai, but more
17
+ likely to be Tsai elsewhere). There will be more variations and
18
+ unpredictable conversions in person's names, and these conventions need to
19
+ be hard-coded.
19
20
 
20
21
  notes:
21
22
  - Tone is not represented in this system.
@@ -27,10 +28,9 @@ metadata {
27
28
  distinctions were represented by ’ or diacritics (e.g. á vs. a), but were
28
29
  removed in printed / typeset documents.
29
30
 
30
-
31
- #A longer test list will be generated from GeoNames database
32
31
  }
33
32
 
33
+ # TODO: A longer test list will be generated from GeoNames database
34
34
  tests {
35
35
  test "煎魚灣", "Tsin Yue Wan"
36
36
  test "分流廟灣", "Fan Lau Miu Wan"
@@ -38,7 +38,7 @@ metadata {
38
38
  غ is ġ instead of gh
39
39
  ة is ẗ instead of h/t
40
40
  ى is ỳ
41
- ـِي is iy instead of iy
41
+ ـِي is iy instead of ī
42
42
  ـُو is uw instead of ū
43
43
  ـَا is a’ instead of ā
44
44
  ـَى is aỳ instead of á
@@ -55,7 +55,6 @@ tests {
55
55
 
56
56
  stage {
57
57
 
58
-
59
58
  # CHARACTERS
60
59
  parallel {
61
60
 
@@ -105,7 +104,6 @@ stage {
105
104
 
106
105
  # Shadda
107
106
 
108
-
109
107
  sub "\u0628\u0651", "bb" # ب
110
108
  sub "\u062a\u0651", "tt" # ت
111
109
  sub "\u062b\u0651", "ṯṯ" # ث
@@ -133,7 +131,6 @@ stage {
133
131
  sub "\u0648\u0651", "ww" # و
134
132
  sub "\u064a\u0651", "yy" # ي
135
133
 
136
-
137
134
  sub "\u0622", "’â" # آ
138
135
 
139
136
  sub "\u0627", "â" # ا
@@ -142,7 +139,6 @@ stage {
142
139
 
143
140
  sub "\u0626", "'" # ئ
144
141
 
145
-
146
142
  sub "\u0621", maybe("’") # ء# see note A
147
143
 
148
144
  sub "\u0623", "a" # أ
@@ -86,14 +86,14 @@ tests {
86
86
  stage {
87
87
 
88
88
  # RULES
89
- sub capture("\u2019\u0415"), "Je" # Е
90
- sub capture("\u2019\u0435"), "je" # е
91
- sub capture("\u2019\u0401"), "Jo" # Ë
92
- sub capture("\u2019\u0451"), "jo" # ё
93
- sub capture("\u2019\u042E"), "Ju" # Ю
94
- sub capture("\u2019\u044E"), "ju" # ю
95
- sub capture("\u2019\u042F"), "Ja" # Я
96
- sub capture("\u2019\u044F"), "ja" # я
89
+ sub "\u2019\u0415", "Je" # Е
90
+ sub "\u2019\u0435", "je" # е
91
+ sub "\u2019\u0401", "Jo" # Ë
92
+ sub "\u2019\u0451", "jo" # ё
93
+ sub "\u2019\u042E", "Ju" # Ю
94
+ sub "\u2019\u044E", "ju" # ю
95
+ sub "\u2019\u042F", "Ja" # Я
96
+ sub "\u2019\u044F", "ja" # я
97
97
 
98
98
  sub "\u0415", "Je", before: any("АаЕеЁёИиОоУуЭэЮюЯяЬьЎў") # Е after vowels
99
99
  sub "\u0435", "je", before: any("АаЕеЁёИиОоУуЭэЮюЯяЬьЎў") # е after vowels
@@ -43,8 +43,9 @@ stage {
43
43
 
44
44
  # RULES
45
45
  # note[5]
46
- sub "\u044C", ref( 1 ), before: any("ЗзЛлНнСсЦц") # ь after consonants
47
- sub "\u02B9", ref( 1 ), before: any("ЗзЛлНнСсЦц") # Ь after consonants
46
+ # Those two are nonsense and harmful for reversibility
47
+ # sub "\u044C", ref( 1 ), before: any("ЗзЛлНнСсЦц") # ь after consonants
48
+ # sub "\u02B9", ref( 1 ), before: any("ЗзЛлНнСсЦц") # Ь after consonants
48
49
  # Й at end
49
50
  sub "\u0419" + line_end, "", before: any("ЕеЁёЫыЮюЯя") # Я after vowels
50
51
  sub "\u0439" + line_end, "", before: any("ЕеЁёЫыЮюЯя") # я after vowels
metadata CHANGED
@@ -1,7 +1,7 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: interscript-maps
3
3
  version: !ruby/object:Gem::Version
4
- version: 2.1.0a9
4
+ version: 2.1.0b1
5
5
  platform: ruby
6
6
  authors:
7
7
  - Ribose Inc.