unicode-scripts 1.0.0 → 1.1.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/CHANGELOG.md +5 -1
- data/README.md +56 -42
- data/data/scripts.marshal.gz +0 -0
- data/lib/unicode/scripts/constants.rb +2 -2
- data/unicode-scripts.gemspec +1 -1
- metadata +7 -8
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA1:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 666893d243411b8d0fb87f4aa33f8e1e4a2b3f2e
|
4
|
+
data.tar.gz: dd8e3e871b501213f3fdbda8ee91507782750fa0
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: efcb7a517a2ac21365468dcc5eab4781050197985b5f2f861a4aaf3ef32eb0926017e3347639c01ca94332ddb0f238f515ff4c06298a019a6c97e8d6b558e538
|
7
|
+
data.tar.gz: 186526edd7ccb980219869c3baf27863a90e1a2301f8d76229c1068d29c76e1c8eb3fe01633cfd175d4370fbf59a5b3a7a40dc5b4ea9c657b8ff44cc92257cbe
|
data/CHANGELOG.md
CHANGED
data/README.md
CHANGED
@@ -2,7 +2,7 @@
|
|
2
2
|
|
3
3
|
Retrieve the [Unicode script(s)](https://en.wikipedia.org/wiki/Script_%28Unicode%29) a string belongs to. Can also return the *Script_Extension* property which is defined as characters which are "commonly used with more than one script, but with a limited number of scripts".
|
4
4
|
|
5
|
-
Unicode version: **
|
5
|
+
Unicode version: **9.0.0**
|
6
6
|
|
7
7
|
Supported Rubies: **2.3**, **2.2**, **2.1**
|
8
8
|
|
@@ -52,10 +52,10 @@ puts Unicode::Scripts.names
|
|
52
52
|
|
53
53
|
# # # Output # # #
|
54
54
|
|
55
|
-
|
55
|
+
Adlam
|
56
56
|
Ahom
|
57
|
+
Anatolian_Hieroglyphs
|
57
58
|
Arabic
|
58
|
-
Imperial_Aramaic
|
59
59
|
Armenian
|
60
60
|
Avestan
|
61
61
|
Balinese
|
@@ -63,21 +63,25 @@ Bamum
|
|
63
63
|
Bassa_Vah
|
64
64
|
Batak
|
65
65
|
Bengali
|
66
|
+
Bhaiksuki
|
66
67
|
Bopomofo
|
67
68
|
Brahmi
|
68
69
|
Braille
|
69
70
|
Buginese
|
70
71
|
Buhid
|
71
|
-
Chakma
|
72
72
|
Canadian_Aboriginal
|
73
73
|
Carian
|
74
|
+
Caucasian_Albanian
|
75
|
+
Chakma
|
74
76
|
Cham
|
75
77
|
Cherokee
|
78
|
+
Common
|
76
79
|
Coptic
|
80
|
+
Cuneiform
|
77
81
|
Cypriot
|
78
82
|
Cyrillic
|
79
|
-
Devanagari
|
80
83
|
Deseret
|
84
|
+
Devanagari
|
81
85
|
Duployan
|
82
86
|
Egyptian_Hieroglyphs
|
83
87
|
Elbasan
|
@@ -89,26 +93,26 @@ Grantha
|
|
89
93
|
Greek
|
90
94
|
Gujarati
|
91
95
|
Gurmukhi
|
92
|
-
Hangul
|
93
96
|
Han
|
97
|
+
Hangul
|
94
98
|
Hanunoo
|
95
99
|
Hatran
|
96
100
|
Hebrew
|
97
101
|
Hiragana
|
98
|
-
|
99
|
-
|
100
|
-
|
101
|
-
|
102
|
-
Old_Italic
|
102
|
+
Imperial_Aramaic
|
103
|
+
Inherited
|
104
|
+
Inscriptional_Pahlavi
|
105
|
+
Inscriptional_Parthian
|
103
106
|
Javanese
|
104
|
-
|
107
|
+
Kaithi
|
108
|
+
Kannada
|
105
109
|
Katakana
|
110
|
+
Katakana_Or_Hiragana
|
111
|
+
Kayah_Li
|
106
112
|
Kharoshthi
|
107
113
|
Khmer
|
108
114
|
Khojki
|
109
|
-
|
110
|
-
Kaithi
|
111
|
-
Tai_Tham
|
115
|
+
Khudawadi
|
112
116
|
Lao
|
113
117
|
Latin
|
114
118
|
Lepcha
|
@@ -119,84 +123,87 @@ Lisu
|
|
119
123
|
Lycian
|
120
124
|
Lydian
|
121
125
|
Mahajani
|
126
|
+
Malayalam
|
122
127
|
Mandaic
|
123
128
|
Manichaean
|
129
|
+
Marchen
|
130
|
+
Meetei_Mayek
|
124
131
|
Mende_Kikakui
|
125
132
|
Meroitic_Cursive
|
126
133
|
Meroitic_Hieroglyphs
|
127
|
-
|
134
|
+
Miao
|
128
135
|
Modi
|
129
136
|
Mongolian
|
130
137
|
Mro
|
131
|
-
Meetei_Mayek
|
132
138
|
Multani
|
133
139
|
Myanmar
|
134
|
-
Old_North_Arabian
|
135
140
|
Nabataean
|
141
|
+
New_Tai_Lue
|
142
|
+
Newa
|
136
143
|
Nko
|
137
144
|
Ogham
|
138
145
|
Ol_Chiki
|
146
|
+
Old_Hungarian
|
147
|
+
Old_Italic
|
148
|
+
Old_North_Arabian
|
149
|
+
Old_Permic
|
150
|
+
Old_Persian
|
151
|
+
Old_South_Arabian
|
139
152
|
Old_Turkic
|
140
153
|
Oriya
|
154
|
+
Osage
|
141
155
|
Osmanya
|
156
|
+
Pahawh_Hmong
|
142
157
|
Palmyrene
|
143
158
|
Pau_Cin_Hau
|
144
|
-
Old_Permic
|
145
159
|
Phags_Pa
|
146
|
-
Inscriptional_Pahlavi
|
147
|
-
Psalter_Pahlavi
|
148
160
|
Phoenician
|
149
|
-
|
150
|
-
Inscriptional_Parthian
|
161
|
+
Psalter_Pahlavi
|
151
162
|
Rejang
|
152
163
|
Runic
|
153
164
|
Samaritan
|
154
|
-
Old_South_Arabian
|
155
165
|
Saurashtra
|
156
|
-
SignWriting
|
157
|
-
Shavian
|
158
166
|
Sharada
|
167
|
+
Shavian
|
159
168
|
Siddham
|
160
|
-
|
169
|
+
SignWriting
|
161
170
|
Sinhala
|
162
171
|
Sora_Sompeng
|
163
172
|
Sundanese
|
164
173
|
Syloti_Nagri
|
165
174
|
Syriac
|
175
|
+
Tagalog
|
166
176
|
Tagbanwa
|
167
|
-
Takri
|
168
177
|
Tai_Le
|
169
|
-
|
170
|
-
Tamil
|
178
|
+
Tai_Tham
|
171
179
|
Tai_Viet
|
180
|
+
Takri
|
181
|
+
Tamil
|
182
|
+
Tangut
|
172
183
|
Telugu
|
173
|
-
Tifinagh
|
174
|
-
Tagalog
|
175
184
|
Thaana
|
176
185
|
Thai
|
177
186
|
Tibetan
|
187
|
+
Tifinagh
|
178
188
|
Tirhuta
|
179
189
|
Ugaritic
|
190
|
+
Unknown
|
180
191
|
Vai
|
181
192
|
Warang_Citi
|
182
|
-
Old_Persian
|
183
|
-
Cuneiform
|
184
193
|
Yi
|
185
|
-
Inherited
|
186
|
-
Common
|
187
|
-
Unknown
|
188
194
|
```
|
189
195
|
|
190
|
-
### Script
|
196
|
+
### Short Script Names
|
191
197
|
|
192
|
-
You can extract all script
|
198
|
+
You can extract all 4 letter script names from the gem like this:
|
193
199
|
|
194
200
|
```ruby
|
195
201
|
require "unicode/scripts"
|
196
|
-
puts Unicode::Scripts.
|
202
|
+
puts Unicode::Scripts.names(format: :short)
|
197
203
|
|
198
204
|
# # # Output # # #
|
199
205
|
|
206
|
+
Adlm
|
200
207
|
Aghb
|
201
208
|
Ahom
|
202
209
|
Arab
|
@@ -208,6 +215,7 @@ Bamu
|
|
208
215
|
Bass
|
209
216
|
Batk
|
210
217
|
Beng
|
218
|
+
Bhks
|
211
219
|
Bopo
|
212
220
|
Brah
|
213
221
|
Brai
|
@@ -219,7 +227,6 @@ Cari
|
|
219
227
|
Cham
|
220
228
|
Cher
|
221
229
|
Copt
|
222
|
-
Qaac
|
223
230
|
Cprt
|
224
231
|
Cyrl
|
225
232
|
Deva
|
@@ -267,6 +274,7 @@ Lydi
|
|
267
274
|
Mahj
|
268
275
|
Mand
|
269
276
|
Mani
|
277
|
+
Marc
|
270
278
|
Mend
|
271
279
|
Merc
|
272
280
|
Mero
|
@@ -279,11 +287,13 @@ Mult
|
|
279
287
|
Mymr
|
280
288
|
Narb
|
281
289
|
Nbat
|
290
|
+
Newa
|
282
291
|
Nkoo
|
283
292
|
Ogam
|
284
293
|
Olck
|
285
294
|
Orkh
|
286
295
|
Orya
|
296
|
+
Osge
|
287
297
|
Osma
|
288
298
|
Palm
|
289
299
|
Pauc
|
@@ -294,6 +304,8 @@ Phlp
|
|
294
304
|
Phnx
|
295
305
|
Plrd
|
296
306
|
Prti
|
307
|
+
Qaac
|
308
|
+
Qaai
|
297
309
|
Rjng
|
298
310
|
Runr
|
299
311
|
Samr
|
@@ -314,6 +326,7 @@ Takr
|
|
314
326
|
Tale
|
315
327
|
Talu
|
316
328
|
Taml
|
329
|
+
Tang
|
317
330
|
Tavt
|
318
331
|
Telu
|
319
332
|
Tfng
|
@@ -329,11 +342,12 @@ Xpeo
|
|
329
342
|
Xsux
|
330
343
|
Yiii
|
331
344
|
Zinh
|
332
|
-
Qaai
|
333
345
|
Zyyy
|
334
346
|
Zzzz
|
335
347
|
```
|
336
348
|
|
349
|
+
See [unicode-x](https://github.com/janlelis/unicode-x) for more Unicode related micro libraries.
|
350
|
+
|
337
351
|
## MIT License
|
338
352
|
|
339
353
|
- Copyright (C) 2016 Jan Lelis <http://janlelis.com>. Released under the MIT license.
|
data/data/scripts.marshal.gz
CHANGED
Binary file
|
@@ -1,7 +1,7 @@
|
|
1
1
|
module Unicode
|
2
2
|
module Scripts
|
3
|
-
VERSION = "1.
|
4
|
-
UNICODE_VERSION = "
|
3
|
+
VERSION = "1.1.0".freeze
|
4
|
+
UNICODE_VERSION = "9.0.0".freeze
|
5
5
|
DATA_DIRECTORY = File.expand_path(File.dirname(__FILE__) + '/../../../data/').freeze
|
6
6
|
INDEX_FILENAME = (DATA_DIRECTORY + '/scripts.marshal.gz').freeze
|
7
7
|
end
|
data/unicode-scripts.gemspec
CHANGED
@@ -6,7 +6,7 @@ Gem::Specification.new do |gem|
|
|
6
6
|
gem.name = "unicode-scripts"
|
7
7
|
gem.version = Unicode::Scripts::VERSION
|
8
8
|
gem.summary = "Which script(s) does a Unicode string belong to?"
|
9
|
-
gem.description = "[Unicode
|
9
|
+
gem.description = "[Unicode #{Unicode::Scripts::UNICODE_VERSION}] Retrieve the Unicode script(s) a string belongs to. Can also return the Script_Extension property which is defined as characters which are 'commonly used with more than one script, but with a limited number of scripts'. "
|
10
10
|
gem.authors = ["Jan Lelis"]
|
11
11
|
gem.email = ["mail@janlelis.de"]
|
12
12
|
gem.homepage = "https://github.com/janlelis/unicode-scripts"
|
metadata
CHANGED
@@ -1,19 +1,18 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: unicode-scripts
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 1.
|
4
|
+
version: 1.1.0
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Jan Lelis
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date: 2016-
|
11
|
+
date: 2016-06-22 00:00:00.000000000 Z
|
12
12
|
dependencies: []
|
13
|
-
description: "[Unicode
|
14
|
-
|
15
|
-
|
16
|
-
scripts'. "
|
13
|
+
description: "[Unicode 9.0.0] Retrieve the Unicode script(s) a string belongs to.
|
14
|
+
Can also return the Script_Extension property which is defined as characters which
|
15
|
+
are 'commonly used with more than one script, but with a limited number of scripts'. "
|
17
16
|
email:
|
18
17
|
- mail@janlelis.de
|
19
18
|
executables: []
|
@@ -25,6 +24,7 @@ files:
|
|
25
24
|
- CHANGELOG.md
|
26
25
|
- CODE_OF_CONDUCT.md
|
27
26
|
- Gemfile
|
27
|
+
- Gemfile.lock
|
28
28
|
- MIT-LICENSE.txt
|
29
29
|
- README.md
|
30
30
|
- Rakefile
|
@@ -55,10 +55,9 @@ required_rubygems_version: !ruby/object:Gem::Requirement
|
|
55
55
|
version: '0'
|
56
56
|
requirements: []
|
57
57
|
rubyforge_project:
|
58
|
-
rubygems_version: 2.
|
58
|
+
rubygems_version: 2.5.1
|
59
59
|
signing_key:
|
60
60
|
specification_version: 4
|
61
61
|
summary: Which script(s) does a Unicode string belong to?
|
62
62
|
test_files:
|
63
63
|
- spec/unicode_scripts_spec.rb
|
64
|
-
has_rdoc:
|