unicode-scripts 1.0.0 → 1.1.0
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/CHANGELOG.md +5 -1
- data/README.md +56 -42
- data/data/scripts.marshal.gz +0 -0
- data/lib/unicode/scripts/constants.rb +2 -2
- data/unicode-scripts.gemspec +1 -1
- metadata +7 -8
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA1:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 666893d243411b8d0fb87f4aa33f8e1e4a2b3f2e
|
4
|
+
data.tar.gz: dd8e3e871b501213f3fdbda8ee91507782750fa0
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: efcb7a517a2ac21365468dcc5eab4781050197985b5f2f861a4aaf3ef32eb0926017e3347639c01ca94332ddb0f238f515ff4c06298a019a6c97e8d6b558e538
|
7
|
+
data.tar.gz: 186526edd7ccb980219869c3baf27863a90e1a2301f8d76229c1068d29c76e1c8eb3fe01633cfd175d4370fbf59a5b3a7a40dc5b4ea9c657b8ff44cc92257cbe
|
data/CHANGELOG.md
CHANGED
data/README.md
CHANGED
@@ -2,7 +2,7 @@
|
|
2
2
|
|
3
3
|
Retrieve the [Unicode script(s)](https://en.wikipedia.org/wiki/Script_%28Unicode%29) a string belongs to. Can also return the *Script_Extension* property which is defined as characters which are "commonly used with more than one script, but with a limited number of scripts".
|
4
4
|
|
5
|
-
Unicode version: **
|
5
|
+
Unicode version: **9.0.0**
|
6
6
|
|
7
7
|
Supported Rubies: **2.3**, **2.2**, **2.1**
|
8
8
|
|
@@ -52,10 +52,10 @@ puts Unicode::Scripts.names
|
|
52
52
|
|
53
53
|
# # # Output # # #
|
54
54
|
|
55
|
-
|
55
|
+
Adlam
|
56
56
|
Ahom
|
57
|
+
Anatolian_Hieroglyphs
|
57
58
|
Arabic
|
58
|
-
Imperial_Aramaic
|
59
59
|
Armenian
|
60
60
|
Avestan
|
61
61
|
Balinese
|
@@ -63,21 +63,25 @@ Bamum
|
|
63
63
|
Bassa_Vah
|
64
64
|
Batak
|
65
65
|
Bengali
|
66
|
+
Bhaiksuki
|
66
67
|
Bopomofo
|
67
68
|
Brahmi
|
68
69
|
Braille
|
69
70
|
Buginese
|
70
71
|
Buhid
|
71
|
-
Chakma
|
72
72
|
Canadian_Aboriginal
|
73
73
|
Carian
|
74
|
+
Caucasian_Albanian
|
75
|
+
Chakma
|
74
76
|
Cham
|
75
77
|
Cherokee
|
78
|
+
Common
|
76
79
|
Coptic
|
80
|
+
Cuneiform
|
77
81
|
Cypriot
|
78
82
|
Cyrillic
|
79
|
-
Devanagari
|
80
83
|
Deseret
|
84
|
+
Devanagari
|
81
85
|
Duployan
|
82
86
|
Egyptian_Hieroglyphs
|
83
87
|
Elbasan
|
@@ -89,26 +93,26 @@ Grantha
|
|
89
93
|
Greek
|
90
94
|
Gujarati
|
91
95
|
Gurmukhi
|
92
|
-
Hangul
|
93
96
|
Han
|
97
|
+
Hangul
|
94
98
|
Hanunoo
|
95
99
|
Hatran
|
96
100
|
Hebrew
|
97
101
|
Hiragana
|
98
|
-
|
99
|
-
|
100
|
-
|
101
|
-
|
102
|
-
Old_Italic
|
102
|
+
Imperial_Aramaic
|
103
|
+
Inherited
|
104
|
+
Inscriptional_Pahlavi
|
105
|
+
Inscriptional_Parthian
|
103
106
|
Javanese
|
104
|
-
|
107
|
+
Kaithi
|
108
|
+
Kannada
|
105
109
|
Katakana
|
110
|
+
Katakana_Or_Hiragana
|
111
|
+
Kayah_Li
|
106
112
|
Kharoshthi
|
107
113
|
Khmer
|
108
114
|
Khojki
|
109
|
-
|
110
|
-
Kaithi
|
111
|
-
Tai_Tham
|
115
|
+
Khudawadi
|
112
116
|
Lao
|
113
117
|
Latin
|
114
118
|
Lepcha
|
@@ -119,84 +123,87 @@ Lisu
|
|
119
123
|
Lycian
|
120
124
|
Lydian
|
121
125
|
Mahajani
|
126
|
+
Malayalam
|
122
127
|
Mandaic
|
123
128
|
Manichaean
|
129
|
+
Marchen
|
130
|
+
Meetei_Mayek
|
124
131
|
Mende_Kikakui
|
125
132
|
Meroitic_Cursive
|
126
133
|
Meroitic_Hieroglyphs
|
127
|
-
|
134
|
+
Miao
|
128
135
|
Modi
|
129
136
|
Mongolian
|
130
137
|
Mro
|
131
|
-
Meetei_Mayek
|
132
138
|
Multani
|
133
139
|
Myanmar
|
134
|
-
Old_North_Arabian
|
135
140
|
Nabataean
|
141
|
+
New_Tai_Lue
|
142
|
+
Newa
|
136
143
|
Nko
|
137
144
|
Ogham
|
138
145
|
Ol_Chiki
|
146
|
+
Old_Hungarian
|
147
|
+
Old_Italic
|
148
|
+
Old_North_Arabian
|
149
|
+
Old_Permic
|
150
|
+
Old_Persian
|
151
|
+
Old_South_Arabian
|
139
152
|
Old_Turkic
|
140
153
|
Oriya
|
154
|
+
Osage
|
141
155
|
Osmanya
|
156
|
+
Pahawh_Hmong
|
142
157
|
Palmyrene
|
143
158
|
Pau_Cin_Hau
|
144
|
-
Old_Permic
|
145
159
|
Phags_Pa
|
146
|
-
Inscriptional_Pahlavi
|
147
|
-
Psalter_Pahlavi
|
148
160
|
Phoenician
|
149
|
-
|
150
|
-
Inscriptional_Parthian
|
161
|
+
Psalter_Pahlavi
|
151
162
|
Rejang
|
152
163
|
Runic
|
153
164
|
Samaritan
|
154
|
-
Old_South_Arabian
|
155
165
|
Saurashtra
|
156
|
-
SignWriting
|
157
|
-
Shavian
|
158
166
|
Sharada
|
167
|
+
Shavian
|
159
168
|
Siddham
|
160
|
-
|
169
|
+
SignWriting
|
161
170
|
Sinhala
|
162
171
|
Sora_Sompeng
|
163
172
|
Sundanese
|
164
173
|
Syloti_Nagri
|
165
174
|
Syriac
|
175
|
+
Tagalog
|
166
176
|
Tagbanwa
|
167
|
-
Takri
|
168
177
|
Tai_Le
|
169
|
-
|
170
|
-
Tamil
|
178
|
+
Tai_Tham
|
171
179
|
Tai_Viet
|
180
|
+
Takri
|
181
|
+
Tamil
|
182
|
+
Tangut
|
172
183
|
Telugu
|
173
|
-
Tifinagh
|
174
|
-
Tagalog
|
175
184
|
Thaana
|
176
185
|
Thai
|
177
186
|
Tibetan
|
187
|
+
Tifinagh
|
178
188
|
Tirhuta
|
179
189
|
Ugaritic
|
190
|
+
Unknown
|
180
191
|
Vai
|
181
192
|
Warang_Citi
|
182
|
-
Old_Persian
|
183
|
-
Cuneiform
|
184
193
|
Yi
|
185
|
-
Inherited
|
186
|
-
Common
|
187
|
-
Unknown
|
188
194
|
```
|
189
195
|
|
190
|
-
### Script
|
196
|
+
### Short Script Names
|
191
197
|
|
192
|
-
You can extract all script
|
198
|
+
You can extract all 4 letter script names from the gem like this:
|
193
199
|
|
194
200
|
```ruby
|
195
201
|
require "unicode/scripts"
|
196
|
-
puts Unicode::Scripts.
|
202
|
+
puts Unicode::Scripts.names(format: :short)
|
197
203
|
|
198
204
|
# # # Output # # #
|
199
205
|
|
206
|
+
Adlm
|
200
207
|
Aghb
|
201
208
|
Ahom
|
202
209
|
Arab
|
@@ -208,6 +215,7 @@ Bamu
|
|
208
215
|
Bass
|
209
216
|
Batk
|
210
217
|
Beng
|
218
|
+
Bhks
|
211
219
|
Bopo
|
212
220
|
Brah
|
213
221
|
Brai
|
@@ -219,7 +227,6 @@ Cari
|
|
219
227
|
Cham
|
220
228
|
Cher
|
221
229
|
Copt
|
222
|
-
Qaac
|
223
230
|
Cprt
|
224
231
|
Cyrl
|
225
232
|
Deva
|
@@ -267,6 +274,7 @@ Lydi
|
|
267
274
|
Mahj
|
268
275
|
Mand
|
269
276
|
Mani
|
277
|
+
Marc
|
270
278
|
Mend
|
271
279
|
Merc
|
272
280
|
Mero
|
@@ -279,11 +287,13 @@ Mult
|
|
279
287
|
Mymr
|
280
288
|
Narb
|
281
289
|
Nbat
|
290
|
+
Newa
|
282
291
|
Nkoo
|
283
292
|
Ogam
|
284
293
|
Olck
|
285
294
|
Orkh
|
286
295
|
Orya
|
296
|
+
Osge
|
287
297
|
Osma
|
288
298
|
Palm
|
289
299
|
Pauc
|
@@ -294,6 +304,8 @@ Phlp
|
|
294
304
|
Phnx
|
295
305
|
Plrd
|
296
306
|
Prti
|
307
|
+
Qaac
|
308
|
+
Qaai
|
297
309
|
Rjng
|
298
310
|
Runr
|
299
311
|
Samr
|
@@ -314,6 +326,7 @@ Takr
|
|
314
326
|
Tale
|
315
327
|
Talu
|
316
328
|
Taml
|
329
|
+
Tang
|
317
330
|
Tavt
|
318
331
|
Telu
|
319
332
|
Tfng
|
@@ -329,11 +342,12 @@ Xpeo
|
|
329
342
|
Xsux
|
330
343
|
Yiii
|
331
344
|
Zinh
|
332
|
-
Qaai
|
333
345
|
Zyyy
|
334
346
|
Zzzz
|
335
347
|
```
|
336
348
|
|
349
|
+
See [unicode-x](https://github.com/janlelis/unicode-x) for more Unicode related micro libraries.
|
350
|
+
|
337
351
|
## MIT License
|
338
352
|
|
339
353
|
- Copyright (C) 2016 Jan Lelis <http://janlelis.com>. Released under the MIT license.
|
data/data/scripts.marshal.gz
CHANGED
Binary file
|
@@ -1,7 +1,7 @@
|
|
1
1
|
module Unicode
|
2
2
|
module Scripts
|
3
|
-
VERSION = "1.
|
4
|
-
UNICODE_VERSION = "
|
3
|
+
VERSION = "1.1.0".freeze
|
4
|
+
UNICODE_VERSION = "9.0.0".freeze
|
5
5
|
DATA_DIRECTORY = File.expand_path(File.dirname(__FILE__) + '/../../../data/').freeze
|
6
6
|
INDEX_FILENAME = (DATA_DIRECTORY + '/scripts.marshal.gz').freeze
|
7
7
|
end
|
data/unicode-scripts.gemspec
CHANGED
@@ -6,7 +6,7 @@ Gem::Specification.new do |gem|
|
|
6
6
|
gem.name = "unicode-scripts"
|
7
7
|
gem.version = Unicode::Scripts::VERSION
|
8
8
|
gem.summary = "Which script(s) does a Unicode string belong to?"
|
9
|
-
gem.description = "[Unicode
|
9
|
+
gem.description = "[Unicode #{Unicode::Scripts::UNICODE_VERSION}] Retrieve the Unicode script(s) a string belongs to. Can also return the Script_Extension property which is defined as characters which are 'commonly used with more than one script, but with a limited number of scripts'. "
|
10
10
|
gem.authors = ["Jan Lelis"]
|
11
11
|
gem.email = ["mail@janlelis.de"]
|
12
12
|
gem.homepage = "https://github.com/janlelis/unicode-scripts"
|
metadata
CHANGED
@@ -1,19 +1,18 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: unicode-scripts
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 1.
|
4
|
+
version: 1.1.0
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Jan Lelis
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date: 2016-
|
11
|
+
date: 2016-06-22 00:00:00.000000000 Z
|
12
12
|
dependencies: []
|
13
|
-
description: "[Unicode
|
14
|
-
|
15
|
-
|
16
|
-
scripts'. "
|
13
|
+
description: "[Unicode 9.0.0] Retrieve the Unicode script(s) a string belongs to.
|
14
|
+
Can also return the Script_Extension property which is defined as characters which
|
15
|
+
are 'commonly used with more than one script, but with a limited number of scripts'. "
|
17
16
|
email:
|
18
17
|
- mail@janlelis.de
|
19
18
|
executables: []
|
@@ -25,6 +24,7 @@ files:
|
|
25
24
|
- CHANGELOG.md
|
26
25
|
- CODE_OF_CONDUCT.md
|
27
26
|
- Gemfile
|
27
|
+
- Gemfile.lock
|
28
28
|
- MIT-LICENSE.txt
|
29
29
|
- README.md
|
30
30
|
- Rakefile
|
@@ -55,10 +55,9 @@ required_rubygems_version: !ruby/object:Gem::Requirement
|
|
55
55
|
version: '0'
|
56
56
|
requirements: []
|
57
57
|
rubyforge_project:
|
58
|
-
rubygems_version: 2.
|
58
|
+
rubygems_version: 2.5.1
|
59
59
|
signing_key:
|
60
60
|
specification_version: 4
|
61
61
|
summary: Which script(s) does a Unicode string belong to?
|
62
62
|
test_files:
|
63
63
|
- spec/unicode_scripts_spec.rb
|
64
|
-
has_rdoc:
|