regexp_property_values 1.2.0 → 1.4.0

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: 6ce99d3efe4e87c82e59b220f8b8b317edb00f971dd82427bbd73ddfbcaa05ae
4
- data.tar.gz: e3499f430a59db35346f84b708a4aaceedaa8ecdb5dc25b075666b5ff110be4e
3
+ metadata.gz: 3e530cc9c245b9a0295f3f4d155ba9cdb32d2d105c8e6beae6f59771eee8e862
4
+ data.tar.gz: 295197787f2ca187ac8a0ca57eebd1551cf8a243389a107d66fcedb49bc7f792
5
5
  SHA512:
6
- metadata.gz: 9bc766948aa42da07f0e2c2aabee929139e7fe052d2b28ec117ed923e50b25bd8b7214c58f0aeaf08f52c05d8bdc4d613c6b1d70796344eff064fa793c5bb2ae
7
- data.tar.gz: 84256ff9ee3de75f56d2dd6d31ee0f1096ebd28d97fd8f52e085452d550bd53122cf3baaaeac8d7903b6515b659083b478dcb3b81946825472fba73b43605a07
6
+ metadata.gz: 5879eb2ec3999b46aa8fa66340b0d22704f828328285625670ef8bf2e67e1b10162dd89149ff9950f3842bab0f1978f7975fba0a5bdacb0085e3c9bc070afbf5
7
+ data.tar.gz: af154b78b8a44ef2ef7fe988d47564c565ab6e4e1a03ca2bc7a0c1951ef556c2ae6f054fa98fdfb775cb34b2a36913cfa6621dc883a44b533290a50dd4861daa
data/CHANGELOG.md CHANGED
@@ -4,6 +4,16 @@ All notable changes to this project will be documented in this file.
4
4
  The format is based on [Keep a Changelog](http://keepachangelog.com/en/1.0.0/)
5
5
  and this project adheres to [Semantic Versioning](http://semver.org/spec/v2.0.0.html).
6
6
 
7
+ ## [1.4.0] - 2023-06-10
8
+
9
+ ### Added
10
+ - new properties of Ruby 3.2 / Unicode 15.0
11
+
12
+ ## [1.3.0] - 2022-04-07
13
+
14
+ ### Added
15
+ - new properties of Ruby 3.2 / Unicode 14.0
16
+
7
17
  ## [1.2.0] - 2021-12-31
8
18
 
9
19
  ### Added
data/Rakefile CHANGED
@@ -32,3 +32,9 @@ if RUBY_PLATFORM !~ /java/i
32
32
  # recompile before running specs
33
33
  task(:spec).enhance([:compile])
34
34
  end
35
+
36
+ desc 'Update property lists'
37
+ task :update do
38
+ require_relative 'lib/regexp_property_values'
39
+ RegexpPropertyValues.update
40
+ end
data/lib/aliases CHANGED
@@ -35,6 +35,7 @@ Cn;Unassigned
35
35
  Co;Private_Use
36
36
  Combining_Mark;Mark
37
37
  Copt;Coptic
38
+ Cpmn;Cypro_Minoan
38
39
  Cprt;Cypriot
39
40
  Cs;Surrogate
40
41
  Cyrl;Cyrillic
@@ -132,6 +133,7 @@ Mult;Multani
132
133
  Mymr;Myanmar
133
134
  N;Number
134
135
  NChar;Noncharacter_Code_Point
136
+ Nagm;Nag_Mundari
135
137
  Nand;Nandinagari
136
138
  Narb;Old_North_Arabian
137
139
  Nbat;Nabataean
@@ -154,6 +156,7 @@ Orkh;Old_Turkic
154
156
  Orya;Oriya
155
157
  Osge;Osage
156
158
  Osma;Osmanya
159
+ Ougr;Old_Uyghur
157
160
  P;Punctuation
158
161
  PCM;Prepended_Concatenation_Mark
159
162
  Palm;Palmyrene
@@ -218,10 +221,12 @@ Tglg;Tagalog
218
221
  Thaa;Thaana
219
222
  Tibt;Tibetan
220
223
  Tirh;Tirhuta
224
+ Tnsa;Tangsa
221
225
  UIdeo;Unified_Ideograph
222
226
  Ugar;Ugaritic
223
227
  VS;Variation_Selector
224
228
  Vaii;Vai
229
+ Vith;Vithkuqi
225
230
  WSpace;White_Space
226
231
  Wara;Warang_Citi
227
232
  Wcho;Wancho
@@ -5,7 +5,7 @@ module RegexpPropertyValues
5
5
  require 'fileutils'
6
6
  require 'set'
7
7
 
8
- BASE_URL = 'http://www.unicode.org/Public'
8
+ BASE_URL = 'https://www.unicode.org/Public/UCD/latest/ucd'
9
9
 
10
10
  UCD_FILES = %w[
11
11
  Blocks.txt
@@ -38,26 +38,11 @@ module RegexpPropertyValues
38
38
  end
39
39
 
40
40
  def download_ucd_files(ucd_path: nil, emoji_path: nil)
41
- unicode_version = RbConfig::CONFIG.fetch('UNICODE_VERSION')
42
- emoji_version = RbConfig::CONFIG.fetch('UNICODE_EMOJI_VERSION')
43
-
44
- ucd_path ||= ENV['RPV_UCD_PATH']
45
- emoji_path ||= ENV['RPV_EMOJI_PATH']
46
-
47
- if ucd_path.nil? && emoji_path.nil?
48
- puts <<-EOS.gsub(/\n */, ' ')
49
- This try will load ucd and emoji data for the CURRENT RUBY (
50
- (#{RUBY_VERSION} - ucd #{unicode_version}, emoji #{emoji_version}).
51
- Run this on the latest Ruby version you want to support.
52
- Unicode directory structure changes sometimes, so you might need to
53
- pass the right path(s) as keyword args or ENV vars. Continue? [y/n]'
54
- EOS
55
-
56
- return puts 'download skipped.' unless $stdin.gets =~ /^y/i
57
- end
41
+ puts 'This will try to load the latest UCD data. Continue? [y/n]'
42
+ return puts 'download skipped.' unless $stdin.gets =~ /^y/i
58
43
 
59
- ucd_path ||= "#{BASE_URL}/#{unicode_version}/ucd"
60
- emoji_path ||= "#{BASE_URL}/emoji/#{emoji_version}"
44
+ ucd_path ||= ENV['RPV_UCD_PATH'] || BASE_URL
45
+ emoji_path ||= ENV['RPV_EMOJI_PATH'] || "#{BASE_URL}/emoji/"
61
46
 
62
47
  Dir.chdir(TMP_DIR) do
63
48
  UCD_FILES.each { |f| `wget #{ucd_path}/#{f}` }
@@ -76,7 +61,9 @@ module RegexpPropertyValues
76
61
  ]
77
62
 
78
63
  # special properties
79
- @values += %w[Any Assigned In_No_Block Unknown]
64
+ @values += %w[
65
+ Any Assigned Extended_Pictographic In_No_Block Unknown
66
+ ]
80
67
 
81
68
  # legacy properties
82
69
  @values += %w[Newline]
@@ -1,3 +1,3 @@
1
1
  module RegexpPropertyValues
2
- VERSION = '1.2.0'
2
+ VERSION = '1.4.0'
3
3
  end
data/lib/values CHANGED
@@ -7,6 +7,8 @@ Age=11.0
7
7
  Age=12.0
8
8
  Age=12.1
9
9
  Age=13.0
10
+ Age=14.0
11
+ Age=15.0
10
12
  Age=2.0
11
13
  Age=2.1
12
14
  Age=3.0
@@ -71,6 +73,7 @@ Coptic
71
73
  Cuneiform
72
74
  Currency_Symbol
73
75
  Cypriot
76
+ Cypro_Minoan
74
77
  Cyrillic
75
78
  Dash
76
79
  Dash_Punctuation
@@ -94,6 +97,7 @@ Emoji_Modifier_Base
94
97
  Emoji_Presentation
95
98
  Enclosing_Mark
96
99
  Ethiopic
100
+ Extended_Pictographic
97
101
  Extender
98
102
  Final_Punctuation
99
103
  Format
@@ -135,6 +139,8 @@ In_Ancient_Greek_Numbers
135
139
  In_Ancient_Symbols
136
140
  In_Arabic
137
141
  In_Arabic_Extended_A
142
+ In_Arabic_Extended_B
143
+ In_Arabic_Extended_C
138
144
  In_Arabic_Mathematical_Alphabetic_Symbols
139
145
  In_Arabic_Presentation_Forms_A
140
146
  In_Arabic_Presentation_Forms_B
@@ -174,6 +180,7 @@ In_CJK_Unified_Ideographs_Extension_D
174
180
  In_CJK_Unified_Ideographs_Extension_E
175
181
  In_CJK_Unified_Ideographs_Extension_F
176
182
  In_CJK_Unified_Ideographs_Extension_G
183
+ In_CJK_Unified_Ideographs_Extension_H
177
184
  In_Carian
178
185
  In_Caucasian_Albanian
179
186
  In_Chakma
@@ -196,14 +203,17 @@ In_Cuneiform
196
203
  In_Cuneiform_Numbers_and_Punctuation
197
204
  In_Currency_Symbols
198
205
  In_Cypriot_Syllabary
206
+ In_Cypro_Minoan
199
207
  In_Cyrillic
200
208
  In_Cyrillic_Extended_A
201
209
  In_Cyrillic_Extended_B
202
210
  In_Cyrillic_Extended_C
211
+ In_Cyrillic_Extended_D
203
212
  In_Cyrillic_Supplement
204
213
  In_Deseret
205
214
  In_Devanagari
206
215
  In_Devanagari_Extended
216
+ In_Devanagari_Extended_A
207
217
  In_Dingbats
208
218
  In_Dives_Akuru
209
219
  In_Dogra
@@ -222,6 +232,7 @@ In_Enclosed_Ideographic_Supplement
222
232
  In_Ethiopic
223
233
  In_Ethiopic_Extended
224
234
  In_Ethiopic_Extended_A
235
+ In_Ethiopic_Extended_B
225
236
  In_Ethiopic_Supplement
226
237
  In_General_Punctuation
227
238
  In_Geometric_Shapes
@@ -260,13 +271,16 @@ In_Inscriptional_Pahlavi
260
271
  In_Inscriptional_Parthian
261
272
  In_Javanese
262
273
  In_Kaithi
274
+ In_Kaktovik_Numerals
263
275
  In_Kana_Extended_A
276
+ In_Kana_Extended_B
264
277
  In_Kana_Supplement
265
278
  In_Kanbun
266
279
  In_Kangxi_Radicals
267
280
  In_Kannada
268
281
  In_Katakana
269
282
  In_Katakana_Phonetic_Extensions
283
+ In_Kawi
270
284
  In_Kayah_Li
271
285
  In_Kharoshthi
272
286
  In_Khitan_Small_Script
@@ -282,6 +296,8 @@ In_Latin_Extended_B
282
296
  In_Latin_Extended_C
283
297
  In_Latin_Extended_D
284
298
  In_Latin_Extended_E
299
+ In_Latin_Extended_F
300
+ In_Latin_Extended_G
285
301
  In_Lepcha
286
302
  In_Letterlike_Symbols
287
303
  In_Limbu
@@ -329,6 +345,7 @@ In_Myanmar_Extended_A
329
345
  In_Myanmar_Extended_B
330
346
  In_NKo
331
347
  In_Nabataean
348
+ In_Nag_Mundari
332
349
  In_Nandinagari
333
350
  In_New_Tai_Lue
334
351
  In_Newa
@@ -346,6 +363,7 @@ In_Old_Persian
346
363
  In_Old_Sogdian
347
364
  In_Old_South_Arabian
348
365
  In_Old_Turkic
366
+ In_Old_Uyghur
349
367
  In_Optical_Character_Recognition
350
368
  In_Oriya
351
369
  In_Ornamental_Dingbats
@@ -408,6 +426,7 @@ In_Tai_Xuan_Jing_Symbols
408
426
  In_Takri
409
427
  In_Tamil
410
428
  In_Tamil_Supplement
429
+ In_Tangsa
411
430
  In_Tangut
412
431
  In_Tangut_Components
413
432
  In_Tangut_Supplement
@@ -417,15 +436,18 @@ In_Thai
417
436
  In_Tibetan
418
437
  In_Tifinagh
419
438
  In_Tirhuta
439
+ In_Toto
420
440
  In_Transport_and_Map_Symbols
421
441
  In_Ugaritic
422
442
  In_Unified_Canadian_Aboriginal_Syllabics
423
443
  In_Unified_Canadian_Aboriginal_Syllabics_Extended
444
+ In_Unified_Canadian_Aboriginal_Syllabics_Extended_A
424
445
  In_Vai
425
446
  In_Variation_Selectors
426
447
  In_Variation_Selectors_Supplement
427
448
  In_Vedic_Extensions
428
449
  In_Vertical_Forms
450
+ In_Vithkuqi
429
451
  In_Wancho
430
452
  In_Warang_Citi
431
453
  In_Yezidi
@@ -433,6 +455,7 @@ In_Yi_Radicals
433
455
  In_Yi_Syllables
434
456
  In_Yijing_Hexagram_Symbols
435
457
  In_Zanabazar_Square
458
+ In_Znamenny_Musical_Notation
436
459
  Inherited
437
460
  Initial_Punctuation
438
461
  Inscriptional_Pahlavi
@@ -442,6 +465,7 @@ Join_Control
442
465
  Kaithi
443
466
  Kannada
444
467
  Katakana
468
+ Kawi
445
469
  Kayah_Li
446
470
  Kharoshthi
447
471
  Khitan_Small_Script
@@ -488,6 +512,7 @@ Mro
488
512
  Multani
489
513
  Myanmar
490
514
  Nabataean
515
+ Nag_Mundari
491
516
  Nandinagari
492
517
  New_Tai_Lue
493
518
  Newa
@@ -508,6 +533,7 @@ Old_Persian
508
533
  Old_Sogdian
509
534
  Old_South_Arabian
510
535
  Old_Turkic
536
+ Old_Uyghur
511
537
  Open_Punctuation
512
538
  Oriya
513
539
  Osage
@@ -572,6 +598,7 @@ Tai_Tham
572
598
  Tai_Viet
573
599
  Takri
574
600
  Tamil
601
+ Tangsa
575
602
  Tangut
576
603
  Telugu
577
604
  Terminal_Punctuation
@@ -581,6 +608,7 @@ Tibetan
581
608
  Tifinagh
582
609
  Tirhuta
583
610
  Titlecase_Letter
611
+ Toto
584
612
  Ugaritic
585
613
  Unassigned
586
614
  Unified_Ideograph
@@ -590,6 +618,7 @@ Uppercase
590
618
  Uppercase_Letter
591
619
  Vai
592
620
  Variation_Selector
621
+ Vithkuqi
593
622
  Wancho
594
623
  Warang_Citi
595
624
  White_Space
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: regexp_property_values
3
3
  version: !ruby/object:Gem::Version
4
- version: 1.2.0
4
+ version: 1.4.0
5
5
  platform: ruby
6
6
  authors:
7
7
  - Janosch Müller
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2021-12-31 00:00:00.000000000 Z
11
+ date: 2023-06-10 00:00:00.000000000 Z
12
12
  dependencies: []
13
13
  description: This small library lets you see which property values are supported by
14
14
  the regular expression engine of the Ruby version you are running, and what they
@@ -61,7 +61,7 @@ required_rubygems_version: !ruby/object:Gem::Requirement
61
61
  - !ruby/object:Gem::Version
62
62
  version: '0'
63
63
  requirements: []
64
- rubygems_version: 3.3.0.dev
64
+ rubygems_version: 3.4.10
65
65
  signing_key:
66
66
  specification_version: 4
67
67
  summary: Inspect property values supported by Ruby's regex engine