tokenizers 0.5.3-x64-mingw-ucrt → 0.5.4-x64-mingw-ucrt

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: 2575d80ae3967271482554c3a2e871dca95ce6545864a0222ac8571cd52aa5c9
4
- data.tar.gz: 1970e935847b5ff6c2f4fa87ee0219796e1734eb8e777fca6f2a4c7c46108022
3
+ metadata.gz: c6bb67a2361bc8e34a9561f9b5d6afa684f9315e2a24a21519ede0e0143d4545
4
+ data.tar.gz: 3835ac6ca9ac2a2fc50b351c97663a870344a995b1bf68920a2c289f236c5568
5
5
  SHA512:
6
- metadata.gz: 83c10038a44a00931c296cc6549cf5a1614446a094bfb9a87923fa57361e4c5eadfc52b81e27edfcd32d3b9e3ca8dde9d4a40d84df9c1844b16826a936784373
7
- data.tar.gz: 6d7659d3928d03ffeb20632d3d0c44a34cda7882a96963e22d6e009b15c8c2935f3e45e879a515569b71e7dc524c5143b5220d76af46f322213399a94269c59f
6
+ metadata.gz: de40170d02d6359ba3f53b8e8a53c552af7618654045f4888c6eb44e06c28b6ce7df99c0b31acb3c8da4bea566e4515973d43fb5fd01cde3a3c68c05f675e3b2
7
+ data.tar.gz: '082ae45456ce3543afbb3f551d21df793b3fdf23f60705c12bf9a0a1be71a8ef28d903cdebb41e1d66e5453c919f41db21cb757a4e8f2940ebff555d8623a1f2'
data/CHANGELOG.md CHANGED
@@ -1,3 +1,8 @@
1
+ ## 0.5.4 (2024-12-28)
2
+
3
+ - Updated Tokenizers to 0.21.0
4
+ - Added support for Ruby 3.4
5
+
1
6
  ## 0.5.3 (2024-09-17)
2
7
 
3
8
  - Added `AddedToken` class
data/Cargo.lock CHANGED
@@ -19,9 +19,9 @@ checksum = "9e1b586273c5702936fe7b7d6896644d8be71e6314cfe09d3167c95f712589e8"
19
19
 
20
20
  [[package]]
21
21
  name = "bindgen"
22
- version = "0.69.4"
22
+ version = "0.69.5"
23
23
  source = "registry+https://github.com/rust-lang/crates.io-index"
24
- checksum = "a00dc851838a2120612785d195287475a3ac45514741da670b735818822129a0"
24
+ checksum = "271383c67ccabffb7381723dea0672a673f292304fcb45c01cc648c7a8d58088"
25
25
  dependencies = [
26
26
  "bitflags 2.6.0",
27
27
  "cexpr",
@@ -49,6 +49,12 @@ version = "2.6.0"
49
49
  source = "registry+https://github.com/rust-lang/crates.io-index"
50
50
  checksum = "b048fb63fd8b5923fc5aa7b340d8e156aec7ec02f0c78fa8a6ddc2613f6f71de"
51
51
 
52
+ [[package]]
53
+ name = "bumpalo"
54
+ version = "3.16.0"
55
+ source = "registry+https://github.com/rust-lang/crates.io-index"
56
+ checksum = "79296716171880943b8470b5f8d03aa55eb2e645a4874bdbb28adb49162e012c"
57
+
52
58
  [[package]]
53
59
  name = "byteorder"
54
60
  version = "1.5.0"
@@ -57,9 +63,9 @@ checksum = "1fd0f2584146f6f2ef48085050886acf353beff7305ebd1ae69500e27c67f64b"
57
63
 
58
64
  [[package]]
59
65
  name = "cc"
60
- version = "1.1.15"
66
+ version = "1.2.6"
61
67
  source = "registry+https://github.com/rust-lang/crates.io-index"
62
- checksum = "57b6a275aa2903740dc87da01c62040406b8812552e97129a63ea8850a17c6e6"
68
+ checksum = "8d6dbb628b8f8555f86d0323c2eb39e3ec81901f4b83e091db8a6a76d316a333"
63
69
  dependencies = [
64
70
  "shlex",
65
71
  ]
@@ -92,22 +98,22 @@ dependencies = [
92
98
 
93
99
  [[package]]
94
100
  name = "console"
95
- version = "0.15.8"
101
+ version = "0.15.10"
96
102
  source = "registry+https://github.com/rust-lang/crates.io-index"
97
- checksum = "0e1f83fc076bd6dd27517eacdf25fef6c4dfe5f1d7448bafaaf3a26f13b5e4eb"
103
+ checksum = "ea3c6ecd8059b57859df5c69830340ed3c41d30e3da0c1cbed90a96ac853041b"
98
104
  dependencies = [
99
105
  "encode_unicode",
100
- "lazy_static",
101
106
  "libc",
107
+ "once_cell",
102
108
  "unicode-width",
103
109
  "windows-sys",
104
110
  ]
105
111
 
106
112
  [[package]]
107
113
  name = "crossbeam-deque"
108
- version = "0.8.5"
114
+ version = "0.8.6"
109
115
  source = "registry+https://github.com/rust-lang/crates.io-index"
110
- checksum = "613f8cc01fe9cf1a3eb3d7f488fd2fa8388403e97039e2f73692932e291a770d"
116
+ checksum = "9dd111b7b7f7d55b72c0a6ae361660ee5853c9af73f70c3c2ef6858b950e2e51"
111
117
  dependencies = [
112
118
  "crossbeam-epoch",
113
119
  "crossbeam-utils",
@@ -124,9 +130,9 @@ dependencies = [
124
130
 
125
131
  [[package]]
126
132
  name = "crossbeam-utils"
127
- version = "0.8.20"
133
+ version = "0.8.21"
128
134
  source = "registry+https://github.com/rust-lang/crates.io-index"
129
- checksum = "22ec99545bb0ed0ea7bb9b8e1e9122ea386ff8a48c0922e43f36d45ab09e0e80"
135
+ checksum = "d0a5c400df2834b80a4c3327b3aad3a4c4cd4de0629063962b03235697506a28"
130
136
 
131
137
  [[package]]
132
138
  name = "darling"
@@ -165,18 +171,18 @@ dependencies = [
165
171
 
166
172
  [[package]]
167
173
  name = "derive_builder"
168
- version = "0.20.0"
174
+ version = "0.20.2"
169
175
  source = "registry+https://github.com/rust-lang/crates.io-index"
170
- checksum = "0350b5cb0331628a5916d6c5c0b72e97393b8b6b03b47a9284f4e7f5a405ffd7"
176
+ checksum = "507dfb09ea8b7fa618fcf76e953f4f5e192547945816d5358edffe39f6f94947"
171
177
  dependencies = [
172
178
  "derive_builder_macro",
173
179
  ]
174
180
 
175
181
  [[package]]
176
182
  name = "derive_builder_core"
177
- version = "0.20.0"
183
+ version = "0.20.2"
178
184
  source = "registry+https://github.com/rust-lang/crates.io-index"
179
- checksum = "d48cda787f839151732d396ac69e3473923d54312c070ee21e9effcaa8ca0b1d"
185
+ checksum = "2d5bcf7b024d6835cfb3d473887cd966994907effbe9227e8c8219824d06c4e8"
180
186
  dependencies = [
181
187
  "darling",
182
188
  "proc-macro2",
@@ -186,9 +192,9 @@ dependencies = [
186
192
 
187
193
  [[package]]
188
194
  name = "derive_builder_macro"
189
- version = "0.20.0"
195
+ version = "0.20.2"
190
196
  source = "registry+https://github.com/rust-lang/crates.io-index"
191
- checksum = "206868b8242f27cecce124c19fd88157fbd0dd334df2587f36417bafbc85097b"
197
+ checksum = "ab63b0e2bf4d5928aff72e83a7dace85d7bba5fe12dcc3c5a572d78caffd3f3c"
192
198
  dependencies = [
193
199
  "derive_builder_core",
194
200
  "syn",
@@ -202,9 +208,9 @@ checksum = "60b1af1c220855b6ceac025d3f6ecdd2b7c4894bfe9cd9bda4fbb4bc7c0d4cf0"
202
208
 
203
209
  [[package]]
204
210
  name = "encode_unicode"
205
- version = "0.3.6"
211
+ version = "1.0.0"
206
212
  source = "registry+https://github.com/rust-lang/crates.io-index"
207
- checksum = "a357d28ed41a50f9c765dbfe56cbc04a64e53e5fc58ba79fbc34c10ef3df831f"
213
+ checksum = "34aa73646ffb006b8f5147f3dc182bd4bcb190227ce861fc4a4844bf8e3cb2c0"
208
214
 
209
215
  [[package]]
210
216
  name = "esaxx-rs"
@@ -234,9 +240,9 @@ dependencies = [
234
240
 
235
241
  [[package]]
236
242
  name = "glob"
237
- version = "0.3.1"
243
+ version = "0.3.2"
238
244
  source = "registry+https://github.com/rust-lang/crates.io-index"
239
- checksum = "d2fabcfbdc87f4758337ca535fb41a6d701b65693ce38287d856d1674551ec9b"
245
+ checksum = "a8d1add55171497b4705a648c6b583acafb01d58050a51727785f0b2c8e0a2b2"
240
246
 
241
247
  [[package]]
242
248
  name = "ident_case"
@@ -246,24 +252,15 @@ checksum = "b9e0384b61958566e926dc50660321d12159025e767c18e043daf26b70104c39"
246
252
 
247
253
  [[package]]
248
254
  name = "indicatif"
249
- version = "0.17.8"
255
+ version = "0.17.9"
250
256
  source = "registry+https://github.com/rust-lang/crates.io-index"
251
- checksum = "763a5a8f45087d6bcea4222e7b72c291a054edf80e4ef6efd2a4979878c7bea3"
257
+ checksum = "cbf675b85ed934d3c67b5c5469701eec7db22689d0a2139d856e0925fa28b281"
252
258
  dependencies = [
253
259
  "console",
254
- "instant",
255
260
  "number_prefix",
256
261
  "portable-atomic",
257
262
  "unicode-width",
258
- ]
259
-
260
- [[package]]
261
- name = "instant"
262
- version = "0.1.13"
263
- source = "registry+https://github.com/rust-lang/crates.io-index"
264
- checksum = "e0242819d153cba4b4b05a5a8f2a7e9bbf97b6055b2a002b395c96b5ff3c0222"
265
- dependencies = [
266
- "cfg-if",
263
+ "web-time",
267
264
  ]
268
265
 
269
266
  [[package]]
@@ -286,9 +283,19 @@ dependencies = [
286
283
 
287
284
  [[package]]
288
285
  name = "itoa"
289
- version = "1.0.11"
286
+ version = "1.0.14"
290
287
  source = "registry+https://github.com/rust-lang/crates.io-index"
291
- checksum = "49f1f14873335454500d59611f1cf4a4b0f786f9ac11f4312a78e4cf2566695b"
288
+ checksum = "d75a2a4b1b190afb6f5425f10f6a8f959d2ea0b9c2b1d79553551850539e4674"
289
+
290
+ [[package]]
291
+ name = "js-sys"
292
+ version = "0.3.76"
293
+ source = "registry+https://github.com/rust-lang/crates.io-index"
294
+ checksum = "6717b6b5b077764fb5966237269cb3c64edddde4b14ce42647430a78ced9e7b7"
295
+ dependencies = [
296
+ "once_cell",
297
+ "wasm-bindgen",
298
+ ]
292
299
 
293
300
  [[package]]
294
301
  name = "lazy_static"
@@ -304,15 +311,15 @@ checksum = "830d08ce1d1d941e6b30645f1a0eb5643013d835ce3779a5fc208261dbe10f55"
304
311
 
305
312
  [[package]]
306
313
  name = "libc"
307
- version = "0.2.158"
314
+ version = "0.2.169"
308
315
  source = "registry+https://github.com/rust-lang/crates.io-index"
309
- checksum = "d8adc4bb1803a324070e64a98ae98f38934d91957a99cfb3a43dcbc01bc56439"
316
+ checksum = "b5aba8db14291edd000dfcc4d620c7ebfb122c613afb886ca8803fa4e128a20a"
310
317
 
311
318
  [[package]]
312
319
  name = "libloading"
313
- version = "0.8.5"
320
+ version = "0.8.6"
314
321
  source = "registry+https://github.com/rust-lang/crates.io-index"
315
- checksum = "4979f22fdb869068da03c9f7528f8297c6fd2606bc3a4affe42e6a823fdb8da4"
322
+ checksum = "fc2f4eb4bc735547cfed7c0a4922cbd04a4655978c09b54f1f7b228750664c34"
316
323
  dependencies = [
317
324
  "cfg-if",
318
325
  "windows-targets",
@@ -414,9 +421,9 @@ checksum = "830b246a0e5f20af87141b25c173cd1b609bd7779a4617d6ec582abaf90870f3"
414
421
 
415
422
  [[package]]
416
423
  name = "once_cell"
417
- version = "1.19.0"
424
+ version = "1.20.2"
418
425
  source = "registry+https://github.com/rust-lang/crates.io-index"
419
- checksum = "3fdb12b2476b595f9358c5161aa467c2438859caa136dec86c26fdd2efe17b92"
426
+ checksum = "1261fe7e33c73b354eab43b1273a57c8f967d0391e80353e51f764ac02cf6775"
420
427
 
421
428
  [[package]]
422
429
  name = "onig"
@@ -448,15 +455,15 @@ checksum = "57c0d7b74b563b49d38dae00a0c37d4d6de9b432382b2892f0574ddcae73fd0a"
448
455
 
449
456
  [[package]]
450
457
  name = "pkg-config"
451
- version = "0.3.30"
458
+ version = "0.3.31"
452
459
  source = "registry+https://github.com/rust-lang/crates.io-index"
453
- checksum = "d231b230927b5e4ad203db57bbcbee2802f6bce620b1e4a9024a07d94e2907ec"
460
+ checksum = "953ec861398dccce10c670dfeaf3ec4911ca479e9c02154b3a215178c5f566f2"
454
461
 
455
462
  [[package]]
456
463
  name = "portable-atomic"
457
- version = "1.7.0"
464
+ version = "1.10.0"
458
465
  source = "registry+https://github.com/rust-lang/crates.io-index"
459
- checksum = "da544ee218f0d287a911e9c99a39a8c9bc8fcad3cb8db5959940044ecfc67265"
466
+ checksum = "280dc24453071f1b63954171985a0b0d30058d287960968b9b2aca264c8d4ee6"
460
467
 
461
468
  [[package]]
462
469
  name = "ppv-lite86"
@@ -469,18 +476,18 @@ dependencies = [
469
476
 
470
477
  [[package]]
471
478
  name = "proc-macro2"
472
- version = "1.0.86"
479
+ version = "1.0.92"
473
480
  source = "registry+https://github.com/rust-lang/crates.io-index"
474
- checksum = "5e719e8df665df0d1c8fbfd238015744736151d4445ec0836b8e628aae103b77"
481
+ checksum = "37d3544b3f2748c54e147655edb5025752e2303145b5aefb3c3ea2c78b973bb0"
475
482
  dependencies = [
476
483
  "unicode-ident",
477
484
  ]
478
485
 
479
486
  [[package]]
480
487
  name = "quote"
481
- version = "1.0.37"
488
+ version = "1.0.38"
482
489
  source = "registry+https://github.com/rust-lang/crates.io-index"
483
- checksum = "b5b9d34b8991d19d98081b46eacdd8eb58c6f2b201139f7c5f643cc155a633af"
490
+ checksum = "0e4dccaaaf89514f546c693ddc140f729f958c247918a13380cccc6078391acc"
484
491
  dependencies = [
485
492
  "proc-macro2",
486
493
  ]
@@ -548,18 +555,18 @@ dependencies = [
548
555
 
549
556
  [[package]]
550
557
  name = "rb-sys"
551
- version = "0.9.102"
558
+ version = "0.9.105"
552
559
  source = "registry+https://github.com/rust-lang/crates.io-index"
553
- checksum = "df4dec4b1d304c3b308a2cd86b1216ea45dd4361f4e9fa056f108332d0a450c1"
560
+ checksum = "4b3a1f3ce8e7c36d777d52fe7a99039fe4fea7c8ec355a4c4f3a17f92a14029f"
554
561
  dependencies = [
555
562
  "rb-sys-build",
556
563
  ]
557
564
 
558
565
  [[package]]
559
566
  name = "rb-sys-build"
560
- version = "0.9.102"
567
+ version = "0.9.105"
561
568
  source = "registry+https://github.com/rust-lang/crates.io-index"
562
- checksum = "1d71de3e29d174b8fb17b5d4470f27d7aa2605f8a9d05fda0d3aeff30e05a570"
569
+ checksum = "3e6b246c29c0809e1cbe60a1ba9e093da72a4676d02adc68469297d1e589bbf0"
563
570
  dependencies = [
564
571
  "bindgen",
565
572
  "lazy_static",
@@ -578,9 +585,9 @@ checksum = "a35802679f07360454b418a5d1735c89716bde01d35b1560fc953c1415a0b3bb"
578
585
 
579
586
  [[package]]
580
587
  name = "regex"
581
- version = "1.10.6"
588
+ version = "1.11.1"
582
589
  source = "registry+https://github.com/rust-lang/crates.io-index"
583
- checksum = "4219d74c6b67a3654a9fbebc4b419e22126d13d2f3c4a07ee0cb61ff79a79619"
590
+ checksum = "b544ef1b4eac5dc2db33ea63606ae9ffcfac26c1416a2806ae0bf5f56b201191"
584
591
  dependencies = [
585
592
  "aho-corasick",
586
593
  "memchr",
@@ -590,9 +597,9 @@ dependencies = [
590
597
 
591
598
  [[package]]
592
599
  name = "regex-automata"
593
- version = "0.4.7"
600
+ version = "0.4.9"
594
601
  source = "registry+https://github.com/rust-lang/crates.io-index"
595
- checksum = "38caf58cc5ef2fed281f89292ef23f6365465ed9a41b7a7754eb4e26496c92df"
602
+ checksum = "809e8dc61f6de73b46c85f4c96486310fe304c434cfa43669d7b40f711150908"
596
603
  dependencies = [
597
604
  "aho-corasick",
598
605
  "memchr",
@@ -601,9 +608,9 @@ dependencies = [
601
608
 
602
609
  [[package]]
603
610
  name = "regex-syntax"
604
- version = "0.8.4"
611
+ version = "0.8.5"
605
612
  source = "registry+https://github.com/rust-lang/crates.io-index"
606
- checksum = "7a66a03ae7c801facd77a29370b4faec201768915ac14a721ba36f20bc9c209b"
613
+ checksum = "2b15c43186be67a4fd63bee50d0303afffcef381492ebe2c5d87f324e1b8815c"
607
614
 
608
615
  [[package]]
609
616
  name = "rustc-hash"
@@ -625,18 +632,18 @@ checksum = "a3f0bf26fd526d2a95683cd0f87bf103b8539e2ca1ef48ce002d67aad59aa0b4"
625
632
 
626
633
  [[package]]
627
634
  name = "serde"
628
- version = "1.0.209"
635
+ version = "1.0.217"
629
636
  source = "registry+https://github.com/rust-lang/crates.io-index"
630
- checksum = "99fce0ffe7310761ca6bf9faf5115afbc19688edd00171d81b1bb1b116c63e09"
637
+ checksum = "02fc4265df13d6fa1d00ecff087228cc0a2b5f3c0e87e258d8b94a156e984c70"
631
638
  dependencies = [
632
639
  "serde_derive",
633
640
  ]
634
641
 
635
642
  [[package]]
636
643
  name = "serde_derive"
637
- version = "1.0.209"
644
+ version = "1.0.217"
638
645
  source = "registry+https://github.com/rust-lang/crates.io-index"
639
- checksum = "a5831b979fd7b5439637af1752d535ff49f4860c0f341d1baeb6faf0f4242170"
646
+ checksum = "5a9bf7cf98d04a2b28aead066b7496853d4779c9cc183c440dbac457641e19a0"
640
647
  dependencies = [
641
648
  "proc-macro2",
642
649
  "quote",
@@ -645,9 +652,9 @@ dependencies = [
645
652
 
646
653
  [[package]]
647
654
  name = "serde_json"
648
- version = "1.0.127"
655
+ version = "1.0.134"
649
656
  source = "registry+https://github.com/rust-lang/crates.io-index"
650
- checksum = "8043c06d9f82bd7271361ed64f415fe5e12a77fdb52e573e7f06a516dea329ad"
657
+ checksum = "d00f4175c42ee48b15416f6193a959ba3a0d67fc699a0db9ad12df9f83991c7d"
651
658
  dependencies = [
652
659
  "itoa",
653
660
  "memchr",
@@ -693,9 +700,9 @@ checksum = "7da8b5736845d9f2fcb837ea5d9e2628564b3b043a70948a3f0b778838c5fb4f"
693
700
 
694
701
  [[package]]
695
702
  name = "syn"
696
- version = "2.0.76"
703
+ version = "2.0.93"
697
704
  source = "registry+https://github.com/rust-lang/crates.io-index"
698
- checksum = "578e081a14e0cefc3279b0472138c513f37b41a08d5a3cca9b6e4e8ceb6cd525"
705
+ checksum = "9c786062daee0d6db1132800e623df74274a0a87322d8e183338e01b3d98d058"
699
706
  dependencies = [
700
707
  "proc-macro2",
701
708
  "quote",
@@ -704,18 +711,18 @@ dependencies = [
704
711
 
705
712
  [[package]]
706
713
  name = "thiserror"
707
- version = "1.0.63"
714
+ version = "1.0.69"
708
715
  source = "registry+https://github.com/rust-lang/crates.io-index"
709
- checksum = "c0342370b38b6a11b6cc11d6a805569958d54cfa061a29969c3b5ce2ea405724"
716
+ checksum = "b6aaf5339b578ea85b50e080feb250a3e8ae8cfcdff9a461c9ec2904bc923f52"
710
717
  dependencies = [
711
718
  "thiserror-impl",
712
719
  ]
713
720
 
714
721
  [[package]]
715
722
  name = "thiserror-impl"
716
- version = "1.0.63"
723
+ version = "1.0.69"
717
724
  source = "registry+https://github.com/rust-lang/crates.io-index"
718
- checksum = "a4558b58466b9ad7ca0f102865eccc95938dca1a74a856f2b57b6629050da261"
725
+ checksum = "4fee6c4efc90059e10f81e6d42c60a18f76588c3d74cb83a0b242a2b6c7504c1"
719
726
  dependencies = [
720
727
  "proc-macro2",
721
728
  "quote",
@@ -724,19 +731,19 @@ dependencies = [
724
731
 
725
732
  [[package]]
726
733
  name = "tokenizers"
727
- version = "0.5.3"
734
+ version = "0.5.4"
728
735
  dependencies = [
729
736
  "magnus",
730
737
  "onig",
731
738
  "serde",
732
- "tokenizers 0.20.0",
739
+ "tokenizers 0.21.0",
733
740
  ]
734
741
 
735
742
  [[package]]
736
743
  name = "tokenizers"
737
- version = "0.20.0"
744
+ version = "0.21.0"
738
745
  source = "registry+https://github.com/rust-lang/crates.io-index"
739
- checksum = "c8a24d7f7d6be5b9d1377418b893ab1808af0074f5d1bb2c64784452ddd2aa70"
746
+ checksum = "9ecededfed68a69bc657e486510089e255e53c3d38cc7d4d59c8742668ca2cae"
740
747
  dependencies = [
741
748
  "aho-corasick",
742
749
  "derive_builder",
@@ -766,9 +773,9 @@ dependencies = [
766
773
 
767
774
  [[package]]
768
775
  name = "unicode-ident"
769
- version = "1.0.12"
776
+ version = "1.0.14"
770
777
  source = "registry+https://github.com/rust-lang/crates.io-index"
771
- checksum = "3354b9ac3fae1ff6755cb6db53683adb661634f67557942dea4facebec0fee4b"
778
+ checksum = "adb9e6ca4f869e1180728b7950e35922a7fc6397f7b641499e8f3ef06e50dc83"
772
779
 
773
780
  [[package]]
774
781
  name = "unicode-normalization-alignments"
@@ -781,15 +788,15 @@ dependencies = [
781
788
 
782
789
  [[package]]
783
790
  name = "unicode-segmentation"
784
- version = "1.11.0"
791
+ version = "1.12.0"
785
792
  source = "registry+https://github.com/rust-lang/crates.io-index"
786
- checksum = "d4c87d22b6e3f4a18d4d40ef354e97c90fcb14dd91d7dc0aa9d8a1172ebf7202"
793
+ checksum = "f6ccf251212114b54433ec949fd6a7841275f9ada20dddd2f29e9ceea4501493"
787
794
 
788
795
  [[package]]
789
796
  name = "unicode-width"
790
- version = "0.1.13"
797
+ version = "0.2.0"
791
798
  source = "registry+https://github.com/rust-lang/crates.io-index"
792
- checksum = "0336d538f7abc86d282a4189614dfaa90810dfc2c6f6427eaf88e16311dd225d"
799
+ checksum = "1fc81956842c57dac11422a97c3b8195a1ff727f06e85c84ed2e8aa277c9a0fd"
793
800
 
794
801
  [[package]]
795
802
  name = "unicode_categories"
@@ -803,11 +810,75 @@ version = "0.11.0+wasi-snapshot-preview1"
803
810
  source = "registry+https://github.com/rust-lang/crates.io-index"
804
811
  checksum = "9c8d87e72b64a3b4db28d11ce29237c246188f4f51057d65a7eab63b7987e423"
805
812
 
813
+ [[package]]
814
+ name = "wasm-bindgen"
815
+ version = "0.2.99"
816
+ source = "registry+https://github.com/rust-lang/crates.io-index"
817
+ checksum = "a474f6281d1d70c17ae7aa6a613c87fce69a127e2624002df63dcb39d6cf6396"
818
+ dependencies = [
819
+ "cfg-if",
820
+ "once_cell",
821
+ "wasm-bindgen-macro",
822
+ ]
823
+
824
+ [[package]]
825
+ name = "wasm-bindgen-backend"
826
+ version = "0.2.99"
827
+ source = "registry+https://github.com/rust-lang/crates.io-index"
828
+ checksum = "5f89bb38646b4f81674e8f5c3fb81b562be1fd936d84320f3264486418519c79"
829
+ dependencies = [
830
+ "bumpalo",
831
+ "log",
832
+ "proc-macro2",
833
+ "quote",
834
+ "syn",
835
+ "wasm-bindgen-shared",
836
+ ]
837
+
838
+ [[package]]
839
+ name = "wasm-bindgen-macro"
840
+ version = "0.2.99"
841
+ source = "registry+https://github.com/rust-lang/crates.io-index"
842
+ checksum = "2cc6181fd9a7492eef6fef1f33961e3695e4579b9872a6f7c83aee556666d4fe"
843
+ dependencies = [
844
+ "quote",
845
+ "wasm-bindgen-macro-support",
846
+ ]
847
+
848
+ [[package]]
849
+ name = "wasm-bindgen-macro-support"
850
+ version = "0.2.99"
851
+ source = "registry+https://github.com/rust-lang/crates.io-index"
852
+ checksum = "30d7a95b763d3c45903ed6c81f156801839e5ee968bb07e534c44df0fcd330c2"
853
+ dependencies = [
854
+ "proc-macro2",
855
+ "quote",
856
+ "syn",
857
+ "wasm-bindgen-backend",
858
+ "wasm-bindgen-shared",
859
+ ]
860
+
861
+ [[package]]
862
+ name = "wasm-bindgen-shared"
863
+ version = "0.2.99"
864
+ source = "registry+https://github.com/rust-lang/crates.io-index"
865
+ checksum = "943aab3fdaaa029a6e0271b35ea10b72b943135afe9bffca82384098ad0e06a6"
866
+
867
+ [[package]]
868
+ name = "web-time"
869
+ version = "1.1.0"
870
+ source = "registry+https://github.com/rust-lang/crates.io-index"
871
+ checksum = "5a6580f308b1fad9207618087a65c04e7a10bc77e02c8e84e9b00dd4b12fa0bb"
872
+ dependencies = [
873
+ "js-sys",
874
+ "wasm-bindgen",
875
+ ]
876
+
806
877
  [[package]]
807
878
  name = "windows-sys"
808
- version = "0.52.0"
879
+ version = "0.59.0"
809
880
  source = "registry+https://github.com/rust-lang/crates.io-index"
810
- checksum = "282be5f36a8ce781fad8c8ae18fa3f9beff57ec1b52cb3de0789201425d9a33d"
881
+ checksum = "1e38bc4d79ed67fd075bcc251a1c39b32a1776bbe92e5bef1f0bf1f8c531853b"
811
882
  dependencies = [
812
883
  "windows-targets",
813
884
  ]
@@ -10,7 +10,7 @@ base64 v0.13.1
10
10
  https://github.com/marshallpierce/rust-base64
11
11
  MIT/Apache-2.0
12
12
 
13
- bindgen v0.69.4
13
+ bindgen v0.69.5
14
14
  https://rust-lang.github.io/rust-bindgen/
15
15
  BSD-3-Clause
16
16
 
@@ -26,7 +26,7 @@ byteorder v1.5.0
26
26
  https://github.com/BurntSushi/byteorder
27
27
  Unlicense OR MIT
28
28
 
29
- cc v1.1.15
29
+ cc v1.2.6
30
30
  https://github.com/rust-lang/cc-rs
31
31
  MIT OR Apache-2.0
32
32
 
@@ -42,11 +42,11 @@ clang-sys v1.8.1
42
42
  https://github.com/KyleMayes/clang-sys
43
43
  Apache-2.0
44
44
 
45
- console v0.15.8
45
+ console v0.15.10
46
46
  https://github.com/console-rs/console
47
47
  MIT
48
48
 
49
- crossbeam-deque v0.8.5
49
+ crossbeam-deque v0.8.6
50
50
  https://github.com/crossbeam-rs/crossbeam/tree/master/crossbeam-deque
51
51
  MIT OR Apache-2.0
52
52
 
@@ -54,7 +54,7 @@ crossbeam-epoch v0.9.18
54
54
  https://github.com/crossbeam-rs/crossbeam/tree/master/crossbeam-epoch
55
55
  MIT OR Apache-2.0
56
56
 
57
- crossbeam-utils v0.8.20
57
+ crossbeam-utils v0.8.21
58
58
  https://github.com/crossbeam-rs/crossbeam/tree/master/crossbeam-utils
59
59
  MIT OR Apache-2.0
60
60
 
@@ -70,15 +70,15 @@ darling_macro v0.20.10
70
70
  https://github.com/TedDriggs/darling
71
71
  MIT
72
72
 
73
- derive_builder v0.20.0
73
+ derive_builder v0.20.2
74
74
  https://github.com/colin-kiegel/rust-derive-builder
75
75
  MIT OR Apache-2.0
76
76
 
77
- derive_builder_core v0.20.0
77
+ derive_builder_core v0.20.2
78
78
  https://github.com/colin-kiegel/rust-derive-builder
79
79
  MIT OR Apache-2.0
80
80
 
81
- derive_builder_macro v0.20.0
81
+ derive_builder_macro v0.20.2
82
82
  https://github.com/colin-kiegel/rust-derive-builder
83
83
  MIT OR Apache-2.0
84
84
 
@@ -86,9 +86,9 @@ either v1.13.0
86
86
  https://github.com/rayon-rs/either
87
87
  MIT OR Apache-2.0
88
88
 
89
- encode_unicode v0.3.6
89
+ encode_unicode v1.0.0
90
90
  https://github.com/tormol/encode_unicode
91
- MIT/Apache-2.0
91
+ Apache-2.0 OR MIT
92
92
 
93
93
  esaxx-rs v0.1.10
94
94
  https://github.com/Narsil/esaxx-rs
@@ -102,7 +102,7 @@ getrandom v0.2.15
102
102
  https://github.com/rust-random/getrandom
103
103
  MIT OR Apache-2.0
104
104
 
105
- glob v0.3.1
105
+ glob v0.3.2
106
106
  https://github.com/rust-lang/glob
107
107
  MIT OR Apache-2.0
108
108
 
@@ -110,7 +110,7 @@ ident_case v1.0.1
110
110
  https://github.com/TedDriggs/ident_case
111
111
  MIT/Apache-2.0
112
112
 
113
- indicatif v0.17.8
113
+ indicatif v0.17.9
114
114
  https://github.com/console-rs/indicatif
115
115
  MIT
116
116
 
@@ -122,7 +122,7 @@ itertools v0.12.1
122
122
  https://github.com/rust-itertools/itertools
123
123
  MIT OR Apache-2.0
124
124
 
125
- itoa v1.0.11
125
+ itoa v1.0.14
126
126
  https://github.com/dtolnay/itoa
127
127
  MIT OR Apache-2.0
128
128
 
@@ -134,11 +134,11 @@ lazycell v1.3.0
134
134
  https://github.com/indiv0/lazycell
135
135
  MIT/Apache-2.0
136
136
 
137
- libc v0.2.158
137
+ libc v0.2.169
138
138
  https://github.com/rust-lang/libc
139
139
  MIT OR Apache-2.0
140
140
 
141
- libloading v0.8.5
141
+ libloading v0.8.6
142
142
  https://github.com/nagisa/rust_libloading/
143
143
  ISC
144
144
 
@@ -186,7 +186,7 @@ number_prefix v0.4.0
186
186
  https://github.com/ogham/rust-number-prefix
187
187
  MIT
188
188
 
189
- once_cell v1.19.0
189
+ once_cell v1.20.2
190
190
  https://github.com/matklad/once_cell
191
191
  MIT OR Apache-2.0
192
192
 
@@ -202,11 +202,11 @@ paste v1.0.15
202
202
  https://github.com/dtolnay/paste
203
203
  MIT OR Apache-2.0
204
204
 
205
- pkg-config v0.3.30
205
+ pkg-config v0.3.31
206
206
  https://github.com/rust-lang/pkg-config-rs
207
207
  MIT OR Apache-2.0
208
208
 
209
- portable-atomic v1.7.0
209
+ portable-atomic v1.10.0
210
210
  https://github.com/taiki-e/portable-atomic
211
211
  Apache-2.0 OR MIT
212
212
 
@@ -214,11 +214,11 @@ ppv-lite86 v0.2.20
214
214
  https://github.com/cryptocorrosion/cryptocorrosion
215
215
  MIT/Apache-2.0
216
216
 
217
- proc-macro2 v1.0.86
217
+ proc-macro2 v1.0.92
218
218
  https://github.com/dtolnay/proc-macro2
219
219
  MIT OR Apache-2.0
220
220
 
221
- quote v1.0.37
221
+ quote v1.0.38
222
222
  https://github.com/dtolnay/quote
223
223
  MIT OR Apache-2.0
224
224
 
@@ -246,11 +246,11 @@ rayon-core v1.12.1
246
246
  https://github.com/rayon-rs/rayon
247
247
  MIT OR Apache-2.0
248
248
 
249
- rb-sys v0.9.102
249
+ rb-sys v0.9.105
250
250
  https://github.com/oxidize-rb/rb-sys
251
251
  MIT OR Apache-2.0
252
252
 
253
- rb-sys-build v0.9.102
253
+ rb-sys-build v0.9.105
254
254
  https://github.com/oxidize-rb/rb-sys
255
255
  MIT OR Apache-2.0
256
256
 
@@ -258,15 +258,15 @@ rb-sys-env v0.1.2
258
258
  https://github.com/oxidize-rb/rb-sys
259
259
  MIT OR Apache-2.0
260
260
 
261
- regex v1.10.6
261
+ regex v1.11.1
262
262
  https://github.com/rust-lang/regex
263
263
  MIT OR Apache-2.0
264
264
 
265
- regex-automata v0.4.7
265
+ regex-automata v0.4.9
266
266
  https://github.com/rust-lang/regex/tree/master/regex-automata
267
267
  MIT OR Apache-2.0
268
268
 
269
- regex-syntax v0.8.4
269
+ regex-syntax v0.8.5
270
270
  https://github.com/rust-lang/regex/tree/master/regex-syntax
271
271
  MIT OR Apache-2.0
272
272
 
@@ -282,15 +282,15 @@ seq-macro v0.3.5
282
282
  https://github.com/dtolnay/seq-macro
283
283
  MIT OR Apache-2.0
284
284
 
285
- serde v1.0.209
285
+ serde v1.0.217
286
286
  https://serde.rs
287
287
  MIT OR Apache-2.0
288
288
 
289
- serde_derive v1.0.209
289
+ serde_derive v1.0.217
290
290
  https://serde.rs
291
291
  MIT OR Apache-2.0
292
292
 
293
- serde_json v1.0.127
293
+ serde_json v1.0.134
294
294
  https://github.com/serde-rs/json
295
295
  MIT OR Apache-2.0
296
296
 
@@ -314,35 +314,35 @@ strsim v0.11.1
314
314
  https://github.com/rapidfuzz/strsim-rs
315
315
  MIT
316
316
 
317
- syn v2.0.76
317
+ syn v2.0.93
318
318
  https://github.com/dtolnay/syn
319
319
  MIT OR Apache-2.0
320
320
 
321
- thiserror v1.0.63
321
+ thiserror v1.0.69
322
322
  https://github.com/dtolnay/thiserror
323
323
  MIT OR Apache-2.0
324
324
 
325
- thiserror-impl v1.0.63
325
+ thiserror-impl v1.0.69
326
326
  https://github.com/dtolnay/thiserror
327
327
  MIT OR Apache-2.0
328
328
 
329
- tokenizers v0.20.0
329
+ tokenizers v0.21.0
330
330
  https://github.com/huggingface/tokenizers
331
331
  Apache-2.0
332
332
 
333
- unicode-ident v1.0.12
333
+ unicode-ident v1.0.14
334
334
  https://github.com/dtolnay/unicode-ident
335
- (MIT OR Apache-2.0) AND Unicode-DFS-2016
335
+ (MIT OR Apache-2.0) AND Unicode-3.0
336
336
 
337
337
  unicode-normalization-alignments v0.1.12
338
338
  https://github.com/n1t0/unicode-normalization
339
339
  MIT/Apache-2.0
340
340
 
341
- unicode-segmentation v1.11.0
341
+ unicode-segmentation v1.12.0
342
342
  https://github.com/unicode-rs/unicode-segmentation
343
- MIT/Apache-2.0
343
+ MIT OR Apache-2.0
344
344
 
345
- unicode-width v0.1.13
345
+ unicode-width v0.2.0
346
346
  https://github.com/unicode-rs/unicode-width
347
347
  MIT OR Apache-2.0
348
348
 
@@ -350,7 +350,7 @@ unicode_categories v0.1.1
350
350
  https://github.com/swgillespie/unicode-categories
351
351
  MIT OR Apache-2.0
352
352
 
353
- windows-sys v0.52.0
353
+ windows-sys v0.59.0
354
354
  https://github.com/microsoft/windows-rs
355
355
  MIT OR Apache-2.0
356
356
 
@@ -15619,52 +15619,45 @@ DEALINGS IN THE SOFTWARE.
15619
15619
  unicode-ident LICENSE-UNICODE
15620
15620
  ================================================================================
15621
15621
 
15622
- UNICODE, INC. LICENSE AGREEMENT - DATA FILES AND SOFTWARE
15623
-
15624
- See Terms of Use <https://www.unicode.org/copyright.html>
15625
- for definitions of Unicode Inc.’s Data Files and Software.
15626
-
15627
- NOTICE TO USER: Carefully read the following legal agreement.
15628
- BY DOWNLOADING, INSTALLING, COPYING OR OTHERWISE USING UNICODE INC.'S
15629
- DATA FILES ("DATA FILES"), AND/OR SOFTWARE ("SOFTWARE"),
15630
- YOU UNEQUIVOCALLY ACCEPT, AND AGREE TO BE BOUND BY, ALL OF THE
15631
- TERMS AND CONDITIONS OF THIS AGREEMENT.
15632
- IF YOU DO NOT AGREE, DO NOT DOWNLOAD, INSTALL, COPY, DISTRIBUTE OR USE
15633
- THE DATA FILES OR SOFTWARE.
15622
+ UNICODE LICENSE V3
15634
15623
 
15635
15624
  COPYRIGHT AND PERMISSION NOTICE
15636
15625
 
15637
- Copyright © 1991-2022 Unicode, Inc. All rights reserved.
15638
- Distributed under the Terms of Use in https://www.unicode.org/copyright.html.
15639
-
15640
- Permission is hereby granted, free of charge, to any person obtaining
15641
- a copy of the Unicode data files and any associated documentation
15642
- (the "Data Files") or Unicode software and any associated documentation
15643
- (the "Software") to deal in the Data Files or Software
15644
- without restriction, including without limitation the rights to use,
15645
- copy, modify, merge, publish, distribute, and/or sell copies of
15646
- the Data Files or Software, and to permit persons to whom the Data Files
15647
- or Software are furnished to do so, provided that either
15648
- (a) this copyright and permission notice appear with all copies
15649
- of the Data Files or Software, or
15650
- (b) this copyright and permission notice appear in associated
15651
- Documentation.
15652
-
15653
- THE DATA FILES AND SOFTWARE ARE PROVIDED "AS IS", WITHOUT WARRANTY OF
15654
- ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE
15655
- WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
15656
- NONINFRINGEMENT OF THIRD PARTY RIGHTS.
15657
- IN NO EVENT SHALL THE COPYRIGHT HOLDER OR HOLDERS INCLUDED IN THIS
15658
- NOTICE BE LIABLE FOR ANY CLAIM, OR ANY SPECIAL INDIRECT OR CONSEQUENTIAL
15659
- DAMAGES, OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE,
15660
- DATA OR PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER
15661
- TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR
15662
- PERFORMANCE OF THE DATA FILES OR SOFTWARE.
15663
-
15664
- Except as contained in this notice, the name of a copyright holder
15665
- shall not be used in advertising or otherwise to promote the sale,
15666
- use or other dealings in these Data Files or Software without prior
15667
- written authorization of the copyright holder.
15626
+ Copyright © 1991-2023 Unicode, Inc.
15627
+
15628
+ NOTICE TO USER: Carefully read the following legal agreement. BY
15629
+ DOWNLOADING, INSTALLING, COPYING OR OTHERWISE USING DATA FILES, AND/OR
15630
+ SOFTWARE, YOU UNEQUIVOCALLY ACCEPT, AND AGREE TO BE BOUND BY, ALL OF THE
15631
+ TERMS AND CONDITIONS OF THIS AGREEMENT. IF YOU DO NOT AGREE, DO NOT
15632
+ DOWNLOAD, INSTALL, COPY, DISTRIBUTE OR USE THE DATA FILES OR SOFTWARE.
15633
+
15634
+ Permission is hereby granted, free of charge, to any person obtaining a
15635
+ copy of data files and any associated documentation (the "Data Files") or
15636
+ software and any associated documentation (the "Software") to deal in the
15637
+ Data Files or Software without restriction, including without limitation
15638
+ the rights to use, copy, modify, merge, publish, distribute, and/or sell
15639
+ copies of the Data Files or Software, and to permit persons to whom the
15640
+ Data Files or Software are furnished to do so, provided that either (a)
15641
+ this copyright and permission notice appear with all copies of the Data
15642
+ Files or Software, or (b) this copyright and permission notice appear in
15643
+ associated Documentation.
15644
+
15645
+ THE DATA FILES AND SOFTWARE ARE PROVIDED "AS IS", WITHOUT WARRANTY OF ANY
15646
+ KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
15647
+ MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT OF
15648
+ THIRD PARTY RIGHTS.
15649
+
15650
+ IN NO EVENT SHALL THE COPYRIGHT HOLDER OR HOLDERS INCLUDED IN THIS NOTICE
15651
+ BE LIABLE FOR ANY CLAIM, OR ANY SPECIAL INDIRECT OR CONSEQUENTIAL DAMAGES,
15652
+ OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS,
15653
+ WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION,
15654
+ ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THE DATA
15655
+ FILES OR SOFTWARE.
15656
+
15657
+ Except as contained in this notice, the name of a copyright holder shall
15658
+ not be used in advertising or otherwise to promote the sale, use or other
15659
+ dealings in these Data Files or Software without prior written
15660
+ authorization of the copyright holder.
15668
15661
 
15669
15662
  ================================================================================
15670
15663
  unicode-normalization-alignments LICENSE-APACHE
Binary file
Binary file
Binary file
Binary file
@@ -1,7 +1,7 @@
1
1
  module Tokenizers
2
2
  module FromPretrained
3
3
  # for user agent
4
- TOKENIZERS_VERSION = "0.20.0"
4
+ TOKENIZERS_VERSION = "0.21.0"
5
5
 
6
6
  # use Ruby for downloads
7
7
  # this avoids the need to vendor OpenSSL on Linux
@@ -1,3 +1,3 @@
1
1
  module Tokenizers
2
- VERSION = "0.5.3"
2
+ VERSION = "0.5.4"
3
3
  end
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: tokenizers
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.5.3
4
+ version: 0.5.4
5
5
  platform: x64-mingw-ucrt
6
6
  authors:
7
7
  - Andrew Kane
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2024-09-17 00:00:00.000000000 Z
11
+ date: 2024-12-29 00:00:00.000000000 Z
12
12
  dependencies: []
13
13
  description:
14
14
  email: andrew@ankane.org
@@ -26,6 +26,7 @@ files:
26
26
  - lib/tokenizers/3.1/tokenizers.so
27
27
  - lib/tokenizers/3.2/tokenizers.so
28
28
  - lib/tokenizers/3.3/tokenizers.so
29
+ - lib/tokenizers/3.4/tokenizers.so
29
30
  - lib/tokenizers/added_token.rb
30
31
  - lib/tokenizers/char_bpe_tokenizer.rb
31
32
  - lib/tokenizers/decoders/bpe_decoder.rb
@@ -71,14 +72,14 @@ required_ruby_version: !ruby/object:Gem::Requirement
71
72
  version: '3.1'
72
73
  - - "<"
73
74
  - !ruby/object:Gem::Version
74
- version: 3.4.dev
75
+ version: 3.5.dev
75
76
  required_rubygems_version: !ruby/object:Gem::Requirement
76
77
  requirements:
77
78
  - - ">="
78
79
  - !ruby/object:Gem::Version
79
80
  version: '0'
80
81
  requirements: []
81
- rubygems_version: 3.4.4
82
+ rubygems_version: 3.5.23
82
83
  signing_key:
83
84
  specification_version: 4
84
85
  summary: Fast state-of-the-art tokenizers for Ruby