tokenizers 0.3.1-arm64-darwin → 0.3.2-arm64-darwin
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/CHANGELOG.md +9 -5
- data/Cargo.lock +12 -7
- data/LICENSE-THIRD-PARTY.txt +3 -29
- data/lib/tokenizers/2.7/tokenizers.bundle +0 -0
- data/lib/tokenizers/3.0/tokenizers.bundle +0 -0
- data/lib/tokenizers/3.1/tokenizers.bundle +0 -0
- data/lib/tokenizers/3.2/tokenizers.bundle +0 -0
- data/lib/tokenizers/version.rb +1 -1
- metadata +2 -2
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: ba8379e40522e811dfd2d2082a241e4c8bb71f0d42fe0219175d65318b5d0f64
|
4
|
+
data.tar.gz: 9f731c1aa940e44828276cc765adec19a1d3bad6bea84260992b491cc892bce5
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 322363a3f931652734fcca0a39a363fd7c1538096bc70ed6a3dde80bb88f5690f412ea82bf193b148ae95369c88cc25ecaeba9f2911ad859d93e2e2219a260ff
|
7
|
+
data.tar.gz: 49061d4df62725e1224024921c2c8bb1ca9e18c60efb630c9345c25d7811508280add5223dabedbd9c1870555189c6650efb137627e31383535a54dffe12d9b1
|
data/CHANGELOG.md
CHANGED
@@ -1,8 +1,12 @@
|
|
1
|
-
## 0.3.
|
1
|
+
## 0.3.2 (2023-03-06)
|
2
|
+
|
3
|
+
- Added precompiled gem for Linux x86-64 MUSL
|
4
|
+
|
5
|
+
## 0.3.1 (2023-02-08)
|
2
6
|
|
3
7
|
- Fixed error with Ruby 2.7
|
4
8
|
|
5
|
-
## 0.3.0 (
|
9
|
+
## 0.3.0 (2023-02-07)
|
6
10
|
|
7
11
|
- Added support for training tokenizers
|
8
12
|
- Added more methods to `Tokenizer`
|
@@ -11,20 +15,20 @@
|
|
11
15
|
- Changed `encode` method to include special tokens by default
|
12
16
|
- Changed how offsets are calculated for strings with multibyte characters
|
13
17
|
|
14
|
-
## 0.2.3 (
|
18
|
+
## 0.2.3 (2023-01-22)
|
15
19
|
|
16
20
|
- Added `add_special_tokens` option to `encode` method
|
17
21
|
- Added warning about `encode` method including special tokens by default in 0.3.0
|
18
22
|
- Added more methods to `Encoding`
|
19
23
|
- Fixed error with precompiled gem on Mac ARM
|
20
24
|
|
21
|
-
## 0.2.2 (
|
25
|
+
## 0.2.2 (2023-01-15)
|
22
26
|
|
23
27
|
- Added precompiled gem for Linux ARM
|
24
28
|
- Added `from_file` method
|
25
29
|
- Fixed error with precompiled gem on Linux x86-64
|
26
30
|
|
27
|
-
## 0.2.1 (
|
31
|
+
## 0.2.1 (2023-01-12)
|
28
32
|
|
29
33
|
- Added support for Ruby 3.2
|
30
34
|
|
data/Cargo.lock
CHANGED
@@ -353,7 +353,8 @@ checksum = "58093314a45e00c77d5c508f76e77c3396afbbc0d01506e7fae47b018bac2b1d"
|
|
353
353
|
[[package]]
|
354
354
|
name = "magnus"
|
355
355
|
version = "0.5.0"
|
356
|
-
source = "
|
356
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
357
|
+
checksum = "af37419a942477f606d227d0e6e92f3b68458bfc68fec3bc2629df6a2c1ccdf9"
|
357
358
|
dependencies = [
|
358
359
|
"magnus-macros",
|
359
360
|
"rb-sys",
|
@@ -362,8 +363,9 @@ dependencies = [
|
|
362
363
|
|
363
364
|
[[package]]
|
364
365
|
name = "magnus-macros"
|
365
|
-
version = "0.
|
366
|
-
source = "
|
366
|
+
version = "0.4.0"
|
367
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
368
|
+
checksum = "85aa71c9891b2732ff1157e1860a1ee578459fd25811fd3d72cc6e32b3fbdfea"
|
367
369
|
dependencies = [
|
368
370
|
"proc-macro2",
|
369
371
|
"quote",
|
@@ -552,22 +554,25 @@ dependencies = [
|
|
552
554
|
|
553
555
|
[[package]]
|
554
556
|
name = "rb-sys"
|
555
|
-
version = "0.9.
|
557
|
+
version = "0.9.65"
|
556
558
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
557
|
-
checksum = "
|
559
|
+
checksum = "e8fe617bad8e88fd7e5d6f432e35f09e5f94144dfb8e8ee4adde82fb920dc59b"
|
558
560
|
dependencies = [
|
559
561
|
"rb-sys-build",
|
560
562
|
]
|
561
563
|
|
562
564
|
[[package]]
|
563
565
|
name = "rb-sys-build"
|
564
|
-
version = "0.9.
|
566
|
+
version = "0.9.65"
|
565
567
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
566
|
-
checksum = "
|
568
|
+
checksum = "007e63597f91c711cbb299e60fecbdb6f5ad4a066d6a20c81943893f1584c895"
|
567
569
|
dependencies = [
|
568
570
|
"bindgen",
|
571
|
+
"lazy_static",
|
572
|
+
"quote",
|
569
573
|
"regex",
|
570
574
|
"shell-words",
|
575
|
+
"syn",
|
571
576
|
]
|
572
577
|
|
573
578
|
[[package]]
|
data/LICENSE-THIRD-PARTY.txt
CHANGED
@@ -154,7 +154,7 @@ magnus v0.5.0
|
|
154
154
|
https://github.com/matsadler/magnus
|
155
155
|
MIT
|
156
156
|
|
157
|
-
magnus-macros v0.
|
157
|
+
magnus-macros v0.4.0
|
158
158
|
https://github.com/matsadler/magnus
|
159
159
|
MIT
|
160
160
|
|
@@ -242,11 +242,11 @@ rayon-core v1.10.2
|
|
242
242
|
https://github.com/rayon-rs/rayon
|
243
243
|
MIT OR Apache-2.0
|
244
244
|
|
245
|
-
rb-sys v0.9.
|
245
|
+
rb-sys v0.9.65
|
246
246
|
https://github.com/oxidize-rb/rb-sys
|
247
247
|
MIT OR Apache-2.0
|
248
248
|
|
249
|
-
rb-sys-build v0.9.
|
249
|
+
rb-sys-build v0.9.65
|
250
250
|
https://github.com/oxidize-rb/rb-sys
|
251
251
|
MIT OR Apache-2.0
|
252
252
|
|
@@ -7795,32 +7795,6 @@ LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
7795
7795
|
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
7796
7796
|
SOFTWARE.
|
7797
7797
|
|
7798
|
-
================================================================================
|
7799
|
-
magnus magnus-macros/LICENSE
|
7800
|
-
================================================================================
|
7801
|
-
|
7802
|
-
MIT License
|
7803
|
-
|
7804
|
-
Copyright (c) 2022, 2021 Matthew Sadler
|
7805
|
-
|
7806
|
-
Permission is hereby granted, free of charge, to any person obtaining a copy
|
7807
|
-
of this software and associated documentation files (the "Software"), to deal
|
7808
|
-
in the Software without restriction, including without limitation the rights
|
7809
|
-
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
7810
|
-
copies of the Software, and to permit persons to whom the Software is
|
7811
|
-
furnished to do so, subject to the following conditions:
|
7812
|
-
|
7813
|
-
The above copyright notice and this permission notice shall be included in all
|
7814
|
-
copies or substantial portions of the Software.
|
7815
|
-
|
7816
|
-
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
7817
|
-
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
7818
|
-
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
7819
|
-
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
7820
|
-
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
7821
|
-
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
7822
|
-
SOFTWARE.
|
7823
|
-
|
7824
7798
|
================================================================================
|
7825
7799
|
magnus-macros LICENSE
|
7826
7800
|
================================================================================
|
Binary file
|
Binary file
|
Binary file
|
Binary file
|
data/lib/tokenizers/version.rb
CHANGED
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: tokenizers
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.3.1
|
4
|
+
version: 0.3.2
|
5
5
|
platform: arm64-darwin
|
6
6
|
authors:
|
7
7
|
- Andrew Kane
|
8
8
|
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date: 2023-
|
11
|
+
date: 2023-03-07 00:00:00.000000000 Z
|
12
12
|
dependencies: []
|
13
13
|
description:
|
14
14
|
email: andrew@ankane.org
|