tokenizers 0.5.2-aarch64-linux → 0.5.3-aarch64-linux

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: 3b8639c894fdb33fdb9741593827cc8c4f00df954be28c56f954b202f082b7fd
4
- data.tar.gz: 86bf064a1a6b29a75d6b8d400a8bb7a8de1178bc291f62a3c7d52f11a3412127
3
+ metadata.gz: 47d332c64421a4b5fe51e275f516a0c90fa813c7a886508c0139bc5a7701b51e
4
+ data.tar.gz: a61c6afd92fbb39e5d2322881ae286283fcc6d0ddb937c3e9fe5d72852ce89d7
5
5
  SHA512:
6
- metadata.gz: bafc8c988420672150b4584378da5f4ebdac3ac9698dd9bc6d53e798a0c064e54aacc7d235c278f73c00e51e3d5d35d5e08232cb92db9f4e9fc50967df4fb075
7
- data.tar.gz: 4afb2e39c3c6d8add55b58af240d1ff1473788cab7530c0b16dd826561520784da15bd5553313cf07574171362c41681880a622bc1910280045a2d28ec2abee4
6
+ metadata.gz: f22f69721315fddd021b683904ef9176b6eea7597641328663db38045184bc6fff7b681e1fb6e4c641a103c42a7fe0d1d74dad30437aab376be7f72633a1e3d8
7
+ data.tar.gz: 1f2693463436f58f6865160e96a9983725bf7998fc1f99d3853d1bb86012e97bb753faf9671546e8753193e721054a4fe8d186e8839cfe70801090ce6dfc83ff
data/CHANGELOG.md CHANGED
@@ -1,3 +1,8 @@
1
+ ## 0.5.3 (2024-09-17)
2
+
3
+ - Added `AddedToken` class
4
+ - Added precompiled gem for Windows
5
+
1
6
  ## 0.5.2 (2024-08-26)
2
7
 
3
8
  - Added `from_str` method to `Tokenizer`
data/Cargo.lock CHANGED
@@ -724,7 +724,7 @@ dependencies = [
724
724
 
725
725
  [[package]]
726
726
  name = "tokenizers"
727
- version = "0.5.2"
727
+ version = "0.5.3"
728
728
  dependencies = [
729
729
  "magnus",
730
730
  "onig",
Binary file
Binary file
Binary file
@@ -0,0 +1,7 @@
1
+ module Tokenizers
2
+ class AddedToken
3
+ def self.new(content, **kwargs)
4
+ _new(content, kwargs)
5
+ end
6
+ end
7
+ end
@@ -1,3 +1,3 @@
1
1
  module Tokenizers
2
- VERSION = "0.5.2"
2
+ VERSION = "0.5.3"
3
3
  end
data/lib/tokenizers.rb CHANGED
@@ -42,6 +42,7 @@ require_relative "tokenizers/trainers/word_level_trainer"
42
42
  require_relative "tokenizers/trainers/word_piece_trainer"
43
43
 
44
44
  # other
45
+ require_relative "tokenizers/added_token"
45
46
  require_relative "tokenizers/char_bpe_tokenizer"
46
47
  require_relative "tokenizers/encoding"
47
48
  require_relative "tokenizers/from_pretrained"
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: tokenizers
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.5.2
4
+ version: 0.5.3
5
5
  platform: aarch64-linux
6
6
  authors:
7
7
  - Andrew Kane
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2024-08-26 00:00:00.000000000 Z
11
+ date: 2024-09-17 00:00:00.000000000 Z
12
12
  dependencies: []
13
13
  description:
14
14
  email: andrew@ankane.org
@@ -26,6 +26,7 @@ files:
26
26
  - lib/tokenizers/3.1/tokenizers.so
27
27
  - lib/tokenizers/3.2/tokenizers.so
28
28
  - lib/tokenizers/3.3/tokenizers.so
29
+ - lib/tokenizers/added_token.rb
29
30
  - lib/tokenizers/char_bpe_tokenizer.rb
30
31
  - lib/tokenizers/decoders/bpe_decoder.rb
31
32
  - lib/tokenizers/decoders/ctc.rb