tiktoken_ruby 0.0.8 → 0.0.9
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/Cargo.lock +110 -126
- data/Gemfile.lock +4 -4
- data/ext/tiktoken_ruby/Cargo.toml +2 -2
- data/ext/tiktoken_ruby/src/lib.rs +6 -0
- data/lib/tiktoken_ruby/version.rb +1 -1
- data/lib/tiktoken_ruby.rb +4 -1
- data/tiktoken_ruby.gemspec +1 -1
- metadata +6 -6
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: abd5db9516cf5d26ace1790e1267038910af214b3315d157e35df851530b83cb
|
4
|
+
data.tar.gz: 88541080f80f27a52c8a7eb9bd9a2baf4dc3c67af4ba152bc03150ade1c89f72
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: bdba999ff6ee22d57a993e7cbff9f1f95c22540973e7af26a58ded2e49e77c9863daedd936255a86c9722598b8fcc442d746c502d9b295f2758e52774aa8fd7c
|
7
|
+
data.tar.gz: 8917f5a08dbed662c890d0102c9d4be3d24a34d5537804b7ceb563819dd01e36d5b580d5e9f68a20464057620e8f2497558e0e3f1e0faf2afc044d2a4feec7e2
|
data/Cargo.lock
CHANGED
@@ -4,30 +4,30 @@ version = 3
|
|
4
4
|
|
5
5
|
[[package]]
|
6
6
|
name = "aho-corasick"
|
7
|
-
version = "
|
7
|
+
version = "1.1.3"
|
8
8
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
9
|
-
checksum = "
|
9
|
+
checksum = "8e60d3430d3a69478ad0993f19238d2df97c507009a52b3c10addcd7f6bcb916"
|
10
10
|
dependencies = [
|
11
11
|
"memchr",
|
12
12
|
]
|
13
13
|
|
14
14
|
[[package]]
|
15
15
|
name = "anyhow"
|
16
|
-
version = "1.0.
|
16
|
+
version = "1.0.83"
|
17
17
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
18
|
-
checksum = "
|
18
|
+
checksum = "25bdb32cbbdce2b519a9cd7df3a678443100e265d5e25ca763b7572a5104f5f3"
|
19
19
|
|
20
20
|
[[package]]
|
21
21
|
name = "autocfg"
|
22
|
-
version = "1.
|
22
|
+
version = "1.3.0"
|
23
23
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
24
|
-
checksum = "
|
24
|
+
checksum = "0c4b4d0bd25bd0b74681c0ad21497610ce1b7c91b1022cd21c80c6fbdd9476b0"
|
25
25
|
|
26
26
|
[[package]]
|
27
27
|
name = "base64"
|
28
|
-
version = "0.21.
|
28
|
+
version = "0.21.7"
|
29
29
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
30
|
-
checksum = "
|
30
|
+
checksum = "9d297deb1925b89f2ccc13d7635fa0714f12c87adce1c75356b39ca9b7178567"
|
31
31
|
|
32
32
|
[[package]]
|
33
33
|
name = "bindgen"
|
@@ -35,7 +35,7 @@ version = "0.69.4"
|
|
35
35
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
36
36
|
checksum = "a00dc851838a2120612785d195287475a3ac45514741da670b735818822129a0"
|
37
37
|
dependencies = [
|
38
|
-
"bitflags
|
38
|
+
"bitflags",
|
39
39
|
"cexpr",
|
40
40
|
"clang-sys",
|
41
41
|
"itertools",
|
@@ -66,24 +66,17 @@ checksum = "349f9b6a179ed607305526ca489b34ad0a41aed5f7980fa90eb03160b69598fb"
|
|
66
66
|
|
67
67
|
[[package]]
|
68
68
|
name = "bitflags"
|
69
|
-
version = "
|
70
|
-
source = "registry+https://github.com/rust-lang/crates.io-index"
|
71
|
-
checksum = "bef38d45163c2f1dde094a7dfd33ccf595c92905c8f8f4fdc18d06fb1037718a"
|
72
|
-
|
73
|
-
[[package]]
|
74
|
-
name = "bitflags"
|
75
|
-
version = "2.4.0"
|
69
|
+
version = "2.5.0"
|
76
70
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
77
|
-
checksum = "
|
71
|
+
checksum = "cf4b9d6a944f767f8e5e0db018570623c85f3d925ac718db4e06d0187adb21c1"
|
78
72
|
|
79
73
|
[[package]]
|
80
74
|
name = "bstr"
|
81
|
-
version = "1.
|
75
|
+
version = "1.9.1"
|
82
76
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
83
|
-
checksum = "
|
77
|
+
checksum = "05efc5cfd9110c8416e471df0e96702d58690178e206e61b7173706673c93706"
|
84
78
|
dependencies = [
|
85
79
|
"memchr",
|
86
|
-
"once_cell",
|
87
80
|
"regex-automata",
|
88
81
|
"serde",
|
89
82
|
]
|
@@ -105,9 +98,9 @@ checksum = "baf1de4339761588bc0619e3cbc0120ee582ebb74b53b4efbf79117bd2da40fd"
|
|
105
98
|
|
106
99
|
[[package]]
|
107
100
|
name = "clang-sys"
|
108
|
-
version = "1.
|
101
|
+
version = "1.7.0"
|
109
102
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
110
|
-
checksum = "
|
103
|
+
checksum = "67523a3b4be3ce1989d607a828d036249522dd9c1c8de7f4dd2dae43a37369d1"
|
111
104
|
dependencies = [
|
112
105
|
"glob",
|
113
106
|
"libc",
|
@@ -116,15 +109,15 @@ dependencies = [
|
|
116
109
|
|
117
110
|
[[package]]
|
118
111
|
name = "either"
|
119
|
-
version = "1.
|
112
|
+
version = "1.11.0"
|
120
113
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
121
|
-
checksum = "
|
114
|
+
checksum = "a47c1c47d2f5964e29c61246e81db715514cd532db6b5116a25ea3c03d6780a2"
|
122
115
|
|
123
116
|
[[package]]
|
124
117
|
name = "fancy-regex"
|
125
|
-
version = "0.
|
118
|
+
version = "0.12.0"
|
126
119
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
127
|
-
checksum = "
|
120
|
+
checksum = "7493d4c459da9f84325ad297371a6b2b8a162800873a22e3b6b6512e61d18c05"
|
128
121
|
dependencies = [
|
129
122
|
"bit-set",
|
130
123
|
"regex",
|
@@ -159,25 +152,25 @@ checksum = "830d08ce1d1d941e6b30645f1a0eb5643013d835ce3779a5fc208261dbe10f55"
|
|
159
152
|
|
160
153
|
[[package]]
|
161
154
|
name = "libc"
|
162
|
-
version = "0.2.
|
155
|
+
version = "0.2.154"
|
163
156
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
164
|
-
checksum = "
|
157
|
+
checksum = "ae743338b92ff9146ce83992f766a31066a91a8c84a45e0e9f21e7cf6de6d346"
|
165
158
|
|
166
159
|
[[package]]
|
167
160
|
name = "libloading"
|
168
|
-
version = "0.
|
161
|
+
version = "0.8.3"
|
169
162
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
170
|
-
checksum = "
|
163
|
+
checksum = "0c2a198fb6b0eada2a8df47933734e6d35d350665a33a3593d7164fa52c75c19"
|
171
164
|
dependencies = [
|
172
165
|
"cfg-if",
|
173
|
-
"
|
166
|
+
"windows-targets",
|
174
167
|
]
|
175
168
|
|
176
169
|
[[package]]
|
177
170
|
name = "lock_api"
|
178
|
-
version = "0.4.
|
171
|
+
version = "0.4.12"
|
179
172
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
180
|
-
checksum = "
|
173
|
+
checksum = "07af8b9cdd281b7915f413fa73f29ebd5d55d0d3f0155584dade1ff18cea1b17"
|
181
174
|
dependencies = [
|
182
175
|
"autocfg",
|
183
176
|
"scopeguard",
|
@@ -185,9 +178,9 @@ dependencies = [
|
|
185
178
|
|
186
179
|
[[package]]
|
187
180
|
name = "magnus"
|
188
|
-
version = "0.6.
|
181
|
+
version = "0.6.4"
|
189
182
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
190
|
-
checksum = "
|
183
|
+
checksum = "b1597ef40aa8c36be098249e82c9a20cf7199278ac1c1a1a995eeead6a184479"
|
191
184
|
dependencies = [
|
192
185
|
"magnus-macros",
|
193
186
|
"rb-sys",
|
@@ -208,9 +201,9 @@ dependencies = [
|
|
208
201
|
|
209
202
|
[[package]]
|
210
203
|
name = "memchr"
|
211
|
-
version = "2.
|
204
|
+
version = "2.7.2"
|
212
205
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
213
|
-
checksum = "
|
206
|
+
checksum = "6c8640c5d730cb13ebd907d8d04b52f55ac9a2eec55b440c8892f40d56c76c1d"
|
214
207
|
|
215
208
|
[[package]]
|
216
209
|
name = "minimal-lexical"
|
@@ -228,17 +221,11 @@ dependencies = [
|
|
228
221
|
"minimal-lexical",
|
229
222
|
]
|
230
223
|
|
231
|
-
[[package]]
|
232
|
-
name = "once_cell"
|
233
|
-
version = "1.17.1"
|
234
|
-
source = "registry+https://github.com/rust-lang/crates.io-index"
|
235
|
-
checksum = "b7e5500299e16ebb147ae15a00a942af264cf3688f47923b8fc2cd5858f23ad3"
|
236
|
-
|
237
224
|
[[package]]
|
238
225
|
name = "parking_lot"
|
239
|
-
version = "0.12.
|
226
|
+
version = "0.12.2"
|
240
227
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
241
|
-
checksum = "
|
228
|
+
checksum = "7e4af0ca4f6caed20e900d564c242b8e5d4903fdacf31d3daf527b66fe6f42fb"
|
242
229
|
dependencies = [
|
243
230
|
"lock_api",
|
244
231
|
"parking_lot_core",
|
@@ -246,49 +233,49 @@ dependencies = [
|
|
246
233
|
|
247
234
|
[[package]]
|
248
235
|
name = "parking_lot_core"
|
249
|
-
version = "0.9.
|
236
|
+
version = "0.9.10"
|
250
237
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
251
|
-
checksum = "
|
238
|
+
checksum = "1e401f977ab385c9e4e3ab30627d6f26d00e2c73eef317493c4ec6d468726cf8"
|
252
239
|
dependencies = [
|
253
240
|
"cfg-if",
|
254
241
|
"libc",
|
255
242
|
"redox_syscall",
|
256
243
|
"smallvec",
|
257
|
-
"windows-
|
244
|
+
"windows-targets",
|
258
245
|
]
|
259
246
|
|
260
247
|
[[package]]
|
261
248
|
name = "proc-macro2"
|
262
|
-
version = "1.0.
|
249
|
+
version = "1.0.82"
|
263
250
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
264
|
-
checksum = "
|
251
|
+
checksum = "8ad3d49ab951a01fbaafe34f2ec74122942fe18a3f9814c3268f1bb72042131b"
|
265
252
|
dependencies = [
|
266
253
|
"unicode-ident",
|
267
254
|
]
|
268
255
|
|
269
256
|
[[package]]
|
270
257
|
name = "quote"
|
271
|
-
version = "1.0.
|
258
|
+
version = "1.0.36"
|
272
259
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
273
|
-
checksum = "
|
260
|
+
checksum = "0fa76aaf39101c457836aec0ce2316dbdc3ab723cdda1c6bd4e6ad4208acaca7"
|
274
261
|
dependencies = [
|
275
262
|
"proc-macro2",
|
276
263
|
]
|
277
264
|
|
278
265
|
[[package]]
|
279
266
|
name = "rb-sys"
|
280
|
-
version = "0.9.
|
267
|
+
version = "0.9.97"
|
281
268
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
282
|
-
checksum = "
|
269
|
+
checksum = "47d30bcad206b51f2f66121190ca678dce1fdf3a2eae0ac5d838d1818b19bdf5"
|
283
270
|
dependencies = [
|
284
271
|
"rb-sys-build",
|
285
272
|
]
|
286
273
|
|
287
274
|
[[package]]
|
288
275
|
name = "rb-sys-build"
|
289
|
-
version = "0.9.
|
276
|
+
version = "0.9.97"
|
290
277
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
291
|
-
checksum = "
|
278
|
+
checksum = "3cbd92f281615f3c2dcb9dcb0f0576624752afbf9a7f99173b37c4b55b62dd8a"
|
292
279
|
dependencies = [
|
293
280
|
"bindgen",
|
294
281
|
"lazy_static",
|
@@ -307,35 +294,41 @@ checksum = "a35802679f07360454b418a5d1735c89716bde01d35b1560fc953c1415a0b3bb"
|
|
307
294
|
|
308
295
|
[[package]]
|
309
296
|
name = "redox_syscall"
|
310
|
-
version = "0.
|
297
|
+
version = "0.5.1"
|
311
298
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
312
|
-
checksum = "
|
299
|
+
checksum = "469052894dcb553421e483e4209ee581a45100d31b4018de03e5a7ad86374a7e"
|
313
300
|
dependencies = [
|
314
|
-
"bitflags
|
301
|
+
"bitflags",
|
315
302
|
]
|
316
303
|
|
317
304
|
[[package]]
|
318
305
|
name = "regex"
|
319
|
-
version = "1.
|
306
|
+
version = "1.10.4"
|
320
307
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
321
|
-
checksum = "
|
308
|
+
checksum = "c117dbdfde9c8308975b6a18d71f3f385c89461f7b3fb054288ecf2a2058ba4c"
|
322
309
|
dependencies = [
|
323
310
|
"aho-corasick",
|
324
311
|
"memchr",
|
312
|
+
"regex-automata",
|
325
313
|
"regex-syntax",
|
326
314
|
]
|
327
315
|
|
328
316
|
[[package]]
|
329
317
|
name = "regex-automata"
|
330
|
-
version = "0.
|
318
|
+
version = "0.4.6"
|
331
319
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
332
|
-
checksum = "
|
320
|
+
checksum = "86b83b8b9847f9bf95ef68afb0b8e6cdb80f498442f5179a29fad448fcc1eaea"
|
321
|
+
dependencies = [
|
322
|
+
"aho-corasick",
|
323
|
+
"memchr",
|
324
|
+
"regex-syntax",
|
325
|
+
]
|
333
326
|
|
334
327
|
[[package]]
|
335
328
|
name = "regex-syntax"
|
336
|
-
version = "0.
|
329
|
+
version = "0.8.3"
|
337
330
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
338
|
-
checksum = "
|
331
|
+
checksum = "adad44e29e4c806119491a7f06f03de4d1af22c3a680dd47f1e6e179439d1f56"
|
339
332
|
|
340
333
|
[[package]]
|
341
334
|
name = "rustc-hash"
|
@@ -345,9 +338,9 @@ checksum = "08d43f7aa6b08d49f382cde6a7982047c3426db949b1424bc4b7ec9ae12c6ce2"
|
|
345
338
|
|
346
339
|
[[package]]
|
347
340
|
name = "scopeguard"
|
348
|
-
version = "1.
|
341
|
+
version = "1.2.0"
|
349
342
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
350
|
-
checksum = "
|
343
|
+
checksum = "94143f37725109f92c262ed2cf5e59bce7498c01bcc1502d7b9afe439a4e9f49"
|
351
344
|
|
352
345
|
[[package]]
|
353
346
|
name = "seq-macro"
|
@@ -357,9 +350,23 @@ checksum = "a3f0bf26fd526d2a95683cd0f87bf103b8539e2ca1ef48ce002d67aad59aa0b4"
|
|
357
350
|
|
358
351
|
[[package]]
|
359
352
|
name = "serde"
|
360
|
-
version = "1.0.
|
353
|
+
version = "1.0.202"
|
361
354
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
362
|
-
checksum = "
|
355
|
+
checksum = "226b61a0d411b2ba5ff6d7f73a476ac4f8bb900373459cd00fab8512828ba395"
|
356
|
+
dependencies = [
|
357
|
+
"serde_derive",
|
358
|
+
]
|
359
|
+
|
360
|
+
[[package]]
|
361
|
+
name = "serde_derive"
|
362
|
+
version = "1.0.202"
|
363
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
364
|
+
checksum = "6048858004bcff69094cd972ed40a32500f153bd3be9f716b2eed2e8217c4838"
|
365
|
+
dependencies = [
|
366
|
+
"proc-macro2",
|
367
|
+
"quote",
|
368
|
+
"syn",
|
369
|
+
]
|
363
370
|
|
364
371
|
[[package]]
|
365
372
|
name = "shell-words"
|
@@ -369,21 +376,21 @@ checksum = "24188a676b6ae68c3b2cb3a01be17fbf7240ce009799bb56d5b1409051e78fde"
|
|
369
376
|
|
370
377
|
[[package]]
|
371
378
|
name = "shlex"
|
372
|
-
version = "1.
|
379
|
+
version = "1.3.0"
|
373
380
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
374
|
-
checksum = "
|
381
|
+
checksum = "0fda2ff0d084019ba4d7c6f371c95d8fd75ce3524c3cb8fb653a3023f6323e64"
|
375
382
|
|
376
383
|
[[package]]
|
377
384
|
name = "smallvec"
|
378
|
-
version = "1.
|
385
|
+
version = "1.13.2"
|
379
386
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
380
|
-
checksum = "
|
387
|
+
checksum = "3c5e1a9a646d36c3599cd173a41282daf47c44583ad367b8e6837255952e5c67"
|
381
388
|
|
382
389
|
[[package]]
|
383
390
|
name = "syn"
|
384
|
-
version = "2.0.
|
391
|
+
version = "2.0.63"
|
385
392
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
386
|
-
checksum = "
|
393
|
+
checksum = "bf5be731623ca1a1fb7d8be6f261a3be6d3e2337b8a1f97be944d020c8fcb704"
|
387
394
|
dependencies = [
|
388
395
|
"proc-macro2",
|
389
396
|
"quote",
|
@@ -392,8 +399,9 @@ dependencies = [
|
|
392
399
|
|
393
400
|
[[package]]
|
394
401
|
name = "tiktoken-rs"
|
395
|
-
version = "0.
|
396
|
-
source = "
|
402
|
+
version = "0.5.9"
|
403
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
404
|
+
checksum = "c314e7ce51440f9e8f5a497394682a57b7c323d0f4d0a6b1b13c429056e0e234"
|
397
405
|
dependencies = [
|
398
406
|
"anyhow",
|
399
407
|
"base64",
|
@@ -415,50 +423,20 @@ dependencies = [
|
|
415
423
|
|
416
424
|
[[package]]
|
417
425
|
name = "unicode-ident"
|
418
|
-
version = "1.0.
|
426
|
+
version = "1.0.12"
|
419
427
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
420
|
-
checksum = "
|
421
|
-
|
422
|
-
[[package]]
|
423
|
-
name = "winapi"
|
424
|
-
version = "0.3.9"
|
425
|
-
source = "registry+https://github.com/rust-lang/crates.io-index"
|
426
|
-
checksum = "5c839a674fcd7a98952e593242ea400abe93992746761e38641405d28b00f419"
|
427
|
-
dependencies = [
|
428
|
-
"winapi-i686-pc-windows-gnu",
|
429
|
-
"winapi-x86_64-pc-windows-gnu",
|
430
|
-
]
|
431
|
-
|
432
|
-
[[package]]
|
433
|
-
name = "winapi-i686-pc-windows-gnu"
|
434
|
-
version = "0.4.0"
|
435
|
-
source = "registry+https://github.com/rust-lang/crates.io-index"
|
436
|
-
checksum = "ac3b87c63620426dd9b991e5ce0329eff545bccbbb34f3be09ff6fb6ab51b7b6"
|
437
|
-
|
438
|
-
[[package]]
|
439
|
-
name = "winapi-x86_64-pc-windows-gnu"
|
440
|
-
version = "0.4.0"
|
441
|
-
source = "registry+https://github.com/rust-lang/crates.io-index"
|
442
|
-
checksum = "712e227841d057c1ee1cd2fb22fa7e5a5461ae8e48fa2ca79ec42cfc1931183f"
|
443
|
-
|
444
|
-
[[package]]
|
445
|
-
name = "windows-sys"
|
446
|
-
version = "0.45.0"
|
447
|
-
source = "registry+https://github.com/rust-lang/crates.io-index"
|
448
|
-
checksum = "75283be5efb2831d37ea142365f009c02ec203cd29a3ebecbc093d52315b66d0"
|
449
|
-
dependencies = [
|
450
|
-
"windows-targets",
|
451
|
-
]
|
428
|
+
checksum = "3354b9ac3fae1ff6755cb6db53683adb661634f67557942dea4facebec0fee4b"
|
452
429
|
|
453
430
|
[[package]]
|
454
431
|
name = "windows-targets"
|
455
|
-
version = "0.
|
432
|
+
version = "0.52.5"
|
456
433
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
457
|
-
checksum = "
|
434
|
+
checksum = "6f0713a46559409d202e70e28227288446bf7841d3211583a4b53e3f6d96e7eb"
|
458
435
|
dependencies = [
|
459
436
|
"windows_aarch64_gnullvm",
|
460
437
|
"windows_aarch64_msvc",
|
461
438
|
"windows_i686_gnu",
|
439
|
+
"windows_i686_gnullvm",
|
462
440
|
"windows_i686_msvc",
|
463
441
|
"windows_x86_64_gnu",
|
464
442
|
"windows_x86_64_gnullvm",
|
@@ -467,42 +445,48 @@ dependencies = [
|
|
467
445
|
|
468
446
|
[[package]]
|
469
447
|
name = "windows_aarch64_gnullvm"
|
470
|
-
version = "0.
|
448
|
+
version = "0.52.5"
|
471
449
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
472
|
-
checksum = "
|
450
|
+
checksum = "7088eed71e8b8dda258ecc8bac5fb1153c5cffaf2578fc8ff5d61e23578d3263"
|
473
451
|
|
474
452
|
[[package]]
|
475
453
|
name = "windows_aarch64_msvc"
|
476
|
-
version = "0.
|
454
|
+
version = "0.52.5"
|
477
455
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
478
|
-
checksum = "
|
456
|
+
checksum = "9985fd1504e250c615ca5f281c3f7a6da76213ebd5ccc9561496568a2752afb6"
|
479
457
|
|
480
458
|
[[package]]
|
481
459
|
name = "windows_i686_gnu"
|
482
|
-
version = "0.
|
460
|
+
version = "0.52.5"
|
461
|
+
source = "registry+https://github.com/rust-lang/crates.io-index"
|
462
|
+
checksum = "88ba073cf16d5372720ec942a8ccbf61626074c6d4dd2e745299726ce8b89670"
|
463
|
+
|
464
|
+
[[package]]
|
465
|
+
name = "windows_i686_gnullvm"
|
466
|
+
version = "0.52.5"
|
483
467
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
484
|
-
checksum = "
|
468
|
+
checksum = "87f4261229030a858f36b459e748ae97545d6f1ec60e5e0d6a3d32e0dc232ee9"
|
485
469
|
|
486
470
|
[[package]]
|
487
471
|
name = "windows_i686_msvc"
|
488
|
-
version = "0.
|
472
|
+
version = "0.52.5"
|
489
473
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
490
|
-
checksum = "
|
474
|
+
checksum = "db3c2bf3d13d5b658be73463284eaf12830ac9a26a90c717b7f771dfe97487bf"
|
491
475
|
|
492
476
|
[[package]]
|
493
477
|
name = "windows_x86_64_gnu"
|
494
|
-
version = "0.
|
478
|
+
version = "0.52.5"
|
495
479
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
496
|
-
checksum = "
|
480
|
+
checksum = "4e4246f76bdeff09eb48875a0fd3e2af6aada79d409d33011886d3e1581517d9"
|
497
481
|
|
498
482
|
[[package]]
|
499
483
|
name = "windows_x86_64_gnullvm"
|
500
|
-
version = "0.
|
484
|
+
version = "0.52.5"
|
501
485
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
502
|
-
checksum = "
|
486
|
+
checksum = "852298e482cd67c356ddd9570386e2862b5673c85bd5f88df9ab6802b334c596"
|
503
487
|
|
504
488
|
[[package]]
|
505
489
|
name = "windows_x86_64_msvc"
|
506
|
-
version = "0.
|
490
|
+
version = "0.52.5"
|
507
491
|
source = "registry+https://github.com/rust-lang/crates.io-index"
|
508
|
-
checksum = "
|
492
|
+
checksum = "bec47e5bfd1bff0eeaf6d8b485cc1074891a197ab4225d504cb7a1ab88b02bf0"
|
data/Gemfile.lock
CHANGED
@@ -1,8 +1,8 @@
|
|
1
1
|
PATH
|
2
2
|
remote: .
|
3
3
|
specs:
|
4
|
-
tiktoken_ruby (0.0.
|
5
|
-
rb_sys (
|
4
|
+
tiktoken_ruby (0.0.9)
|
5
|
+
rb_sys (= 0.9.87)
|
6
6
|
|
7
7
|
GEM
|
8
8
|
remote: https://rubygems.org/
|
@@ -22,7 +22,7 @@ GEM
|
|
22
22
|
rake (13.1.0)
|
23
23
|
rake-compiler (1.2.5)
|
24
24
|
rake
|
25
|
-
rb_sys (0.9.
|
25
|
+
rb_sys (0.9.87)
|
26
26
|
regexp_parser (2.9.0)
|
27
27
|
rexml (3.2.6)
|
28
28
|
rspec (3.12.0)
|
@@ -89,4 +89,4 @@ DEPENDENCIES
|
|
89
89
|
yard-doctest
|
90
90
|
|
91
91
|
BUNDLED WITH
|
92
|
-
2.4.
|
92
|
+
2.4.4
|
@@ -11,5 +11,5 @@ crate-type = ["cdylib"]
|
|
11
11
|
|
12
12
|
[dependencies]
|
13
13
|
magnus = { version = "0.6.1" }
|
14
|
-
rb-sys = { version = "
|
15
|
-
tiktoken-rs = {
|
14
|
+
rb-sys = { version = "0.9.87", features = ["stable-api-compiled-fallback"] }
|
15
|
+
tiktoken-rs = { version = "0.5.9" }
|
@@ -20,6 +20,11 @@ fn cl100k_base() -> CoreBPEWrapper {
|
|
20
20
|
CoreBPEWrapper::new(core_bpe)
|
21
21
|
}
|
22
22
|
|
23
|
+
fn o200k_base() -> CoreBPEWrapper {
|
24
|
+
let core_bpe = tiktoken_rs::o200k_base().unwrap();
|
25
|
+
CoreBPEWrapper::new(core_bpe)
|
26
|
+
}
|
27
|
+
|
23
28
|
fn module() -> Result<RModule, magnus::Error> {
|
24
29
|
define_module("Tiktoken")
|
25
30
|
}
|
@@ -37,6 +42,7 @@ fn init() -> Result<(), Error> {
|
|
37
42
|
factory_module.define_singleton_method("p50k_base", function!(p50k_base, 0))?;
|
38
43
|
factory_module.define_singleton_method("p50k_edit", function!(p50k_edit, 0))?;
|
39
44
|
factory_module.define_singleton_method("cl100k_base", function!(cl100k_base, 0))?;
|
45
|
+
factory_module.define_singleton_method("o200k_base", function!(o200k_base, 0))?;
|
40
46
|
|
41
47
|
let ext_module = module.define_module("Ext")?;
|
42
48
|
let bpe_class = ext_module.define_class("CoreBPE", class::object())?;
|
data/lib/tiktoken_ruby.rb
CHANGED
@@ -64,13 +64,15 @@ module Tiktoken
|
|
64
64
|
:r50k_base,
|
65
65
|
:p50k_base,
|
66
66
|
:p50k_edit,
|
67
|
-
:cl100k_base
|
67
|
+
:cl100k_base,
|
68
|
+
:o200k_base
|
68
69
|
]
|
69
70
|
|
70
71
|
# taken from the python library here https://github.com/openai/tiktoken/blob/main/tiktoken/model.py
|
71
72
|
# that is also MIT licensed but by OpenAI
|
72
73
|
MODEL_TO_ENCODING_NAME = {
|
73
74
|
# chat
|
75
|
+
"gpt-4o": "o200k_base",
|
74
76
|
"gpt-4": "cl100k_base",
|
75
77
|
"gpt-3.5-turbo": "cl100k_base",
|
76
78
|
"gpt-35-turbo": "cl100k_base", # Azure deployment name
|
@@ -120,6 +122,7 @@ module Tiktoken
|
|
120
122
|
|
121
123
|
MODEL_PREFIX_TO_ENCODING = {
|
122
124
|
# chat
|
125
|
+
"gpt-4o-": "o200k_base", # e.g., gpt-4o-2024-05-13, etc.
|
123
126
|
"gpt-4-": "cl100k_base", # e.g., gpt-4-0314, etc., plus gpt-4-32k
|
124
127
|
"gpt-3.5-turbo-": "cl100k_base", # e.g, gpt-3.5-turbo-0301, -0401, etc.
|
125
128
|
"gpt-35-turbo-": "cl100k_base", # Azure deployment name
|
data/tiktoken_ruby.gemspec
CHANGED
@@ -29,5 +29,5 @@ Gem::Specification.new do |spec|
|
|
29
29
|
spec.executables = spec.files.grep(%r{\Aexe/}) { |f| File.basename(f) }
|
30
30
|
spec.require_paths = ["lib"]
|
31
31
|
spec.extensions = ["ext/tiktoken_ruby/extconf.rb"]
|
32
|
-
spec.add_dependency "rb_sys", "
|
32
|
+
spec.add_dependency "rb_sys", "= 0.9.87"
|
33
33
|
end
|
metadata
CHANGED
@@ -1,29 +1,29 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: tiktoken_ruby
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.0.
|
4
|
+
version: 0.0.9
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- IAPark
|
8
8
|
autorequire:
|
9
9
|
bindir: exe
|
10
10
|
cert_chain: []
|
11
|
-
date: 2024-
|
11
|
+
date: 2024-05-16 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: rb_sys
|
15
15
|
requirement: !ruby/object:Gem::Requirement
|
16
16
|
requirements:
|
17
|
-
- -
|
17
|
+
- - '='
|
18
18
|
- !ruby/object:Gem::Version
|
19
|
-
version: 0.9.
|
19
|
+
version: 0.9.87
|
20
20
|
type: :runtime
|
21
21
|
prerelease: false
|
22
22
|
version_requirements: !ruby/object:Gem::Requirement
|
23
23
|
requirements:
|
24
|
-
- -
|
24
|
+
- - '='
|
25
25
|
- !ruby/object:Gem::Version
|
26
|
-
version: 0.9.
|
26
|
+
version: 0.9.87
|
27
27
|
description: An unofficial Ruby wrapper for Tiktoken, a BPE tokenizer written by and
|
28
28
|
used by OpenAI. It can be used to count the number of tokens in text before sending
|
29
29
|
it to OpenAI APIs.
|