tiktoken_ruby 0.0.8-x86_64-linux → 0.0.9-x86_64-linux
Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: b2981777cb81fd3fade2688e66f0f6711c19956a3737b834fa1db1a1c0e2aabe
|
4
|
+
data.tar.gz: fbbac592954875ceb1c469f8266e3b69a845a3a960c8f1de7e45c2b0cf2dd74c
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 603c244d51c2254f15ab748ccade9f2dd3a5ebaa04b4e02119636a23901d3b24103231473ee97ccab36b82a19234a111312cad8919a5b1477638e592b6aa059b
|
7
|
+
data.tar.gz: cdf87538056946d3799027098b2ce43a3134d419513c0ad7f69db5ee6014c4bade22ab6e5d006537a1b6fb0e6ab86d88b1be39ef16babdd18d4e0e37545f71b2
|
data/Gemfile.lock
CHANGED
Binary file
|
Binary file
|
Binary file
|
data/lib/tiktoken_ruby.rb
CHANGED
@@ -64,13 +64,15 @@ module Tiktoken
|
|
64
64
|
:r50k_base,
|
65
65
|
:p50k_base,
|
66
66
|
:p50k_edit,
|
67
|
-
:cl100k_base
|
67
|
+
:cl100k_base,
|
68
|
+
:o200k_base
|
68
69
|
]
|
69
70
|
|
70
71
|
# taken from the python library here https://github.com/openai/tiktoken/blob/main/tiktoken/model.py
|
71
72
|
# that is also MIT licensed but by OpenAI
|
72
73
|
MODEL_TO_ENCODING_NAME = {
|
73
74
|
# chat
|
75
|
+
"gpt-4o": "o200k_base",
|
74
76
|
"gpt-4": "cl100k_base",
|
75
77
|
"gpt-3.5-turbo": "cl100k_base",
|
76
78
|
"gpt-35-turbo": "cl100k_base", # Azure deployment name
|
@@ -120,6 +122,7 @@ module Tiktoken
|
|
120
122
|
|
121
123
|
MODEL_PREFIX_TO_ENCODING = {
|
122
124
|
# chat
|
125
|
+
"gpt-4o-": "o200k_base", # e.g., gpt-4o-2024-05-13, etc.
|
123
126
|
"gpt-4-": "cl100k_base", # e.g., gpt-4-0314, etc., plus gpt-4-32k
|
124
127
|
"gpt-3.5-turbo-": "cl100k_base", # e.g, gpt-3.5-turbo-0301, -0401, etc.
|
125
128
|
"gpt-35-turbo-": "cl100k_base", # Azure deployment name
|
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: tiktoken_ruby
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.0.8
|
4
|
+
version: 0.0.9
|
5
5
|
platform: x86_64-linux
|
6
6
|
authors:
|
7
7
|
- IAPark
|
8
8
|
autorequire:
|
9
9
|
bindir: exe
|
10
10
|
cert_chain: []
|
11
|
-
date: 2024-
|
11
|
+
date: 2024-05-16 00:00:00.000000000 Z
|
12
12
|
dependencies: []
|
13
13
|
description: An unofficial Ruby wrapper for Tiktoken, a BPE tokenizer written by and
|
14
14
|
used by OpenAI. It can be used to count the number of tokens in text before sending
|