ai-token-estimator 1.0.2 → 1.1.0

package/README.md CHANGED
@@ -39,6 +39,29 @@ console.log(getAvailableModels());
  // ['gpt-5.2', 'gpt-4o', 'claude-opus-4.5', 'gemini-3-pro', ...]
  ```

+ ## Exact OpenAI tokenization (BPE)
+
+ This package includes **exact tokenization for OpenAI models** using a tiktoken-compatible BPE tokenizer (via `gpt-tokenizer`).
+
+ Notes:
+ - Encodings are **lazy-loaded on first use** (one-time cost per encoding).
+ - Exact tokenization is **slower** than heuristic estimation; `estimate()` defaults to `'heuristic'` to keep existing behavior fast.
+ - `encode` / `decode` and `estimate({ tokenizer: 'openai_exact' })` require **Node.js** (uses `node:module` under the hood).
+
+ ```ts
+ import { encode, decode } from 'ai-token-estimator';
+
+ const text = 'Hello, world!';
+ const tokens = encode(text, { model: 'gpt-5.1' }); // exact OpenAI token IDs
+ const roundTrip = decode(tokens, { model: 'gpt-5.1' });
+
+ console.log(tokens.length);
+ console.log(roundTrip); // "Hello, world!"
+ ```
+
+ Supported encodings:
+ `r50k_base`, `p50k_base`, `p50k_edit`, `cl100k_base`, `o200k_base`, `o200k_harmony`
+
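Per the `EncodeOptions` declaration shipped in this release, an explicit `encoding` can also be passed instead of a model ID, and it takes precedence over `model` when both are given. A minimal sketch of that override path:

```ts
import { encode, decode } from 'ai-token-estimator';

// Select the BPE encoding directly; per the EncodeOptions docs in this
// release, `encoding` wins over `model` when both are supplied.
const ids = encode('Hello, world!', { encoding: 'o200k_base' });
console.log(decode(ids, { encoding: 'o200k_base' })); // "Hello, world!"
```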
  ## API Reference

  ### `estimate(input: EstimateInput): EstimateOutput`
@@ -52,6 +75,7 @@ interface EstimateInput {
  text: string; // The text to estimate tokens for
  model: string; // Model ID (e.g., 'gpt-4o', 'claude-opus-4.5')
  rounding?: 'ceil' | 'round' | 'floor'; // Rounding strategy (default: 'ceil')
+ tokenizer?: 'heuristic' | 'openai_exact' | 'auto'; // Token counting strategy (default: 'heuristic')
  }
  ```
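The new `tokenizer` field is the main behavioral addition in 1.1.0. A short sketch of the three modes, based on the bundled sources under `dist/`:

```ts
import { estimate } from 'ai-token-estimator';

// Default: fast chars-per-token heuristic (unchanged from 1.0.x).
const heuristic = estimate({ text: 'Hello, world!', model: 'gpt-5.1' });

// 'openai_exact': exact BPE tokenization; throws for claude-*/gemini-* models.
const exact = estimate({
  text: 'Hello, world!',
  model: 'gpt-5.1',
  tokenizer: 'openai_exact',
});
console.log(exact.tokenizerMode); // 'openai_exact'
console.log(exact.encodingUsed);  // e.g. 'o200k_base'

// 'auto': exact for OpenAI models, silent heuristic fallback otherwise.
const auto = estimate({ text: 'Hello!', model: 'claude-opus-4.5', tokenizer: 'auto' });
console.log(auto.tokenizerMode); // 'heuristic'
```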

@@ -64,13 +88,36 @@ interface EstimateOutput {
  estimatedTokens: number; // Estimated token count (integer)
  estimatedInputCost: number; // Estimated cost in USD
  charsPerToken: number; // The ratio used for this model
+ tokenizerMode?: 'heuristic' | 'openai_exact' | 'auto'; // Which strategy was used
+ encodingUsed?: string; // OpenAI encoding when using exact tokenization
  }
  ```

+ ### `countTokens(input: TokenCountInput): TokenCountOutput`
+
+ Counts tokens for a given model:
+ - OpenAI models: **exact** BPE tokenization
+ - Other providers: heuristic estimate
+
+ ```ts
+ import { countTokens } from 'ai-token-estimator';
+
+ const result = countTokens({ text: 'Hello, world!', model: 'gpt-5.1' });
+ // { tokens: 4, exact: true, encoding: 'o200k_base' }
+ ```
+
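For non-OpenAI models the same call degrades gracefully: per the bundled `token-counter` source, the result is flagged inexact and carries no `encoding`. A sketch:

```ts
import { countTokens } from 'ai-token-estimator';

// claude-*/gemini-* models are routed to the heuristic estimator,
// so `exact` is false and `encoding` is undefined.
const claude = countTokens({ text: 'Hello, world!', model: 'claude-opus-4.5' });
console.log(claude.exact);    // false
console.log(claude.encoding); // undefined

if (!claude.exact) {
  // Treat the count as an estimate, e.g. pad token budgets accordingly.
  console.log(`~${claude.tokens} tokens (heuristic)`);
}
```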
  ### `getAvailableModels(): string[]`

  Returns an array of all supported model IDs.

+ ### `encode(text: string, options?: EncodeOptions): number[]`
+
+ Encodes text into **OpenAI token IDs** using tiktoken-compatible BPE tokenization.
+
+ ### `decode(tokens: Iterable<number>, options?: { encoding?: OpenAIEncoding; model?: string }): string`
+
+ Decodes OpenAI token IDs back into text using the selected encoding/model.
+
  ### `getModelConfig(model: string): ModelConfig`

  Returns the configuration for a specific model. Throws if the model is not found.
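Since `getModelConfig` throws on unknown IDs, a defensive lookup is worth sketching. The helper name `tryGetConfig` below is illustrative, not part of the package API:

```ts
import { getAvailableModels, getModelConfig } from 'ai-token-estimator';

function tryGetConfig(model: string) {
  try {
    return getModelConfig(model); // throws if the model is not found
  } catch {
    return undefined;
  }
}

// Or validate up front against the supported-model list.
const openAIModels = getAvailableModels().filter(
  (id) => !id.startsWith('claude-') && !id.startsWith('gemini-'),
);
console.log(openAIModels.includes('gpt-5.2')); // true
```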
@@ -108,6 +155,14 @@ This package counts Unicode code points, not UTF-16 code units. This means:
  - Accented characters count correctly
  - Most source code characters count as 1

+ ## Benchmarks (repo only)
+
+ This repository includes a small benchmark script to compare heuristic vs exact OpenAI tokenization:
+
+ ```bash
+ npm run benchmark:tokenizer
+ ```
+
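The benchmark script itself ships only in the repository, not in the published package, so its contents do not appear in this diff. A rough sketch of what such a comparison could look like (an assumption of shape, not the actual `benchmark/tokenizer.ts`):

```ts
import { estimate } from 'ai-token-estimator';

const text = 'Hello, world! '.repeat(10_000);

for (const tokenizer of ['heuristic', 'openai_exact'] as const) {
  // Note: the first 'openai_exact' call also pays the one-time
  // lazy-load cost for the encoding, per the README notes above.
  const start = performance.now();
  const result = estimate({ text, model: 'gpt-4o', tokenizer });
  const ms = performance.now() - start;
  console.log(`${tokenizer}: ${result.estimatedTokens} tokens in ${ms.toFixed(1)} ms`);
}
```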
  <!-- SUPPORTED_MODELS_START -->
  ## Supported Models

@@ -117,20 +172,70 @@ This package counts Unicode code points, not UTF-16 code units. This means:

  | Model | Chars/Token | Input Cost (per 1M tokens) |
  |-------|-------------|---------------------------|
- | gpt-4.1 | 4 | $3.00 |
+ | babbage-002 | 4 | $0.40 |
+ | chatgpt-4o-latest | 4 | $5.00 |
+ | chatgpt-image-latest | 4 | $5.00 |
+ | codex-mini-latest | 4 | $1.50 |
+ | computer-use-preview | 4 | $3.00 |
+ | davinci-002 | 4 | $2.00 |
+ | gpt-3.5-0301 | 4 | $1.50 |
+ | gpt-3.5-turbo | 4 | $0.50 |
+ | gpt-3.5-turbo-0125 | 4 | $0.50 |
+ | gpt-3.5-turbo-0613 | 4 | $1.50 |
+ | gpt-3.5-turbo-1106 | 4 | $1.00 |
+ | gpt-3.5-turbo-16k-0613 | 4 | $3.00 |
+ | gpt-3.5-turbo-instruct | 4 | $1.50 |
+ | gpt-4-0125-preview | 4 | $10.00 |
+ | gpt-4-0314 | 4 | $30.00 |
+ | gpt-4-0613 | 4 | $30.00 |
+ | gpt-4-1106-preview | 4 | $10.00 |
+ | gpt-4-1106-vision-preview | 4 | $10.00 |
+ | gpt-4-32k | 4 | $60.00 |
+ | gpt-4-turbo-2024-04-09 | 4 | $10.00 |
+ | gpt-4.1 | 4 | $2.00 |
  | gpt-4.1-mini | 4 | $0.40 |
  | gpt-4.1-nano | 4 | $0.10 |
  | gpt-4o | 4 | $2.50 |
+ | gpt-4o-2024-05-13 | 4 | $5.00 |
+ | gpt-4o-audio-preview | 4 | $2.50 |
  | gpt-4o-mini | 4 | $0.15 |
+ | gpt-4o-mini-audio-preview | 4 | $0.15 |
+ | gpt-4o-mini-realtime-preview | 4 | $0.60 |
+ | gpt-4o-mini-search-preview | 4 | $0.15 |
+ | gpt-4o-realtime-preview | 4 | $5.00 |
+ | gpt-4o-search-preview | 4 | $2.50 |
+ | gpt-5 | 4 | $1.25 |
+ | gpt-5-chat-latest | 4 | $1.25 |
+ | gpt-5-codex | 4 | $1.25 |
  | gpt-5-mini | 4 | $0.25 |
+ | gpt-5-nano | 4 | $0.05 |
+ | gpt-5-pro | 4 | $15.00 |
+ | gpt-5-search-api | 4 | $1.25 |
+ | gpt-5.1 | 4 | $1.25 |
+ | gpt-5.1-chat-latest | 4 | $1.25 |
+ | gpt-5.1-codex | 4 | $1.25 |
+ | gpt-5.1-codex-max | 4 | $1.25 |
+ | gpt-5.1-codex-mini | 4 | $0.25 |
  | gpt-5.2 | 4 | $1.75 |
+ | gpt-5.2-chat-latest | 4 | $1.75 |
+ | gpt-5.2-codex | 4 | $1.75 |
  | gpt-5.2-pro | 4 | $21.00 |
+ | gpt-audio | 4 | $2.50 |
+ | gpt-audio-mini | 4 | $0.60 |
+ | gpt-image-1 | 4 | $5.00 |
+ | gpt-image-1-mini | 4 | $2.00 |
+ | gpt-image-1.5 | 4 | $5.00 |
  | gpt-realtime | 4 | $4.00 |
  | gpt-realtime-mini | 4 | $0.60 |
  | o1 | 4 | $15.00 |
+ | o1-mini | 4 | $1.10 |
  | o1-pro | 4 | $150.00 |
  | o3 | 4 | $2.00 |
- | o4-mini | 4 | $4.00 |
+ | o3-deep-research | 4 | $10.00 |
+ | o3-mini | 4 | $1.10 |
+ | o3-pro | 4 | $20.00 |
+ | o4-mini | 4 | $1.10 |
+ | o4-mini-deep-research | 4 | $2.00 |
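As a sanity check on the updated table: with the heuristic ratio of 4 chars/token, a 100,000-character prompt to `gpt-4.1` at its new $2.00 per 1M input tokens comes to 25,000 tokens, or $0.05. In code:

```ts
import { estimate } from 'ai-token-estimator';

const result = estimate({ text: 'x'.repeat(100_000), model: 'gpt-4.1' });
console.log(result.estimatedTokens);    // 25000  (100000 / 4)
console.log(result.estimatedInputCost); // 0.05   (25000 * 2.00 / 1e6)
```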

  ### Anthropic Claude Models

@@ -164,13 +269,13 @@ This package counts Unicode code points, not UTF-16 code units. This means:
  | gemini-3-flash | 4 | $0.50 |
  | gemini-3-pro | 4 | $2.00 |

- *Last updated: 2025-12-25*
+ *Last updated: 2026-01-14*
  <!-- SUPPORTED_MODELS_END -->

  ## Pricing Updates

  Model pricing is automatically updated weekly via GitHub Actions. The update script fetches the latest prices directly from:
- - [OpenAI Pricing](https://openai.com/api/pricing/)
+ - [OpenAI Pricing](https://platform.openai.com/docs/pricing)
  - [Anthropic Pricing](https://www.anthropic.com/pricing)
  - [Google AI Pricing](https://ai.google.dev/gemini-api/docs/pricing)

@@ -178,7 +283,7 @@ You can check when prices were last updated:

  ```typescript
  import { LAST_UPDATED } from 'ai-token-estimator';
- console.log(LAST_UPDATED); // '2025-12-25'
+ console.log(LAST_UPDATED); // e.g. '2026-01-14'
  ```

  ## License
package/dist/index.cjs CHANGED
@@ -22,6 +22,9 @@ var index_exports = {};
  __export(index_exports, {
  DEFAULT_MODELS: () => DEFAULT_MODELS,
  LAST_UPDATED: () => LAST_UPDATED,
+ countTokens: () => countTokens,
+ decode: () => decode,
+ encode: () => encode,
  estimate: () => estimate,
  getAvailableModels: () => getAvailableModels,
  getModelConfig: () => getModelConfig
@@ -29,44 +32,224 @@ __export(index_exports, {
  module.exports = __toCommonJS(index_exports);

  // src/models.ts
- var LAST_UPDATED = "2025-12-25";
+ var LAST_UPDATED = "2026-01-14";
  var models = {
  // ===================
  // OpenAI Models
  // ===================
  // OpenAI uses ~4 chars per token for English text
- "gpt-4.1": {
+ "babbage-002": {
+ charsPerToken: 4,
+ inputCostPerMillion: 0.4
+ },
+ "chatgpt-4o-latest": {
+ charsPerToken: 4,
+ inputCostPerMillion: 5
+ },
+ "chatgpt-image-latest": {
+ charsPerToken: 4,
+ inputCostPerMillion: 5
+ },
+ "codex-mini-latest": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.5
+ },
+ "computer-use-preview": {
+ charsPerToken: 4,
+ inputCostPerMillion: 3
+ },
+ "davinci-002": {
+ charsPerToken: 4,
+ inputCostPerMillion: 2
+ },
+ "gpt-3.5-0301": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.5
+ },
+ "gpt-3.5-turbo": {
+ charsPerToken: 4,
+ inputCostPerMillion: 0.5
+ },
+ "gpt-3.5-turbo-0125": {
+ charsPerToken: 4,
+ inputCostPerMillion: 0.5
+ },
+ "gpt-3.5-turbo-0613": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.5
+ },
+ "gpt-3.5-turbo-1106": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1
+ },
+ "gpt-3.5-turbo-16k-0613": {
  charsPerToken: 4,
  inputCostPerMillion: 3
  },
+ "gpt-3.5-turbo-instruct": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.5
+ },
+ "gpt-4-0125-preview": {
+ charsPerToken: 4,
+ inputCostPerMillion: 10
+ },
+ "gpt-4-0314": {
+ charsPerToken: 4,
+ inputCostPerMillion: 30
+ },
+ "gpt-4-0613": {
+ charsPerToken: 4,
+ inputCostPerMillion: 30
+ },
+ "gpt-4-1106-preview": {
+ charsPerToken: 4,
+ inputCostPerMillion: 10
+ },
+ "gpt-4-1106-vision-preview": {
+ charsPerToken: 4,
+ inputCostPerMillion: 10
+ },
+ "gpt-4-32k": {
+ charsPerToken: 4,
+ inputCostPerMillion: 60
+ },
+ "gpt-4-turbo-2024-04-09": {
+ charsPerToken: 4,
+ inputCostPerMillion: 10
+ },
+ "gpt-4.1": {
+ charsPerToken: 4,
+ inputCostPerMillion: 2
+ },
  "gpt-4.1-mini": {
  charsPerToken: 4,
- inputCostPerMillion: 0.8
+ inputCostPerMillion: 0.4
  },
  "gpt-4.1-nano": {
  charsPerToken: 4,
- inputCostPerMillion: 0.2
+ inputCostPerMillion: 0.1
  },
  "gpt-4o": {
  charsPerToken: 4,
  inputCostPerMillion: 2.5
  },
+ "gpt-4o-2024-05-13": {
+ charsPerToken: 4,
+ inputCostPerMillion: 5
+ },
+ "gpt-4o-audio-preview": {
+ charsPerToken: 4,
+ inputCostPerMillion: 2.5
+ },
  "gpt-4o-mini": {
  charsPerToken: 4,
  inputCostPerMillion: 0.15
  },
+ "gpt-4o-mini-audio-preview": {
+ charsPerToken: 4,
+ inputCostPerMillion: 0.15
+ },
+ "gpt-4o-mini-realtime-preview": {
+ charsPerToken: 4,
+ inputCostPerMillion: 0.6
+ },
+ "gpt-4o-mini-search-preview": {
+ charsPerToken: 4,
+ inputCostPerMillion: 0.15
+ },
+ "gpt-4o-realtime-preview": {
+ charsPerToken: 4,
+ inputCostPerMillion: 5
+ },
+ "gpt-4o-search-preview": {
+ charsPerToken: 4,
+ inputCostPerMillion: 2.5
+ },
+ "gpt-5": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.25
+ },
  "gpt-5-mini": {
  charsPerToken: 4,
  inputCostPerMillion: 0.25
  },
+ "gpt-5-nano": {
+ charsPerToken: 4,
+ inputCostPerMillion: 0.05
+ },
+ "gpt-5-pro": {
+ charsPerToken: 4,
+ inputCostPerMillion: 15
+ },
+ "gpt-5-search-api": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.25
+ },
+ "gpt-5.1": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.25
+ },
+ "gpt-5.1-chat-latest": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.25
+ },
+ "gpt-5.1-codex": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.25
+ },
+ "gpt-5.1-codex-max": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.25
+ },
+ "gpt-5.1-codex-mini": {
+ charsPerToken: 4,
+ inputCostPerMillion: 0.25
+ },
+ "gpt-5-chat-latest": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.25
+ },
+ "gpt-5-codex": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.25
+ },
  "gpt-5.2": {
  charsPerToken: 4,
  inputCostPerMillion: 1.75
  },
+ "gpt-5.2-chat-latest": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.75
+ },
+ "gpt-5.2-codex": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.75
+ },
  "gpt-5.2-pro": {
  charsPerToken: 4,
  inputCostPerMillion: 21
  },
+ "gpt-audio": {
+ charsPerToken: 4,
+ inputCostPerMillion: 2.5
+ },
+ "gpt-audio-mini": {
+ charsPerToken: 4,
+ inputCostPerMillion: 0.6
+ },
+ "gpt-image-1": {
+ charsPerToken: 4,
+ inputCostPerMillion: 5
+ },
+ "gpt-image-1-mini": {
+ charsPerToken: 4,
+ inputCostPerMillion: 2
+ },
+ "gpt-image-1.5": {
+ charsPerToken: 4,
+ inputCostPerMillion: 5
+ },
  "gpt-realtime": {
  charsPerToken: 4,
  inputCostPerMillion: 4
@@ -79,6 +262,10 @@ var models = {
  charsPerToken: 4,
  inputCostPerMillion: 15
  },
+ "o1-mini": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.1
+ },
  "o1-pro": {
  charsPerToken: 4,
  inputCostPerMillion: 150
@@ -87,9 +274,25 @@ var models = {
  charsPerToken: 4,
  inputCostPerMillion: 2
  },
+ "o3-deep-research": {
+ charsPerToken: 4,
+ inputCostPerMillion: 10
+ },
+ "o3-mini": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.1
+ },
+ "o3-pro": {
+ charsPerToken: 4,
+ inputCostPerMillion: 20
+ },
  "o4-mini": {
  charsPerToken: 4,
- inputCostPerMillion: 4
+ inputCostPerMillion: 1.1
+ },
+ "o4-mini-deep-research": {
+ charsPerToken: 4,
+ inputCostPerMillion: 2
  },
  // ===================
  // Anthropic Models
@@ -204,6 +407,79 @@ function getAvailableModels() {
  return Object.keys(DEFAULT_MODELS);
  }

+ // src/openai-bpe.ts
+ var import_node_module = require("module");
+ var import_constants = require("gpt-tokenizer/constants");
+ var import_mapping = require("gpt-tokenizer/mapping");
+ var import_meta = {};
+ var requireBase = typeof __filename === "string" && __filename.length > 0 ? __filename : import_meta.url;
+ var NODE_REQUIRE = (0, import_node_module.createRequire)(requireBase);
+ var ENCODING_MODULES = {
+ r50k_base: "gpt-tokenizer/cjs/encoding/r50k_base",
+ p50k_base: "gpt-tokenizer/cjs/encoding/p50k_base",
+ p50k_edit: "gpt-tokenizer/cjs/encoding/p50k_edit",
+ cl100k_base: "gpt-tokenizer/cjs/encoding/cl100k_base",
+ o200k_base: "gpt-tokenizer/cjs/encoding/o200k_base",
+ o200k_harmony: "gpt-tokenizer/cjs/encoding/o200k_harmony"
+ };
+ var encodingApiCache = /* @__PURE__ */ new Map();
+ function getEncodingApi(encoding) {
+ const cached = encodingApiCache.get(encoding);
+ if (cached) return cached;
+ const modulePath = ENCODING_MODULES[encoding];
+ const mod = NODE_REQUIRE(modulePath);
+ const api = { encode: mod.encode, decode: mod.decode };
+ encodingApiCache.set(encoding, api);
+ return api;
+ }
+ function resolveEncoding(selector) {
+ if (selector?.encoding) {
+ return selector.encoding;
+ }
+ const model = selector?.model?.trim();
+ if (model) {
+ const mapped = import_mapping.modelToEncodingMap[model];
+ if (mapped) {
+ return mapped;
+ }
+ }
+ return import_mapping.DEFAULT_ENCODING;
+ }
+ function getOpenAIEncoding(selector) {
+ return resolveEncoding(selector);
+ }
+ function toGptTokenizerEncodeOptions(allowSpecial) {
+ const mode = allowSpecial ?? "none_raise";
+ switch (mode) {
+ case "all":
+ return {
+ allowedSpecial: import_constants.ALL_SPECIAL_TOKENS,
+ disallowedSpecial: /* @__PURE__ */ new Set()
+ };
+ case "none":
+ return {
+ allowedSpecial: /* @__PURE__ */ new Set(),
+ disallowedSpecial: /* @__PURE__ */ new Set()
+ };
+ case "none_raise":
+ default:
+ return {
+ disallowedSpecial: import_constants.ALL_SPECIAL_TOKENS
+ };
+ }
+ }
+ function encode(text, options) {
+ const encoding = resolveEncoding(options);
+ const api = getEncodingApi(encoding);
+ const encodeOptions = toGptTokenizerEncodeOptions(options?.allowSpecial);
+ return api.encode(text, encodeOptions);
+ }
+ function decode(tokens, options) {
+ const encoding = resolveEncoding(options);
+ const api = getEncodingApi(encoding);
+ return api.decode(tokens);
+ }
+
  // src/estimator.ts
  function countCodePoints(text) {
  let count = 0;
@@ -213,21 +489,43 @@ function countCodePoints(text) {
  return count;
  }
  function estimate(input) {
- const { text, model, rounding = "ceil" } = input;
+ const { text, model, rounding = "ceil", tokenizer = "heuristic" } = input;
  const config = getModelConfig(model);
  const characterCount = countCodePoints(text);
- const rawTokens = characterCount / config.charsPerToken;
+ const isNonOpenAIModel2 = model.startsWith("claude-") || model.startsWith("gemini-");
  let estimatedTokens;
- switch (rounding) {
- case "floor":
- estimatedTokens = Math.floor(rawTokens);
- break;
- case "round":
- estimatedTokens = Math.round(rawTokens);
- break;
- case "ceil":
- default:
- estimatedTokens = Math.ceil(rawTokens);
+ let tokenizerModeUsed = "heuristic";
+ let encodingUsed;
+ const shouldTryExact = tokenizer === "openai_exact" || tokenizer === "auto";
+ if (shouldTryExact && !isNonOpenAIModel2) {
+ try {
+ estimatedTokens = encode(text, { model, allowSpecial: "none" }).length;
+ tokenizerModeUsed = "openai_exact";
+ encodingUsed = getOpenAIEncoding({ model });
+ } catch (error) {
+ if (tokenizer === "openai_exact") {
+ throw error;
+ }
+ }
+ } else if (tokenizer === "openai_exact" && isNonOpenAIModel2) {
+ throw new Error(
+ `Tokenizer mode "openai_exact" requested for non-OpenAI model: "${model}"`
+ );
+ }
+ if (estimatedTokens === void 0) {
+ const rawTokens = characterCount / config.charsPerToken;
+ switch (rounding) {
+ case "floor":
+ estimatedTokens = Math.floor(rawTokens);
+ break;
+ case "round":
+ estimatedTokens = Math.round(rawTokens);
+ break;
+ case "ceil":
+ default:
+ estimatedTokens = Math.ceil(rawTokens);
+ }
+ tokenizerModeUsed = "heuristic";
  }
  const estimatedInputCost = estimatedTokens * config.inputCostPerMillion / 1e6;
  return {
@@ -235,13 +533,44 @@ function estimate(input) {
  characterCount,
  estimatedTokens,
  estimatedInputCost,
- charsPerToken: config.charsPerToken
+ charsPerToken: config.charsPerToken,
+ tokenizerMode: tokenizerModeUsed,
+ encodingUsed
  };
  }
+
+ // src/token-counter.ts
+ function isNonOpenAIModel(model) {
+ return model.startsWith("claude-") || model.startsWith("gemini-");
+ }
+ function countTokens(input) {
+ const { text, model } = input;
+ if (isNonOpenAIModel(model)) {
+ return {
+ tokens: estimate({ text, model }).estimatedTokens,
+ exact: false
+ };
+ }
+ try {
+ return {
+ tokens: encode(text, { model, allowSpecial: "none" }).length,
+ exact: true,
+ encoding: getOpenAIEncoding({ model })
+ };
+ } catch {
+ return {
+ tokens: estimate({ text, model }).estimatedTokens,
+ exact: false
+ };
+ }
+ }
  // Annotate the CommonJS export names for ESM import in node:
  0 && (module.exports = {
  DEFAULT_MODELS,
  LAST_UPDATED,
+ countTokens,
+ decode,
+ encode,
  estimate,
  getAvailableModels,
  getModelConfig
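One behavior worth calling out from the bundled `openai-bpe` source above: the default special-token mode is `none_raise`, so raw special-token markers in input text throw. A hedged sketch, using `<|endoftext|>` as a representative special token:

```ts
import { encode } from 'ai-token-estimator';

const text = 'before <|endoftext|> after';

// Default mode is 'none_raise': special tokens in the input throw.
try {
  encode(text, { model: 'gpt-4o' });
} catch {
  console.log('special token rejected (default none_raise mode)');
}

// 'none': the marker is tokenized as ordinary text.
const plain = encode(text, { model: 'gpt-4o', allowSpecial: 'none' });

// 'all': the marker is emitted as a single special token ID.
const special = encode(text, { model: 'gpt-4o', allowSpecial: 'all' });
console.log(plain.length, special.length); // plain is likely longer: text tokens vs one special ID
```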
package/dist/index.d.cts CHANGED
@@ -7,6 +7,7 @@ interface ModelConfig {
  /** Cost in USD per 1 million input tokens */
  inputCostPerMillion: number;
  }
+ type TokenizerMode = 'heuristic' | 'openai_exact' | 'auto';
  /**
  * Input parameters for the estimate function.
  */
@@ -17,6 +18,13 @@ interface EstimateInput {
  model: string;
  /** Rounding strategy for token count (default: 'ceil') */
  rounding?: 'ceil' | 'round' | 'floor';
+ /**
+ * Token counting strategy.
+ * - `heuristic` (default): use chars-per-token ratios
+ * - `openai_exact`: use OpenAI BPE tokenization (throws if non-OpenAI model)
+ * - `auto`: use OpenAI BPE for OpenAI models, otherwise heuristic
+ */
+ tokenizer?: TokenizerMode;
  }
  /**
  * Output from the estimate function.
@@ -32,6 +40,10 @@ interface EstimateOutput {
  estimatedInputCost: number;
  /** The chars-per-token ratio used */
  charsPerToken: number;
+ /** Which tokenizer strategy was used */
+ tokenizerMode?: TokenizerMode;
+ /** OpenAI encoding used when tokenizerMode is `openai_exact` */
+ encodingUsed?: string;
  }

  /**
@@ -57,16 +69,16 @@ declare function estimate(input: EstimateInput): EstimateOutput;
  * Default model configurations.
  *
  * AUTO-GENERATED FILE - DO NOT EDIT MANUALLY
- * Last updated: 2025-12-25
+ * Last updated: 2026-01-14
  *
  * Sources:
- * - OpenAI: https://openai.com/api/pricing/
+ * - OpenAI: https://platform.openai.com/docs/pricing
  * - Anthropic: https://www.anthropic.com/pricing
  * - Google: https://ai.google.dev/gemini-api/docs/pricing
  *
  * This file is automatically updated weekly by GitHub Actions.
  */
- declare const LAST_UPDATED = "2025-12-25";
+ declare const LAST_UPDATED = "2026-01-14";
  declare const DEFAULT_MODELS: Readonly<Record<string, Readonly<ModelConfig>>>;
  /**
  * Get configuration for a specific model.
@@ -81,4 +93,52 @@ declare function getModelConfig(model: string): ModelConfig;
  */
  declare function getAvailableModels(): string[];

- export { DEFAULT_MODELS, type EstimateInput, type EstimateOutput, LAST_UPDATED, type ModelConfig, estimate, getAvailableModels, getModelConfig };
+ type OpenAIEncoding = 'r50k_base' | 'p50k_base' | 'p50k_edit' | 'cl100k_base' | 'o200k_base' | 'o200k_harmony';
+ type SpecialTokenHandling = 'all' | 'none' | 'none_raise';
+ interface EncodeOptions {
+ /**
+ * Explicit OpenAI encoding override.
+ * When provided, this takes precedence over `model`.
+ */
+ encoding?: OpenAIEncoding;
+ /**
+ * OpenAI model ID used to select the appropriate encoding.
+ */
+ model?: string;
+ /**
+ * How special tokens are handled.
+ * - `none_raise` (default): throw if special tokens appear
+ * - `none`: treat special tokens as regular text
+ * - `all`: allow special tokens and encode them as special token IDs
+ */
+ allowSpecial?: SpecialTokenHandling;
+ }
+ /**
+ * Encode text into OpenAI token IDs using tiktoken-compatible BPE encoding.
+ *
+ * This is exact tokenization for OpenAI models (unlike heuristic estimators).
+ */
+ declare function encode(text: string, options?: EncodeOptions): number[];
+ /**
+ * Decode OpenAI token IDs into text using tiktoken-compatible BPE encoding.
+ */
+ declare function decode(tokens: Iterable<number>, options?: Pick<EncodeOptions, 'encoding' | 'model'>): string;
+
+ interface TokenCountInput {
+ text: string;
+ model: string;
+ }
+ interface TokenCountOutput {
+ tokens: number;
+ exact: boolean;
+ encoding?: OpenAIEncoding;
+ }
+ /**
+ * Count tokens for a given model.
+ *
+ * - OpenAI models: exact BPE tokenization
+ * - Other providers: heuristic estimate (chars-per-token)
+ */
+ declare function countTokens(input: TokenCountInput): TokenCountOutput;
+
+ export { DEFAULT_MODELS, type EncodeOptions, type EstimateInput, type EstimateOutput, LAST_UPDATED, type ModelConfig, type OpenAIEncoding, type SpecialTokenHandling, type TokenCountInput, type TokenCountOutput, type TokenizerMode, countTokens, decode, encode, estimate, getAvailableModels, getModelConfig };
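The exported types make the exact/heuristic distinction visible to the type checker. A small sketch using the declarations above (the `describe` helper is illustrative):

```ts
import {
  countTokens,
  type OpenAIEncoding,
  type TokenCountOutput,
} from 'ai-token-estimator';

function describe(result: TokenCountOutput): string {
  // `encoding` is only populated when the count is exact.
  const enc: OpenAIEncoding | undefined = result.encoding;
  return result.exact
    ? `${result.tokens} tokens (exact, ${enc})`
    : `~${result.tokens} tokens (heuristic)`;
}

console.log(describe(countTokens({ text: 'hi', model: 'gpt-4o' })));
```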
package/dist/index.d.ts CHANGED
@@ -7,6 +7,7 @@ interface ModelConfig {
  /** Cost in USD per 1 million input tokens */
  inputCostPerMillion: number;
  }
+ type TokenizerMode = 'heuristic' | 'openai_exact' | 'auto';
  /**
  * Input parameters for the estimate function.
  */
@@ -17,6 +18,13 @@ interface EstimateInput {
  model: string;
  /** Rounding strategy for token count (default: 'ceil') */
  rounding?: 'ceil' | 'round' | 'floor';
+ /**
+ * Token counting strategy.
+ * - `heuristic` (default): use chars-per-token ratios
+ * - `openai_exact`: use OpenAI BPE tokenization (throws if non-OpenAI model)
+ * - `auto`: use OpenAI BPE for OpenAI models, otherwise heuristic
+ */
+ tokenizer?: TokenizerMode;
  }
  /**
  * Output from the estimate function.
@@ -32,6 +40,10 @@ interface EstimateOutput {
  estimatedInputCost: number;
  /** The chars-per-token ratio used */
  charsPerToken: number;
+ /** Which tokenizer strategy was used */
+ tokenizerMode?: TokenizerMode;
+ /** OpenAI encoding used when tokenizerMode is `openai_exact` */
+ encodingUsed?: string;
  }

  /**
@@ -57,16 +69,16 @@ declare function estimate(input: EstimateInput): EstimateOutput;
  * Default model configurations.
  *
  * AUTO-GENERATED FILE - DO NOT EDIT MANUALLY
- * Last updated: 2025-12-25
+ * Last updated: 2026-01-14
  *
  * Sources:
- * - OpenAI: https://openai.com/api/pricing/
+ * - OpenAI: https://platform.openai.com/docs/pricing
  * - Anthropic: https://www.anthropic.com/pricing
  * - Google: https://ai.google.dev/gemini-api/docs/pricing
  *
  * This file is automatically updated weekly by GitHub Actions.
  */
- declare const LAST_UPDATED = "2025-12-25";
+ declare const LAST_UPDATED = "2026-01-14";
  declare const DEFAULT_MODELS: Readonly<Record<string, Readonly<ModelConfig>>>;
  /**
  * Get configuration for a specific model.
@@ -81,4 +93,52 @@ declare function getModelConfig(model: string): ModelConfig;
  */
  declare function getAvailableModels(): string[];

- export { DEFAULT_MODELS, type EstimateInput, type EstimateOutput, LAST_UPDATED, type ModelConfig, estimate, getAvailableModels, getModelConfig };
+ type OpenAIEncoding = 'r50k_base' | 'p50k_base' | 'p50k_edit' | 'cl100k_base' | 'o200k_base' | 'o200k_harmony';
+ type SpecialTokenHandling = 'all' | 'none' | 'none_raise';
+ interface EncodeOptions {
+ /**
+ * Explicit OpenAI encoding override.
+ * When provided, this takes precedence over `model`.
+ */
+ encoding?: OpenAIEncoding;
+ /**
+ * OpenAI model ID used to select the appropriate encoding.
+ */
+ model?: string;
+ /**
+ * How special tokens are handled.
+ * - `none_raise` (default): throw if special tokens appear
+ * - `none`: treat special tokens as regular text
+ * - `all`: allow special tokens and encode them as special token IDs
+ */
+ allowSpecial?: SpecialTokenHandling;
+ }
+ /**
+ * Encode text into OpenAI token IDs using tiktoken-compatible BPE encoding.
+ *
+ * This is exact tokenization for OpenAI models (unlike heuristic estimators).
+ */
+ declare function encode(text: string, options?: EncodeOptions): number[];
+ /**
+ * Decode OpenAI token IDs into text using tiktoken-compatible BPE encoding.
+ */
+ declare function decode(tokens: Iterable<number>, options?: Pick<EncodeOptions, 'encoding' | 'model'>): string;
+
+ interface TokenCountInput {
+ text: string;
+ model: string;
+ }
+ interface TokenCountOutput {
+ tokens: number;
+ exact: boolean;
+ encoding?: OpenAIEncoding;
+ }
+ /**
+ * Count tokens for a given model.
+ *
+ * - OpenAI models: exact BPE tokenization
+ * - Other providers: heuristic estimate (chars-per-token)
+ */
+ declare function countTokens(input: TokenCountInput): TokenCountOutput;
+
+ export { DEFAULT_MODELS, type EncodeOptions, type EstimateInput, type EstimateOutput, LAST_UPDATED, type ModelConfig, type OpenAIEncoding, type SpecialTokenHandling, type TokenCountInput, type TokenCountOutput, type TokenizerMode, countTokens, decode, encode, estimate, getAvailableModels, getModelConfig };
package/dist/index.js CHANGED
@@ -1,42 +1,222 @@
  // src/models.ts
- var LAST_UPDATED = "2025-12-25";
+ var LAST_UPDATED = "2026-01-14";
  var models = {
  // ===================
  // OpenAI Models
  // ===================
  // OpenAI uses ~4 chars per token for English text
- "gpt-4.1": {
+ "babbage-002": {
+ charsPerToken: 4,
+ inputCostPerMillion: 0.4
+ },
+ "chatgpt-4o-latest": {
+ charsPerToken: 4,
+ inputCostPerMillion: 5
+ },
+ "chatgpt-image-latest": {
+ charsPerToken: 4,
+ inputCostPerMillion: 5
+ },
+ "codex-mini-latest": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.5
+ },
+ "computer-use-preview": {
+ charsPerToken: 4,
+ inputCostPerMillion: 3
+ },
+ "davinci-002": {
+ charsPerToken: 4,
+ inputCostPerMillion: 2
+ },
+ "gpt-3.5-0301": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.5
+ },
+ "gpt-3.5-turbo": {
+ charsPerToken: 4,
+ inputCostPerMillion: 0.5
+ },
+ "gpt-3.5-turbo-0125": {
+ charsPerToken: 4,
+ inputCostPerMillion: 0.5
+ },
+ "gpt-3.5-turbo-0613": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.5
+ },
+ "gpt-3.5-turbo-1106": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1
+ },
+ "gpt-3.5-turbo-16k-0613": {
  charsPerToken: 4,
  inputCostPerMillion: 3
  },
+ "gpt-3.5-turbo-instruct": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.5
+ },
+ "gpt-4-0125-preview": {
+ charsPerToken: 4,
+ inputCostPerMillion: 10
+ },
+ "gpt-4-0314": {
+ charsPerToken: 4,
+ inputCostPerMillion: 30
+ },
+ "gpt-4-0613": {
+ charsPerToken: 4,
+ inputCostPerMillion: 30
+ },
+ "gpt-4-1106-preview": {
+ charsPerToken: 4,
+ inputCostPerMillion: 10
+ },
+ "gpt-4-1106-vision-preview": {
+ charsPerToken: 4,
+ inputCostPerMillion: 10
+ },
+ "gpt-4-32k": {
+ charsPerToken: 4,
+ inputCostPerMillion: 60
+ },
+ "gpt-4-turbo-2024-04-09": {
+ charsPerToken: 4,
+ inputCostPerMillion: 10
+ },
+ "gpt-4.1": {
+ charsPerToken: 4,
+ inputCostPerMillion: 2
+ },
  "gpt-4.1-mini": {
  charsPerToken: 4,
- inputCostPerMillion: 0.8
+ inputCostPerMillion: 0.4
  },
  "gpt-4.1-nano": {
  charsPerToken: 4,
- inputCostPerMillion: 0.2
+ inputCostPerMillion: 0.1
  },
  "gpt-4o": {
  charsPerToken: 4,
  inputCostPerMillion: 2.5
  },
+ "gpt-4o-2024-05-13": {
+ charsPerToken: 4,
+ inputCostPerMillion: 5
+ },
+ "gpt-4o-audio-preview": {
+ charsPerToken: 4,
+ inputCostPerMillion: 2.5
+ },
  "gpt-4o-mini": {
  charsPerToken: 4,
  inputCostPerMillion: 0.15
  },
+ "gpt-4o-mini-audio-preview": {
+ charsPerToken: 4,
+ inputCostPerMillion: 0.15
+ },
+ "gpt-4o-mini-realtime-preview": {
+ charsPerToken: 4,
+ inputCostPerMillion: 0.6
+ },
+ "gpt-4o-mini-search-preview": {
+ charsPerToken: 4,
+ inputCostPerMillion: 0.15
+ },
+ "gpt-4o-realtime-preview": {
+ charsPerToken: 4,
+ inputCostPerMillion: 5
+ },
+ "gpt-4o-search-preview": {
+ charsPerToken: 4,
+ inputCostPerMillion: 2.5
+ },
+ "gpt-5": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.25
+ },
  "gpt-5-mini": {
  charsPerToken: 4,
  inputCostPerMillion: 0.25
  },
+ "gpt-5-nano": {
+ charsPerToken: 4,
+ inputCostPerMillion: 0.05
+ },
+ "gpt-5-pro": {
+ charsPerToken: 4,
+ inputCostPerMillion: 15
+ },
+ "gpt-5-search-api": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.25
+ },
+ "gpt-5.1": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.25
+ },
+ "gpt-5.1-chat-latest": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.25
+ },
+ "gpt-5.1-codex": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.25
+ },
+ "gpt-5.1-codex-max": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.25
+ },
+ "gpt-5.1-codex-mini": {
+ charsPerToken: 4,
+ inputCostPerMillion: 0.25
+ },
+ "gpt-5-chat-latest": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.25
+ },
+ "gpt-5-codex": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.25
+ },
  "gpt-5.2": {
  charsPerToken: 4,
  inputCostPerMillion: 1.75
  },
+ "gpt-5.2-chat-latest": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.75
+ },
+ "gpt-5.2-codex": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.75
+ },
  "gpt-5.2-pro": {
  charsPerToken: 4,
  inputCostPerMillion: 21
  },
+ "gpt-audio": {
+ charsPerToken: 4,
+ inputCostPerMillion: 2.5
+ },
+ "gpt-audio-mini": {
+ charsPerToken: 4,
+ inputCostPerMillion: 0.6
+ },
+ "gpt-image-1": {
+ charsPerToken: 4,
+ inputCostPerMillion: 5
+ },
+ "gpt-image-1-mini": {
+ charsPerToken: 4,
+ inputCostPerMillion: 2
+ },
+ "gpt-image-1.5": {
+ charsPerToken: 4,
+ inputCostPerMillion: 5
+ },
  "gpt-realtime": {
  charsPerToken: 4,
  inputCostPerMillion: 4
@@ -49,6 +229,10 @@ var models = {
  charsPerToken: 4,
  inputCostPerMillion: 15
  },
+ "o1-mini": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.1
+ },
  "o1-pro": {
  charsPerToken: 4,
  inputCostPerMillion: 150
@@ -57,9 +241,25 @@ var models = {
  charsPerToken: 4,
  inputCostPerMillion: 2
  },
+ "o3-deep-research": {
+ charsPerToken: 4,
+ inputCostPerMillion: 10
+ },
+ "o3-mini": {
+ charsPerToken: 4,
+ inputCostPerMillion: 1.1
+ },
+ "o3-pro": {
+ charsPerToken: 4,
+ inputCostPerMillion: 20
+ },
  "o4-mini": {
  charsPerToken: 4,
- inputCostPerMillion: 4
+ inputCostPerMillion: 1.1
+ },
+ "o4-mini-deep-research": {
+ charsPerToken: 4,
+ inputCostPerMillion: 2
  },
  // ===================
  // Anthropic Models
@@ -174,6 +374,78 @@ function getAvailableModels() {
  return Object.keys(DEFAULT_MODELS);
  }

+ // src/openai-bpe.ts
+ import { createRequire } from "module";
+ import { ALL_SPECIAL_TOKENS } from "gpt-tokenizer/constants";
+ import { DEFAULT_ENCODING, modelToEncodingMap } from "gpt-tokenizer/mapping";
+ var requireBase = typeof __filename === "string" && __filename.length > 0 ? __filename : import.meta.url;
+ var NODE_REQUIRE = createRequire(requireBase);
+ var ENCODING_MODULES = {
+ r50k_base: "gpt-tokenizer/cjs/encoding/r50k_base",
+ p50k_base: "gpt-tokenizer/cjs/encoding/p50k_base",
+ p50k_edit: "gpt-tokenizer/cjs/encoding/p50k_edit",
+ cl100k_base: "gpt-tokenizer/cjs/encoding/cl100k_base",
+ o200k_base: "gpt-tokenizer/cjs/encoding/o200k_base",
+ o200k_harmony: "gpt-tokenizer/cjs/encoding/o200k_harmony"
+ };
+ var encodingApiCache = /* @__PURE__ */ new Map();
+ function getEncodingApi(encoding) {
+ const cached = encodingApiCache.get(encoding);
+ if (cached) return cached;
+ const modulePath = ENCODING_MODULES[encoding];
+ const mod = NODE_REQUIRE(modulePath);
+ const api = { encode: mod.encode, decode: mod.decode };
+ encodingApiCache.set(encoding, api);
+ return api;
+ }
+ function resolveEncoding(selector) {
+ if (selector?.encoding) {
+ return selector.encoding;
+ }
+ const model = selector?.model?.trim();
+ if (model) {
+ const mapped = modelToEncodingMap[model];
+ if (mapped) {
+ return mapped;
+ }
+ }
+ return DEFAULT_ENCODING;
+ }
+ function getOpenAIEncoding(selector) {
+ return resolveEncoding(selector);
+ }
+ function toGptTokenizerEncodeOptions(allowSpecial) {
+ const mode = allowSpecial ?? "none_raise";
+ switch (mode) {
+ case "all":
+ return {
+ allowedSpecial: ALL_SPECIAL_TOKENS,
+ disallowedSpecial: /* @__PURE__ */ new Set()
+ };
+ case "none":
+ return {
+ allowedSpecial: /* @__PURE__ */ new Set(),
+ disallowedSpecial: /* @__PURE__ */ new Set()
+ };
+ case "none_raise":
+ default:
+ return {
+ disallowedSpecial: ALL_SPECIAL_TOKENS
+ };
+ }
+ }
+ function encode(text, options) {
+ const encoding = resolveEncoding(options);
+ const api = getEncodingApi(encoding);
+ const encodeOptions = toGptTokenizerEncodeOptions(options?.allowSpecial);
+ return api.encode(text, encodeOptions);
+ }
+ function decode(tokens, options) {
+ const encoding = resolveEncoding(options);
+ const api = getEncodingApi(encoding);
+ return api.decode(tokens);
+ }
+
  // src/estimator.ts
  function countCodePoints(text) {
  let count = 0;
@@ -183,21 +455,43 @@ function countCodePoints(text) {
  return count;
  }
  function estimate(input) {
- const { text, model, rounding = "ceil" } = input;
+ const { text, model, rounding = "ceil", tokenizer = "heuristic" } = input;
  const config = getModelConfig(model);
  const characterCount = countCodePoints(text);
- const rawTokens = characterCount / config.charsPerToken;
+ const isNonOpenAIModel2 = model.startsWith("claude-") || model.startsWith("gemini-");
  let estimatedTokens;
- switch (rounding) {
- case "floor":
- estimatedTokens = Math.floor(rawTokens);
- break;
- case "round":
- estimatedTokens = Math.round(rawTokens);
- break;
- case "ceil":
- default:
- estimatedTokens = Math.ceil(rawTokens);
+ let tokenizerModeUsed = "heuristic";
+ let encodingUsed;
+ const shouldTryExact = tokenizer === "openai_exact" || tokenizer === "auto";
+ if (shouldTryExact && !isNonOpenAIModel2) {
+ try {
+ estimatedTokens = encode(text, { model, allowSpecial: "none" }).length;
+ tokenizerModeUsed = "openai_exact";
+ encodingUsed = getOpenAIEncoding({ model });
+ } catch (error) {
+ if (tokenizer === "openai_exact") {
+ throw error;
+ }
+ }
+ } else if (tokenizer === "openai_exact" && isNonOpenAIModel2) {
+ throw new Error(
+ `Tokenizer mode "openai_exact" requested for non-OpenAI model: "${model}"`
+ );
+ }
+ if (estimatedTokens === void 0) {
+ const rawTokens = characterCount / config.charsPerToken;
+ switch (rounding) {
+ case "floor":
+ estimatedTokens = Math.floor(rawTokens);
+ break;
+ case "round":
+ estimatedTokens = Math.round(rawTokens);
+ break;
+ case "ceil":
+ default:
+ estimatedTokens = Math.ceil(rawTokens);
+ }
+ tokenizerModeUsed = "heuristic";
  }
  const estimatedInputCost = estimatedTokens * config.inputCostPerMillion / 1e6;
  return {
@@ -205,12 +499,43 @@ function estimate(input) {
  characterCount,
  estimatedTokens,
  estimatedInputCost,
- charsPerToken: config.charsPerToken
+ charsPerToken: config.charsPerToken,
+ tokenizerMode: tokenizerModeUsed,
+ encodingUsed
  };
  }
+
+ // src/token-counter.ts
+ function isNonOpenAIModel(model) {
+ return model.startsWith("claude-") || model.startsWith("gemini-");
+ }
+ function countTokens(input) {
+ const { text, model } = input;
+ if (isNonOpenAIModel(model)) {
+ return {
+ tokens: estimate({ text, model }).estimatedTokens,
+ exact: false
+ };
+ }
+ try {
+ return {
+ tokens: encode(text, { model, allowSpecial: "none" }).length,
+ exact: true,
+ encoding: getOpenAIEncoding({ model })
+ };
+ } catch {
+ return {
+ tokens: estimate({ text, model }).estimatedTokens,
+ exact: false
+ };
+ }
+ }
  export {
  DEFAULT_MODELS,
  LAST_UPDATED,
+ countTokens,
+ decode,
+ encode,
  estimate,
  getAvailableModels,
  getModelConfig
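Both builds throw the same error when exact tokenization is forced for a non-OpenAI model. A sketch of that failure mode, taken straight from the `estimate` logic above:

```ts
import { estimate } from 'ai-token-estimator';

try {
  estimate({
    text: 'Hello!',
    model: 'gemini-3-pro',
    tokenizer: 'openai_exact', // claude-*/gemini-* models reject this mode
  });
} catch (error) {
  console.error((error as Error).message);
  // Tokenizer mode "openai_exact" requested for non-OpenAI model: "gemini-3-pro"
}
```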
package/package.json CHANGED
@@ -1,6 +1,6 @@
  {
  "name": "ai-token-estimator",
- "version": "1.0.2",
+ "version": "1.1.0",
  "description": "Estimate token counts and costs for LLM API calls",
  "type": "module",
  "main": "./dist/index.cjs",
@@ -23,13 +23,17 @@
  "LICENSE",
  "README.md"
  ],
+ "dependencies": {
+ "gpt-tokenizer": "^3.4.0"
+ },
  "scripts": {
  "build": "tsup src/index.ts --format cjs,esm --dts",
  "test": "vitest run",
  "test:watch": "vitest",
  "lint": "eslint src tests",
  "prepublishOnly": "npm run lint && npm run test && npm run build",
- "update-pricing": "tsx scripts/update-pricing.ts"
+ "update-pricing": "tsx scripts/update-pricing.ts",
+ "benchmark:tokenizer": "tsx benchmark/tokenizer.ts"
  },
  "keywords": [
  "llm",