npm - @axlsdk/axl - Versions diffs - 0.7.5 → 0.7.6 - Mend

@axlsdk/axl 0.7.5 → 0.7.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (7)

package/dist/index.cjs (changed)

@@ -310,29 +310,32 @@ async function fetchWithRetry(input, init, maxRetries = MAX_RETRIES) {
 // src/providers/openai.ts
 var OPENAI_PRICING = {
-  "gpt-4o": [25e-7, 1e-5],
-  "gpt-4o-mini": [15e-8, 6e-7],
-  "gpt-4-turbo": [1e-5, 3e-5],
-  "gpt-4": [3e-5, 6e-5],
-  "gpt-3.5-turbo": [5e-7, 15e-7],
-  "gpt-5": [125e-8, 1e-5],
-  "gpt-5-mini": [25e-8, 2e-6],
-  "gpt-5-nano": [5e-8, 4e-7],
-  "gpt-5.1": [125e-8, 1e-5],
-  "gpt-5.2": [175e-8, 14e-6],
-  "gpt-5.3": [175e-8, 14e-6],
-  "gpt-5.4": [25e-7, 15e-6],
-  "gpt-5.4-pro": [3e-5, 18e-5],
-  o1: [15e-6, 6e-5],
-  "o1-mini": [3e-6, 12e-6],
-  "o1-pro": [15e-5, 6e-4],
-  o3: [1e-5, 4e-5],
-  "o3-mini": [11e-7, 44e-7],
-  "o3-pro": [2e-5, 8e-5],
-  "o4-mini": [11e-7, 44e-7],
-  "gpt-4.1": [2e-6, 8e-6],
-  "gpt-4.1-mini": [4e-7, 16e-7],
-  "gpt-4.1-nano": [1e-7, 4e-7]
+  // gpt-4o era — cache reads at 50% of input rate
+  "gpt-4o": [25e-7, 1e-5, 0.5],
+  "gpt-4o-mini": [15e-8, 6e-7, 0.5],
+  "gpt-4-turbo": [1e-5, 3e-5, 0.5],
+  "gpt-4": [3e-5, 6e-5, 0.5],
+  "gpt-3.5-turbo": [5e-7, 15e-7, 0.5],
+  o1: [15e-6, 6e-5, 0.5],
+  "o1-mini": [3e-6, 12e-6, 0.5],
+  "o1-pro": [15e-5, 6e-4, 0.5],
+  // gpt-4.1 / o3 / o4 era — cache reads at 25% of input rate
+  "gpt-4.1": [2e-6, 8e-6, 0.25],
+  "gpt-4.1-mini": [4e-7, 16e-7, 0.25],
+  "gpt-4.1-nano": [1e-7, 4e-7, 0.25],
+  o3: [1e-5, 4e-5, 0.25],
+  "o3-mini": [11e-7, 44e-7, 0.25],
+  "o3-pro": [2e-5, 8e-5, 0.25],
+  "o4-mini": [11e-7, 44e-7, 0.25],
+  // gpt-5 era — cache reads at 10% of input rate
+  "gpt-5": [125e-8, 1e-5, 0.1],
+  "gpt-5-mini": [25e-8, 2e-6, 0.1],
+  "gpt-5-nano": [5e-8, 4e-7, 0.1],
+  "gpt-5.1": [125e-8, 1e-5, 0.1],
+  "gpt-5.2": [175e-8, 14e-6, 0.1],
+  "gpt-5.3": [175e-8, 14e-6, 0.1],
+  "gpt-5.4": [25e-7, 15e-6, 0.1],
+  "gpt-5.4-pro": [3e-5, 18e-5, 0.1]
 };
 var PRICING_KEYS_BY_LENGTH = Object.keys(OPENAI_PRICING).sort((a, b) => b.length - a.length);
 function estimateOpenAICost(model, promptTokens, completionTokens, cachedTokens) {
@@ -346,9 +349,9 @@ function estimateOpenAICost(model, promptTokens, completionTokens, cachedTokens)
     }
   }
   if (!pricing) return 0;
-  const [inputRate, outputRate] = pricing;
+  const [inputRate, outputRate, cacheMultiplier] = pricing;
   const cached = cachedTokens ?? 0;
-  const inputCost = (promptTokens - cached) * inputRate + cached * inputRate * 0.5;
+  const inputCost = (promptTokens - cached) * inputRate + cached * inputRate * cacheMultiplier;
   return inputCost + completionTokens * outputRate;
 }
 function isOSeriesModel(model) {
@@ -458,7 +461,7 @@ var OpenAIProvider = class {
     if (!res.body) {
       throw new Error("OpenAI stream response has no body");
     }
-    yield* this.parseSSEStream(res.body);
+    yield* this.parseSSEStream(res.body, options.model);
   }
   // ---------------------------------------------------------------------------
   // Internal helpers
@@ -532,7 +535,7 @@ var OpenAIProvider = class {
     if (msg.tool_call_id) out.tool_call_id = msg.tool_call_id;
     return out;
   }
-  async *parseSSEStream(body) {
+  async *parseSSEStream(body, model) {
     const reader = body.getReader();
     const decoder = new TextDecoder();
     let buffer = "";
@@ -549,7 +552,16 @@ var OpenAIProvider = class {
           const trimmed = line.trim();
           if (!trimmed || trimmed.startsWith(":")) continue;
           if (trimmed === "data: [DONE]") {
-            yield { type: "done", usage: usageData };
+            yield {
+              type: "done",
+              usage: usageData,
+              cost: usageData ? estimateOpenAICost(
+                model,
+                usageData.prompt_tokens,
+                usageData.completion_tokens,
+                usageData.cached_tokens
+              ) : void 0
+            };
             return;
           }
           if (trimmed.startsWith("data: ")) {
@@ -592,7 +604,16 @@ var OpenAIProvider = class {
           }
         }
       }
-      yield { type: "done", usage: usageData };
+      yield {
+        type: "done",
+        usage: usageData,
+        cost: usageData ? estimateOpenAICost(
+          model,
+          usageData.prompt_tokens,
+          usageData.completion_tokens,
+          usageData.cached_tokens
+        ) : void 0
+      };
     } finally {
       reader.releaseLock();
     }
@@ -850,6 +871,7 @@ var OpenAIResponsesProvider = class {
     const decoder = new TextDecoder();
     let buffer = "";
     const callIdMap = /* @__PURE__ */ new Map();
+    let eventType = "";
     try {
       while (true) {
         const { done, value } = await reader.read();
@@ -857,7 +879,6 @@ var OpenAIResponsesProvider = class {
         buffer += decoder.decode(value, { stream: true });
         const lines = buffer.split("\n");
         buffer = lines.pop() ?? "";
-        let eventType = "";
         for (const line of lines) {
           const trimmed = line.trim();
           if (!trimmed || trimmed.startsWith(":")) continue;
@@ -925,7 +946,17 @@ var OpenAIResponsesProvider = class {
         } : void 0;
         const reasoningItems = response?.output?.filter((item) => item.type === "reasoning") ?? [];
         const providerMetadata = reasoningItems.length > 0 ? { openaiReasoningItems: reasoningItems } : void 0;
-        return { type: "done", usage, providerMetadata };
+        return {
+          type: "done",
+          usage,
+          cost: usage ? estimateOpenAICost(
+            model,
+            usage.prompt_tokens,
+            usage.completion_tokens,
+            usage.cached_tokens
+          ) : void 0,
+          providerMetadata
+        };
       }
       case "response.failed": {
         const errorMsg = data.response?.error?.message ?? data.response?.status_details?.error?.message ?? "Unknown error";
@@ -1058,7 +1089,7 @@ var AnthropicProvider = class {
     if (!res.body) {
       throw new Error("Anthropic stream response has no body");
     }
-    yield* this.parseSSEStream(res.body);
+    yield* this.parseSSEStream(res.body, options.model);
   }
   // ---------------------------------------------------------------------------
   // Internal: request building
@@ -1301,13 +1332,14 @@ ${jsonInstruction}` : jsonInstruction;
   // ---------------------------------------------------------------------------
   // Internal: SSE stream parsing
   // ---------------------------------------------------------------------------
-  async *parseSSEStream(body) {
+  async *parseSSEStream(body, model) {
     const reader = body.getReader();
     const decoder = new TextDecoder();
     let buffer = "";
     let currentToolId = "";
     let currentToolName = "";
     let usage;
+    let cacheWrite = 0;
     try {
       while (true) {
         const { done, value } = await reader.read();
@@ -1364,7 +1396,7 @@ ${jsonInstruction}` : jsonInstruction;
             case "message_start": {
               if (event.message?.usage) {
                 const cacheRead = event.message.usage.cache_read_input_tokens ?? 0;
-                const cacheWrite = event.message.usage.cache_creation_input_tokens ?? 0;
+                cacheWrite = event.message.usage.cache_creation_input_tokens ?? 0;
                 const inputTokens = (event.message.usage.input_tokens ?? 0) + cacheRead + cacheWrite;
                 usage = {
                   prompt_tokens: inputTokens,
@@ -1395,13 +1427,33 @@ ${jsonInstruction}` : jsonInstruction;
               if (usage) {
                 usage.total_tokens = usage.prompt_tokens + usage.completion_tokens;
               }
-              yield { type: "done", usage };
+              yield {
+                type: "done",
+                usage,
+                cost: usage ? estimateAnthropicCost(
+                  model,
+                  usage.prompt_tokens,
+                  usage.completion_tokens,
+                  usage.cached_tokens,
+                  cacheWrite
+                ) : void 0
+              };
               return;
             }
           }
         }
       }
-      yield { type: "done", usage };
+      yield {
+        type: "done",
+        usage,
+        cost: usage ? estimateAnthropicCost(
+          model,
+          usage.prompt_tokens,
+          usage.completion_tokens,
+          usage.cached_tokens,
+          cacheWrite
+        ) : void 0
+      };
     } finally {
       reader.releaseLock();
     }
@@ -1528,7 +1580,7 @@ var GeminiProvider = class {
     if (!res.body) {
       throw new Error("Gemini stream response has no body");
     }
-    yield* this.parseSSEStream(res.body);
+    yield* this.parseSSEStream(res.body, options.model);
   }
   // ---------------------------------------------------------------------------
   // Internal: request building
@@ -1809,7 +1861,7 @@ var GeminiProvider = class {
   // ---------------------------------------------------------------------------
   // Internal: SSE stream parsing
   // ---------------------------------------------------------------------------
-  async *parseSSEStream(body) {
+  async *parseSSEStream(body, model) {
     const reader = body.getReader();
     const decoder = new TextDecoder();
     let buffer = "";
@@ -1865,7 +1917,17 @@ var GeminiProvider = class {
         }
       }
       const providerMetadata = accumulatedParts.length > 0 ? { geminiParts: accumulatedParts } : void 0;
-      yield { type: "done", usage, providerMetadata };
+      yield {
+        type: "done",
+        usage,
+        cost: usage ? estimateGeminiCost(
+          model,
+          usage.prompt_tokens,
+          usage.completion_tokens,
+          usage.cached_tokens
+        ) : void 0,
+        providerMetadata
+      };
     } finally {
       reader.releaseLock();
     }
@@ -2575,7 +2637,8 @@ Please fix and try again.`;
               response = {
                 content: content2,
                 tool_calls: void 0,
-                usage: chunk.usage
+                usage: chunk.usage,
+                cost: chunk.cost
               };
             }
           }