npm - trickle-observe - Versions diffs - 0.2.124 → 0.2.126 - Mend

trickle-observe 0.2.124 → 0.2.126

This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (3)

package/dist/llm-observer.js CHANGED Viewed

@@ -54,10 +54,10 @@ let llmFile = null;
 let eventCount = 0;
 const MAX_LLM_EVENTS = 500;
 const TRUNCATE_LEN = 500;
-// Token budget enforcement
+// Graduated token budget enforcement: alert 50%, warn 80%, exceeded 100%
 let cumulativeTokens = 0;
 let cumulativeCost = 0;
-let budgetWarned = false;
+let budgetLevel = 0; // 0=ok, 1=alert(50%), 2=warn(80%), 3=exceeded(100%)
 const TOKEN_BUDGET = parseInt(process.env.TRICKLE_TOKEN_BUDGET || '0', 10);
 const COST_BUDGET = parseFloat(process.env.TRICKLE_COST_BUDGET || '0');
 // Approximate pricing per 1M tokens (USD) — used for cost estimation
@@ -102,16 +102,26 @@ function writeLlmEvent(event) {
     // Track cumulative usage for budget enforcement
     cumulativeTokens += event.totalTokens || 0;
     cumulativeCost += event.estimatedCostUsd || 0;
-    if (!budgetWarned) {
-        if (TOKEN_BUDGET > 0 && cumulativeTokens > TOKEN_BUDGET) {
-            console.warn(`[trickle] ⚠ Token budget exceeded: ${cumulativeTokens} tokens used (budget: ${TOKEN_BUDGET}). Set TRICKLE_TOKEN_BUDGET=0 to disable.`);
-            budgetWarned = true;
+    // Graduated budget: alert at 50%, warn at 80%, exceeded at 100%
+    function checkBudget(current, budget, unit) {
+        if (budget <= 0)
+            return;
+        const pct = current / budget;
+        if (pct >= 1.0 && budgetLevel < 3) {
+            budgetLevel = 3;
+            console.warn(`[trickle] ❌ ${unit} budget EXCEEDED: ${current.toFixed(4)} / ${budget} (100%+). Consider stopping.`);
+        }
+        else if (pct >= 0.8 && budgetLevel < 2) {
+            budgetLevel = 2;
+            console.warn(`[trickle] ⚠ ${unit} budget at 80%: ${current.toFixed(4)} / ${budget}. Approaching limit.`);
         }
-        if (COST_BUDGET > 0 && cumulativeCost > COST_BUDGET) {
-            console.warn(`[trickle] ⚠ Cost budget exceeded: $${cumulativeCost.toFixed(4)} spent (budget: $${COST_BUDGET.toFixed(4)}). Set TRICKLE_COST_BUDGET=0 to disable.`);
-            budgetWarned = true;
+        else if (pct >= 0.5 && budgetLevel < 1) {
+            budgetLevel = 1;
+            console.warn(`[trickle] ℹ ${unit} budget at 50%: ${current.toFixed(4)} / ${budget}.`);
         }
     }
+    checkBudget(cumulativeTokens, TOKEN_BUDGET, 'Token');
+    checkBudget(cumulativeCost, COST_BUDGET, 'Cost ($)');
     try {
         fs.appendFileSync(getLlmFile(), JSON.stringify(event) + '\n');
     }
@@ -486,12 +496,16 @@ function handleAnthropicStream(stream, params, startTime, debug) {
 function captureAnthropicResponse(params, response, startTime, debug) {
     const usage = response.usage || {};
     const outputText = response.content?.map((c) => c.text || '').join('') || '';
+    const cacheRead = usage.cache_read_input_tokens || 0;
+    const cacheWrite = usage.cache_creation_input_tokens || 0;
     const event = {
         kind: 'llm_call', provider: 'anthropic', model: response.model || params.model || 'unknown',
         durationMs: round(performance.now() - startTime),
         inputTokens: usage.input_tokens || 0, outputTokens: usage.output_tokens || 0,
         totalTokens: (usage.input_tokens || 0) + (usage.output_tokens || 0),
         estimatedCostUsd: estimateCost(response.model || params.model || '', usage.input_tokens || 0, usage.output_tokens || 0),
+        ...(cacheRead > 0 ? { cacheReadTokens: cacheRead } : {}),
+        ...(cacheWrite > 0 ? { cacheWriteTokens: cacheWrite } : {}),
         stream: false, finishReason: response.stop_reason || 'unknown',
         temperature: params.temperature, maxTokens: params.max_tokens,
         systemPrompt: typeof params.system === 'string' ? truncate(params.system, 200) : undefined,

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "trickle-observe",
-  "version": "0.2.124",
+  "version": "0.2.126",
   "description": "Zero-code runtime observability for JavaScript/TypeScript. Auto-instruments Express, OpenAI, Anthropic, Gemini, MCP. Captures functions, variables, LLM calls, agent workflows.",
   "main": "dist/index.js",
   "types": "dist/index.d.ts",

package/src/llm-observer.ts CHANGED Viewed

@@ -18,10 +18,10 @@ let eventCount = 0;
 const MAX_LLM_EVENTS = 500;
 const TRUNCATE_LEN = 500;
-// Token budget enforcement
+// Graduated token budget enforcement: alert 50%, warn 80%, exceeded 100%
 let cumulativeTokens = 0;
 let cumulativeCost = 0;
-let budgetWarned = false;
+let budgetLevel = 0; // 0=ok, 1=alert(50%), 2=warn(80%), 3=exceeded(100%)
 const TOKEN_BUDGET = parseInt(process.env.TRICKLE_TOKEN_BUDGET || '0', 10);
 const COST_BUDGET = parseFloat(process.env.TRICKLE_COST_BUDGET || '0');
@@ -67,6 +67,8 @@ interface LlmEvent {
   outputTokens: number;
   totalTokens: number;
   estimatedCostUsd: number;
+  cacheReadTokens?: number;
+  cacheWriteTokens?: number;
   stream: boolean;
   finishReason: string;
   temperature?: number;
@@ -88,16 +90,23 @@ function writeLlmEvent(event: LlmEvent): void {
   cumulativeTokens += event.totalTokens || 0;
   cumulativeCost += event.estimatedCostUsd || 0;
-  if (!budgetWarned) {
-    if (TOKEN_BUDGET > 0 && cumulativeTokens > TOKEN_BUDGET) {
-      console.warn(`[trickle] ⚠ Token budget exceeded: ${cumulativeTokens} tokens used (budget: ${TOKEN_BUDGET}). Set TRICKLE_TOKEN_BUDGET=0 to disable.`);
-      budgetWarned = true;
-    }
-    if (COST_BUDGET > 0 && cumulativeCost > COST_BUDGET) {
-      console.warn(`[trickle] ⚠ Cost budget exceeded: $${cumulativeCost.toFixed(4)} spent (budget: $${COST_BUDGET.toFixed(4)}). Set TRICKLE_COST_BUDGET=0 to disable.`);
-      budgetWarned = true;
+  // Graduated budget: alert at 50%, warn at 80%, exceeded at 100%
+  function checkBudget(current: number, budget: number, unit: string): void {
+    if (budget <= 0) return;
+    const pct = current / budget;
+    if (pct >= 1.0 && budgetLevel < 3) {
+      budgetLevel = 3;
+      console.warn(`[trickle] ❌ ${unit} budget EXCEEDED: ${current.toFixed(4)} / ${budget} (100%+). Consider stopping.`);
+    } else if (pct >= 0.8 && budgetLevel < 2) {
+      budgetLevel = 2;
+      console.warn(`[trickle] ⚠ ${unit} budget at 80%: ${current.toFixed(4)} / ${budget}. Approaching limit.`);
+    } else if (pct >= 0.5 && budgetLevel < 1) {
+      budgetLevel = 1;
+      console.warn(`[trickle] ℹ ${unit} budget at 50%: ${current.toFixed(4)} / ${budget}.`);
     }
   }
+  checkBudget(cumulativeTokens, TOKEN_BUDGET, 'Token');
+  checkBudget(cumulativeCost, COST_BUDGET, 'Cost ($)');
   try {
     fs.appendFileSync(getLlmFile(), JSON.stringify(event) + '\n');
   } catch {}
@@ -479,12 +488,16 @@ function handleAnthropicStream(stream: any, params: any, startTime: number, debu
 function captureAnthropicResponse(params: any, response: any, startTime: number, debug: boolean): void {
   const usage = response.usage || {};
   const outputText = response.content?.map((c: any) => c.text || '').join('') || '';
+  const cacheRead = usage.cache_read_input_tokens || 0;
+  const cacheWrite = usage.cache_creation_input_tokens || 0;
   const event: LlmEvent = {
     kind: 'llm_call', provider: 'anthropic', model: response.model || params.model || 'unknown',
     durationMs: round(performance.now() - startTime),
     inputTokens: usage.input_tokens || 0, outputTokens: usage.output_tokens || 0,
     totalTokens: (usage.input_tokens || 0) + (usage.output_tokens || 0),
     estimatedCostUsd: estimateCost(response.model || params.model || '', usage.input_tokens || 0, usage.output_tokens || 0),
+    ...(cacheRead > 0 ? { cacheReadTokens: cacheRead } : {}),
+    ...(cacheWrite > 0 ? { cacheWriteTokens: cacheWrite } : {}),
     stream: false, finishReason: response.stop_reason || 'unknown',
     temperature: params.temperature, maxTokens: params.max_tokens,
     systemPrompt: typeof params.system === 'string' ? truncate(params.system, 200) : undefined,