npm - caplyr - Versions diffs - 0.2.3 → 0.2.4 - Mend

caplyr 0.2.3 → 0.2.4

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects the differences between package versions as they appear in their respective public registries.

Files changed (3) hide show

package/dist/index.js CHANGED Viewed

@@ -107,6 +107,36 @@ var LogShipper = class {
   }
 };
+// src/mutex.ts
+var Mutex = class { // Promise-based FIFO lock: acquire() resolves to a release function; waiters are served in arrival order.
+  constructor() {
+    this.queue = []; // Pending waiters: callbacks that resolve a blocked acquire() when invoked.
+    this.locked = false; // True while some caller holds the lock.
+  }
+  async acquire() { // Resolves to a release callback once the caller owns the lock.
+    if (!this.locked) {
+      this.locked = true; // Uncontended: take the lock right away.
+      return this.createRelease();
+    }
+    return new Promise((resolve) => { // Contended: park until a release() dequeues this waiter.
+      this.queue.push(() => resolve(this.createRelease()));
+    });
+  }
+  createRelease() { // Builds the release callback for one holder.
+    let released = false; // Per-holder guard so repeated release() calls are no-ops.
+    return () => {
+      if (released) return;
+      released = true;
+      const next = this.queue.shift(); // Oldest waiter first (FIFO).
+      if (next) {
+        next(); // Hand the lock straight to the waiter; `locked` stays true.
+      } else {
+        this.locked = false; // Nobody waiting: unlock.
+      }
+    };
+  }
+};
 // src/heartbeat.ts
 var Heartbeat = class {
   constructor(config) {
@@ -124,6 +154,8 @@ var Heartbeat = class {
     };
     /** Current protection status */
     this.status = "ACTIVE";
+    /** Mutex for serializing budget check → API call → trackSpend */
+    this.budgetMutex = new Mutex();
     /** Local budget limits set via config (not from server) */
     this.localDailyLimit = null;
     this.localMonthlyLimit = null;
@@ -382,18 +414,98 @@ function wrapAnthropic(client, config, shipper, heartbeat) {
               });
             }
           }
-          if (config.mode === "cost_protect") {
-            if (heartbeat.isMonthlyBudgetExceeded() || heartbeat.isDailyBudgetExceeded()) {
-              blocked = true;
-              enforcementReason = heartbeat.isDailyBudgetExceeded() ? "daily_budget_exceeded" : "monthly_budget_exceeded";
-              const blockError = {
-                code: "BUDGET_EXCEEDED",
-                message: `AI budget exceeded. ${enforcementReason.replace(/_/g, " ")}.`,
-                budget_used: heartbeat.budgetStatus.monthly_used,
-                budget_limit: heartbeat.budgetStatus.monthly_limit ?? 0,
-                retry_after: getNextResetTime(enforcementReason),
-                dashboard_url: dashboardUrl
-              };
+          const release = await heartbeat.budgetMutex.acquire();
+          try {
+            if (config.mode === "cost_protect") {
+              if (heartbeat.isMonthlyBudgetExceeded() || heartbeat.isDailyBudgetExceeded()) {
+                blocked = true;
+                enforcementReason = heartbeat.isDailyBudgetExceeded() ? "daily_budget_exceeded" : "monthly_budget_exceeded";
+                const blockError = {
+                  code: "BUDGET_EXCEEDED",
+                  message: `AI budget exceeded. ${enforcementReason.replace(/_/g, " ")}.`,
+                  budget_used: heartbeat.budgetStatus.monthly_used,
+                  budget_limit: heartbeat.budgetStatus.monthly_limit ?? 0,
+                  retry_after: getNextResetTime(enforcementReason),
+                  dashboard_url: dashboardUrl
+                };
+                shipper.push({
+                  id: generateId(),
+                  timestamp: startTime,
+                  provider: "anthropic",
+                  model,
+                  input_tokens: 0,
+                  output_tokens: 0,
+                  cost: 0,
+                  latency_ms: Date.now() - startTime,
+                  endpoint_tag: config.endpoint_tag,
+                  downgraded: false,
+                  blocked: true,
+                  enforcement_reason: enforcementReason
+                });
+                throw Object.assign(new Error(blockError.message), {
+                  caplyr: blockError
+                });
+              }
+              if (heartbeat.isDowngradeThresholdReached(downgradeThreshold)) {
+                const fallback = config.fallback ?? getDefaultFallback(model);
+                if (fallback && fallback !== model) {
+                  originalModel = model;
+                  model = fallback;
+                  downgraded = true;
+                  enforcementReason = "auto_downgrade_threshold";
+                  config.onEnforcement?.({
+                    type: "downgrade",
+                    timestamp: Date.now(),
+                    reason: `Budget at ${Math.round(downgradeThreshold * 100)}% \u2014 downgraded ${originalModel} \u2192 ${model}`,
+                    original_model: originalModel,
+                    fallback_model: model,
+                    budget_used: heartbeat.budgetStatus.monthly_used,
+                    budget_limit: heartbeat.budgetStatus.monthly_limit ?? 0,
+                    estimated_savings: 0
+                    // Calculated after response
+                  });
+                }
+              }
+            }
+            const requestParams = downgraded ? { ...params, model } : params;
+            try {
+              const response = await target.create.call(
+                target,
+                requestParams,
+                options
+              );
+              const latency = Date.now() - startTime;
+              const inputTokens = response?.usage?.input_tokens ?? 0;
+              const outputTokens = response?.usage?.output_tokens ?? 0;
+              const cost = calculateCost(model, inputTokens, outputTokens);
+              heartbeat.trackSpend(cost);
+              let estimatedSavings = 0;
+              if (downgraded && originalModel) {
+                const originalCost = calculateCost(
+                  originalModel,
+                  inputTokens,
+                  outputTokens
+                );
+                estimatedSavings = originalCost - cost;
+              }
+              shipper.push({
+                id: generateId(),
+                timestamp: startTime,
+                provider: "anthropic",
+                model,
+                input_tokens: inputTokens,
+                output_tokens: outputTokens,
+                cost,
+                latency_ms: latency,
+                endpoint_tag: config.endpoint_tag,
+                downgraded,
+                original_model: originalModel,
+                blocked: false,
+                enforcement_reason: enforcementReason
+              });
+              return response;
+            } catch (err) {
+              if (err?.caplyr) throw err;
               shipper.push({
                 id: generateId(),
                 timestamp: startTime,
@@ -404,90 +516,15 @@ function wrapAnthropic(client, config, shipper, heartbeat) {
                 cost: 0,
                 latency_ms: Date.now() - startTime,
                 endpoint_tag: config.endpoint_tag,
-                downgraded: false,
-                blocked: true,
-                enforcement_reason: enforcementReason
-              });
-              throw Object.assign(new Error(blockError.message), {
-                caplyr: blockError
+                downgraded,
+                original_model: originalModel,
+                blocked: false,
+                enforcement_reason: "provider_error"
               });
+              throw err;
             }
-            if (heartbeat.isDowngradeThresholdReached(downgradeThreshold)) {
-              const fallback = config.fallback ?? getDefaultFallback(model);
-              if (fallback && fallback !== model) {
-                originalModel = model;
-                model = fallback;
-                downgraded = true;
-                enforcementReason = "auto_downgrade_threshold";
-                config.onEnforcement?.({
-                  type: "downgrade",
-                  timestamp: Date.now(),
-                  reason: `Budget at ${Math.round(downgradeThreshold * 100)}% \u2014 downgraded ${originalModel} \u2192 ${model}`,
-                  original_model: originalModel,
-                  fallback_model: model,
-                  budget_used: heartbeat.budgetStatus.monthly_used,
-                  budget_limit: heartbeat.budgetStatus.monthly_limit ?? 0,
-                  estimated_savings: 0
-                  // Calculated after response
-                });
-              }
-            }
-          }
-          const requestParams = downgraded ? { ...params, model } : params;
-          try {
-            const response = await target.create.call(
-              target,
-              requestParams,
-              options
-            );
-            const latency = Date.now() - startTime;
-            const inputTokens = response?.usage?.input_tokens ?? 0;
-            const outputTokens = response?.usage?.output_tokens ?? 0;
-            const cost = calculateCost(model, inputTokens, outputTokens);
-            heartbeat.trackSpend(cost);
-            let estimatedSavings = 0;
-            if (downgraded && originalModel) {
-              const originalCost = calculateCost(
-                originalModel,
-                inputTokens,
-                outputTokens
-              );
-              estimatedSavings = originalCost - cost;
-            }
-            shipper.push({
-              id: generateId(),
-              timestamp: startTime,
-              provider: "anthropic",
-              model,
-              input_tokens: inputTokens,
-              output_tokens: outputTokens,
-              cost,
-              latency_ms: latency,
-              endpoint_tag: config.endpoint_tag,
-              downgraded,
-              original_model: originalModel,
-              blocked: false,
-              enforcement_reason: enforcementReason
-            });
-            return response;
-          } catch (err) {
-            if (err?.caplyr) throw err;
-            shipper.push({
-              id: generateId(),
-              timestamp: startTime,
-              provider: "anthropic",
-              model,
-              input_tokens: 0,
-              output_tokens: 0,
-              cost: 0,
-              latency_ms: Date.now() - startTime,
-              endpoint_tag: config.endpoint_tag,
-              downgraded,
-              original_model: originalModel,
-              blocked: false,
-              enforcement_reason: "provider_error"
-            });
-            throw err;
+          } finally {
+            release();
           }
         };
       }
@@ -564,18 +601,89 @@ function wrapOpenAI(client, config, shipper, heartbeat) {
               });
             }
           }
-          if (config.mode === "cost_protect") {
-            if (heartbeat.isMonthlyBudgetExceeded() || heartbeat.isDailyBudgetExceeded()) {
-              blocked = true;
-              enforcementReason = heartbeat.isDailyBudgetExceeded() ? "daily_budget_exceeded" : "monthly_budget_exceeded";
-              const blockError = {
-                code: "BUDGET_EXCEEDED",
-                message: `AI budget exceeded. ${enforcementReason.replace(/_/g, " ")}.`,
-                budget_used: heartbeat.budgetStatus.monthly_used,
-                budget_limit: heartbeat.budgetStatus.monthly_limit ?? 0,
-                retry_after: getNextResetTime2(enforcementReason),
-                dashboard_url: dashboardUrl
-              };
+          const release = await heartbeat.budgetMutex.acquire();
+          try {
+            if (config.mode === "cost_protect") {
+              if (heartbeat.isMonthlyBudgetExceeded() || heartbeat.isDailyBudgetExceeded()) {
+                blocked = true;
+                enforcementReason = heartbeat.isDailyBudgetExceeded() ? "daily_budget_exceeded" : "monthly_budget_exceeded";
+                const blockError = {
+                  code: "BUDGET_EXCEEDED",
+                  message: `AI budget exceeded. ${enforcementReason.replace(/_/g, " ")}.`,
+                  budget_used: heartbeat.budgetStatus.monthly_used,
+                  budget_limit: heartbeat.budgetStatus.monthly_limit ?? 0,
+                  retry_after: getNextResetTime2(enforcementReason),
+                  dashboard_url: dashboardUrl
+                };
+                shipper.push({
+                  id: generateId2(),
+                  timestamp: startTime,
+                  provider: "openai",
+                  model,
+                  input_tokens: 0,
+                  output_tokens: 0,
+                  cost: 0,
+                  latency_ms: Date.now() - startTime,
+                  endpoint_tag: config.endpoint_tag,
+                  downgraded: false,
+                  blocked: true,
+                  enforcement_reason: enforcementReason
+                });
+                throw Object.assign(new Error(blockError.message), {
+                  caplyr: blockError
+                });
+              }
+              if (heartbeat.isDowngradeThresholdReached(downgradeThreshold)) {
+                const fallback = config.fallback ?? getDefaultFallback(model);
+                if (fallback && fallback !== model) {
+                  originalModel = model;
+                  model = fallback;
+                  downgraded = true;
+                  enforcementReason = "auto_downgrade_threshold";
+                  config.onEnforcement?.({
+                    type: "downgrade",
+                    timestamp: Date.now(),
+                    reason: `Budget at ${Math.round(downgradeThreshold * 100)}% \u2014 downgraded ${originalModel} \u2192 ${model}`,
+                    original_model: originalModel,
+                    fallback_model: model,
+                    budget_used: heartbeat.budgetStatus.monthly_used,
+                    budget_limit: heartbeat.budgetStatus.monthly_limit ?? 0,
+                    estimated_savings: 0
+                  });
+                }
+              }
+            }
+            const requestParams = downgraded ? { ...params, model } : params;
+            try {
+              const response = await target.create.call(
+                target,
+                requestParams,
+                options
+              );
+              const latency = Date.now() - startTime;
+              const usage = response?.usage;
+              const inputTokens = usage?.prompt_tokens ?? 0;
+              const outputTokens = usage?.completion_tokens ?? 0;
+              const cost = calculateCost(model, inputTokens, outputTokens);
+              heartbeat.trackSpend(cost);
+              shipper.push({
+                id: generateId2(),
+                timestamp: startTime,
+                provider: "openai",
+                model,
+                input_tokens: inputTokens,
+                output_tokens: outputTokens,
+                cost,
+                latency_ms: latency,
+                endpoint_tag: config.endpoint_tag,
+                downgraded,
+                original_model: originalModel,
+                blocked: false,
+                enforcement_reason: enforcementReason
+              });
+              return response;
+            } catch (err) {
+              if (err?.caplyr) throw err;
               shipper.push({
                 id: generateId2(),
                 timestamp: startTime,
@@ -586,81 +694,15 @@ function wrapOpenAI(client, config, shipper, heartbeat) {
                 cost: 0,
                 latency_ms: Date.now() - startTime,
                 endpoint_tag: config.endpoint_tag,
-                downgraded: false,
-                blocked: true,
-                enforcement_reason: enforcementReason
-              });
-              throw Object.assign(new Error(blockError.message), {
-                caplyr: blockError
+                downgraded,
+                original_model: originalModel,
+                blocked: false,
+                enforcement_reason: "provider_error"
               });
+              throw err;
             }
-            if (heartbeat.isDowngradeThresholdReached(downgradeThreshold)) {
-              const fallback = config.fallback ?? getDefaultFallback(model);
-              if (fallback && fallback !== model) {
-                originalModel = model;
-                model = fallback;
-                downgraded = true;
-                enforcementReason = "auto_downgrade_threshold";
-                config.onEnforcement?.({
-                  type: "downgrade",
-                  timestamp: Date.now(),
-                  reason: `Budget at ${Math.round(downgradeThreshold * 100)}% \u2014 downgraded ${originalModel} \u2192 ${model}`,
-                  original_model: originalModel,
-                  fallback_model: model,
-                  budget_used: heartbeat.budgetStatus.monthly_used,
-                  budget_limit: heartbeat.budgetStatus.monthly_limit ?? 0,
-                  estimated_savings: 0
-                });
-              }
-            }
-          }
-          const requestParams = downgraded ? { ...params, model } : params;
-          try {
-            const response = await target.create.call(
-              target,
-              requestParams,
-              options
-            );
-            const latency = Date.now() - startTime;
-            const usage = response?.usage;
-            const inputTokens = usage?.prompt_tokens ?? 0;
-            const outputTokens = usage?.completion_tokens ?? 0;
-            const cost = calculateCost(model, inputTokens, outputTokens);
-            heartbeat.trackSpend(cost);
-            shipper.push({
-              id: generateId2(),
-              timestamp: startTime,
-              provider: "openai",
-              model,
-              input_tokens: inputTokens,
-              output_tokens: outputTokens,
-              cost,
-              latency_ms: latency,
-              endpoint_tag: config.endpoint_tag,
-              downgraded,
-              original_model: originalModel,
-              blocked: false,
-              enforcement_reason: enforcementReason
-            });
-            return response;
-          } catch (err) {
-            if (err?.caplyr) throw err;
-            shipper.push({
-              id: generateId2(),
-              timestamp: startTime,
-              provider: "openai",
-              model,
-              input_tokens: 0,
-              output_tokens: 0,
-              cost: 0,
-              latency_ms: Date.now() - startTime,
-              endpoint_tag: config.endpoint_tag,
-              downgraded,
-              original_model: originalModel,
-              blocked: false,
-              enforcement_reason: "provider_error"
-            });
-            throw err;
+          } finally {
+            release();
           }
         };
       }

package/dist/index.mjs CHANGED Viewed

@@ -74,6 +74,36 @@ var LogShipper = class {
   }
 };
+// src/mutex.ts
+var Mutex = class { // Promise-based FIFO lock: acquire() resolves to a release function; waiters are served in arrival order.
+  constructor() {
+    this.queue = []; // Pending waiters: callbacks that resolve a blocked acquire() when invoked.
+    this.locked = false; // True while some caller holds the lock.
+  }
+  async acquire() { // Resolves to a release callback once the caller owns the lock.
+    if (!this.locked) {
+      this.locked = true; // Uncontended: take the lock right away.
+      return this.createRelease();
+    }
+    return new Promise((resolve) => { // Contended: park until a release() dequeues this waiter.
+      this.queue.push(() => resolve(this.createRelease()));
+    });
+  }
+  createRelease() { // Builds the release callback for one holder.
+    let released = false; // Per-holder guard so repeated release() calls are no-ops.
+    return () => {
+      if (released) return;
+      released = true;
+      const next = this.queue.shift(); // Oldest waiter first (FIFO).
+      if (next) {
+        next(); // Hand the lock straight to the waiter; `locked` stays true.
+      } else {
+        this.locked = false; // Nobody waiting: unlock.
+      }
+    };
+  }
+};
 // src/heartbeat.ts
 var Heartbeat = class {
   constructor(config) {
@@ -91,6 +121,8 @@ var Heartbeat = class {
     };
     /** Current protection status */
     this.status = "ACTIVE";
+    /** Mutex for serializing budget check → API call → trackSpend */
+    this.budgetMutex = new Mutex();
     /** Local budget limits set via config (not from server) */
     this.localDailyLimit = null;
     this.localMonthlyLimit = null;
@@ -349,18 +381,98 @@ function wrapAnthropic(client, config, shipper, heartbeat) {
               });
             }
           }
-          if (config.mode === "cost_protect") {
-            if (heartbeat.isMonthlyBudgetExceeded() || heartbeat.isDailyBudgetExceeded()) {
-              blocked = true;
-              enforcementReason = heartbeat.isDailyBudgetExceeded() ? "daily_budget_exceeded" : "monthly_budget_exceeded";
-              const blockError = {
-                code: "BUDGET_EXCEEDED",
-                message: `AI budget exceeded. ${enforcementReason.replace(/_/g, " ")}.`,
-                budget_used: heartbeat.budgetStatus.monthly_used,
-                budget_limit: heartbeat.budgetStatus.monthly_limit ?? 0,
-                retry_after: getNextResetTime(enforcementReason),
-                dashboard_url: dashboardUrl
-              };
+          const release = await heartbeat.budgetMutex.acquire();
+          try {
+            if (config.mode === "cost_protect") {
+              if (heartbeat.isMonthlyBudgetExceeded() || heartbeat.isDailyBudgetExceeded()) {
+                blocked = true;
+                enforcementReason = heartbeat.isDailyBudgetExceeded() ? "daily_budget_exceeded" : "monthly_budget_exceeded";
+                const blockError = {
+                  code: "BUDGET_EXCEEDED",
+                  message: `AI budget exceeded. ${enforcementReason.replace(/_/g, " ")}.`,
+                  budget_used: heartbeat.budgetStatus.monthly_used,
+                  budget_limit: heartbeat.budgetStatus.monthly_limit ?? 0,
+                  retry_after: getNextResetTime(enforcementReason),
+                  dashboard_url: dashboardUrl
+                };
+                shipper.push({
+                  id: generateId(),
+                  timestamp: startTime,
+                  provider: "anthropic",
+                  model,
+                  input_tokens: 0,
+                  output_tokens: 0,
+                  cost: 0,
+                  latency_ms: Date.now() - startTime,
+                  endpoint_tag: config.endpoint_tag,
+                  downgraded: false,
+                  blocked: true,
+                  enforcement_reason: enforcementReason
+                });
+                throw Object.assign(new Error(blockError.message), {
+                  caplyr: blockError
+                });
+              }
+              if (heartbeat.isDowngradeThresholdReached(downgradeThreshold)) {
+                const fallback = config.fallback ?? getDefaultFallback(model);
+                if (fallback && fallback !== model) {
+                  originalModel = model;
+                  model = fallback;
+                  downgraded = true;
+                  enforcementReason = "auto_downgrade_threshold";
+                  config.onEnforcement?.({
+                    type: "downgrade",
+                    timestamp: Date.now(),
+                    reason: `Budget at ${Math.round(downgradeThreshold * 100)}% \u2014 downgraded ${originalModel} \u2192 ${model}`,
+                    original_model: originalModel,
+                    fallback_model: model,
+                    budget_used: heartbeat.budgetStatus.monthly_used,
+                    budget_limit: heartbeat.budgetStatus.monthly_limit ?? 0,
+                    estimated_savings: 0
+                    // Calculated after response
+                  });
+                }
+              }
+            }
+            const requestParams = downgraded ? { ...params, model } : params;
+            try {
+              const response = await target.create.call(
+                target,
+                requestParams,
+                options
+              );
+              const latency = Date.now() - startTime;
+              const inputTokens = response?.usage?.input_tokens ?? 0;
+              const outputTokens = response?.usage?.output_tokens ?? 0;
+              const cost = calculateCost(model, inputTokens, outputTokens);
+              heartbeat.trackSpend(cost);
+              let estimatedSavings = 0;
+              if (downgraded && originalModel) {
+                const originalCost = calculateCost(
+                  originalModel,
+                  inputTokens,
+                  outputTokens
+                );
+                estimatedSavings = originalCost - cost;
+              }
+              shipper.push({
+                id: generateId(),
+                timestamp: startTime,
+                provider: "anthropic",
+                model,
+                input_tokens: inputTokens,
+                output_tokens: outputTokens,
+                cost,
+                latency_ms: latency,
+                endpoint_tag: config.endpoint_tag,
+                downgraded,
+                original_model: originalModel,
+                blocked: false,
+                enforcement_reason: enforcementReason
+              });
+              return response;
+            } catch (err) {
+              if (err?.caplyr) throw err;
               shipper.push({
                 id: generateId(),
                 timestamp: startTime,
@@ -371,90 +483,15 @@ function wrapAnthropic(client, config, shipper, heartbeat) {
                 cost: 0,
                 latency_ms: Date.now() - startTime,
                 endpoint_tag: config.endpoint_tag,
-                downgraded: false,
-                blocked: true,
-                enforcement_reason: enforcementReason
-              });
-              throw Object.assign(new Error(blockError.message), {
-                caplyr: blockError
+                downgraded,
+                original_model: originalModel,
+                blocked: false,
+                enforcement_reason: "provider_error"
               });
+              throw err;
             }
-            if (heartbeat.isDowngradeThresholdReached(downgradeThreshold)) {
-              const fallback = config.fallback ?? getDefaultFallback(model);
-              if (fallback && fallback !== model) {
-                originalModel = model;
-                model = fallback;
-                downgraded = true;
-                enforcementReason = "auto_downgrade_threshold";
-                config.onEnforcement?.({
-                  type: "downgrade",
-                  timestamp: Date.now(),
-                  reason: `Budget at ${Math.round(downgradeThreshold * 100)}% \u2014 downgraded ${originalModel} \u2192 ${model}`,
-                  original_model: originalModel,
-                  fallback_model: model,
-                  budget_used: heartbeat.budgetStatus.monthly_used,
-                  budget_limit: heartbeat.budgetStatus.monthly_limit ?? 0,
-                  estimated_savings: 0
-                  // Calculated after response
-                });
-              }
-            }
-          }
-          const requestParams = downgraded ? { ...params, model } : params;
-          try {
-            const response = await target.create.call(
-              target,
-              requestParams,
-              options
-            );
-            const latency = Date.now() - startTime;
-            const inputTokens = response?.usage?.input_tokens ?? 0;
-            const outputTokens = response?.usage?.output_tokens ?? 0;
-            const cost = calculateCost(model, inputTokens, outputTokens);
-            heartbeat.trackSpend(cost);
-            let estimatedSavings = 0;
-            if (downgraded && originalModel) {
-              const originalCost = calculateCost(
-                originalModel,
-                inputTokens,
-                outputTokens
-              );
-              estimatedSavings = originalCost - cost;
-            }
-            shipper.push({
-              id: generateId(),
-              timestamp: startTime,
-              provider: "anthropic",
-              model,
-              input_tokens: inputTokens,
-              output_tokens: outputTokens,
-              cost,
-              latency_ms: latency,
-              endpoint_tag: config.endpoint_tag,
-              downgraded,
-              original_model: originalModel,
-              blocked: false,
-              enforcement_reason: enforcementReason
-            });
-            return response;
-          } catch (err) {
-            if (err?.caplyr) throw err;
-            shipper.push({
-              id: generateId(),
-              timestamp: startTime,
-              provider: "anthropic",
-              model,
-              input_tokens: 0,
-              output_tokens: 0,
-              cost: 0,
-              latency_ms: Date.now() - startTime,
-              endpoint_tag: config.endpoint_tag,
-              downgraded,
-              original_model: originalModel,
-              blocked: false,
-              enforcement_reason: "provider_error"
-            });
-            throw err;
+          } finally {
+            release();
           }
         };
       }
@@ -531,18 +568,89 @@ function wrapOpenAI(client, config, shipper, heartbeat) {
               });
             }
           }
-          if (config.mode === "cost_protect") {
-            if (heartbeat.isMonthlyBudgetExceeded() || heartbeat.isDailyBudgetExceeded()) {
-              blocked = true;
-              enforcementReason = heartbeat.isDailyBudgetExceeded() ? "daily_budget_exceeded" : "monthly_budget_exceeded";
-              const blockError = {
-                code: "BUDGET_EXCEEDED",
-                message: `AI budget exceeded. ${enforcementReason.replace(/_/g, " ")}.`,
-                budget_used: heartbeat.budgetStatus.monthly_used,
-                budget_limit: heartbeat.budgetStatus.monthly_limit ?? 0,
-                retry_after: getNextResetTime2(enforcementReason),
-                dashboard_url: dashboardUrl
-              };
+          const release = await heartbeat.budgetMutex.acquire();
+          try {
+            if (config.mode === "cost_protect") {
+              if (heartbeat.isMonthlyBudgetExceeded() || heartbeat.isDailyBudgetExceeded()) {
+                blocked = true;
+                enforcementReason = heartbeat.isDailyBudgetExceeded() ? "daily_budget_exceeded" : "monthly_budget_exceeded";
+                const blockError = {
+                  code: "BUDGET_EXCEEDED",
+                  message: `AI budget exceeded. ${enforcementReason.replace(/_/g, " ")}.`,
+                  budget_used: heartbeat.budgetStatus.monthly_used,
+                  budget_limit: heartbeat.budgetStatus.monthly_limit ?? 0,
+                  retry_after: getNextResetTime2(enforcementReason),
+                  dashboard_url: dashboardUrl
+                };
+                shipper.push({
+                  id: generateId2(),
+                  timestamp: startTime,
+                  provider: "openai",
+                  model,
+                  input_tokens: 0,
+                  output_tokens: 0,
+                  cost: 0,
+                  latency_ms: Date.now() - startTime,
+                  endpoint_tag: config.endpoint_tag,
+                  downgraded: false,
+                  blocked: true,
+                  enforcement_reason: enforcementReason
+                });
+                throw Object.assign(new Error(blockError.message), {
+                  caplyr: blockError
+                });
+              }
+              if (heartbeat.isDowngradeThresholdReached(downgradeThreshold)) {
+                const fallback = config.fallback ?? getDefaultFallback(model);
+                if (fallback && fallback !== model) {
+                  originalModel = model;
+                  model = fallback;
+                  downgraded = true;
+                  enforcementReason = "auto_downgrade_threshold";
+                  config.onEnforcement?.({
+                    type: "downgrade",
+                    timestamp: Date.now(),
+                    reason: `Budget at ${Math.round(downgradeThreshold * 100)}% \u2014 downgraded ${originalModel} \u2192 ${model}`,
+                    original_model: originalModel,
+                    fallback_model: model,
+                    budget_used: heartbeat.budgetStatus.monthly_used,
+                    budget_limit: heartbeat.budgetStatus.monthly_limit ?? 0,
+                    estimated_savings: 0
+                  });
+                }
+              }
+            }
+            const requestParams = downgraded ? { ...params, model } : params;
+            try {
+              const response = await target.create.call(
+                target,
+                requestParams,
+                options
+              );
+              const latency = Date.now() - startTime;
+              const usage = response?.usage;
+              const inputTokens = usage?.prompt_tokens ?? 0;
+              const outputTokens = usage?.completion_tokens ?? 0;
+              const cost = calculateCost(model, inputTokens, outputTokens);
+              heartbeat.trackSpend(cost);
+              shipper.push({
+                id: generateId2(),
+                timestamp: startTime,
+                provider: "openai",
+                model,
+                input_tokens: inputTokens,
+                output_tokens: outputTokens,
+                cost,
+                latency_ms: latency,
+                endpoint_tag: config.endpoint_tag,
+                downgraded,
+                original_model: originalModel,
+                blocked: false,
+                enforcement_reason: enforcementReason
+              });
+              return response;
+            } catch (err) {
+              if (err?.caplyr) throw err;
               shipper.push({
                 id: generateId2(),
                 timestamp: startTime,
@@ -553,81 +661,15 @@ function wrapOpenAI(client, config, shipper, heartbeat) {
                 cost: 0,
                 latency_ms: Date.now() - startTime,
                 endpoint_tag: config.endpoint_tag,
-                downgraded: false,
-                blocked: true,
-                enforcement_reason: enforcementReason
-              });
-              throw Object.assign(new Error(blockError.message), {
-                caplyr: blockError
+                downgraded,
+                original_model: originalModel,
+                blocked: false,
+                enforcement_reason: "provider_error"
               });
+              throw err;
             }
-            if (heartbeat.isDowngradeThresholdReached(downgradeThreshold)) {
-              const fallback = config.fallback ?? getDefaultFallback(model);
-              if (fallback && fallback !== model) {
-                originalModel = model;
-                model = fallback;
-                downgraded = true;
-                enforcementReason = "auto_downgrade_threshold";
-                config.onEnforcement?.({
-                  type: "downgrade",
-                  timestamp: Date.now(),
-                  reason: `Budget at ${Math.round(downgradeThreshold * 100)}% \u2014 downgraded ${originalModel} \u2192 ${model}`,
-                  original_model: originalModel,
-                  fallback_model: model,
-                  budget_used: heartbeat.budgetStatus.monthly_used,
-                  budget_limit: heartbeat.budgetStatus.monthly_limit ?? 0,
-                  estimated_savings: 0
-                });
-              }
-            }
-          }
-          const requestParams = downgraded ? { ...params, model } : params;
-          try {
-            const response = await target.create.call(
-              target,
-              requestParams,
-              options
-            );
-            const latency = Date.now() - startTime;
-            const usage = response?.usage;
-            const inputTokens = usage?.prompt_tokens ?? 0;
-            const outputTokens = usage?.completion_tokens ?? 0;
-            const cost = calculateCost(model, inputTokens, outputTokens);
-            heartbeat.trackSpend(cost);
-            shipper.push({
-              id: generateId2(),
-              timestamp: startTime,
-              provider: "openai",
-              model,
-              input_tokens: inputTokens,
-              output_tokens: outputTokens,
-              cost,
-              latency_ms: latency,
-              endpoint_tag: config.endpoint_tag,
-              downgraded,
-              original_model: originalModel,
-              blocked: false,
-              enforcement_reason: enforcementReason
-            });
-            return response;
-          } catch (err) {
-            if (err?.caplyr) throw err;
-            shipper.push({
-              id: generateId2(),
-              timestamp: startTime,
-              provider: "openai",
-              model,
-              input_tokens: 0,
-              output_tokens: 0,
-              cost: 0,
-              latency_ms: Date.now() - startTime,
-              endpoint_tag: config.endpoint_tag,
-              downgraded,
-              original_model: originalModel,
-              blocked: false,
-              enforcement_reason: "provider_error"
-            });
-            throw err;
+          } finally {
+            release();
           }
         };
       }

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "caplyr",
-  "version": "0.2.3",
+  "version": "0.2.4",
   "description": "AI Cost Control Plane — budget guardrails, auto-downgrade, and kill switch for AI API calls",
   "main": "dist/index.js",
   "module": "dist/index.mjs",