npm - wolverine-ai - Versions diffs - 3.7.4 → 3.7.6 - Mend

wolverine-ai 3.7.4 → 3.7.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (3) hide show

package/package.json +1 -1
package/src/core/ai-client.js +19 -5
package/src/notifications/notifier.js +7 -1

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "wolverine-ai",
-  "version": "3.7.4",
+  "version": "3.7.6",
   "description": "Self-healing Node.js server framework powered by AI. Catches crashes, diagnoses errors, generates fixes, verifies, and restarts — automatically.",
   "main": "src/index.js",
   "bin": {

package/src/core/ai-client.js CHANGED Viewed

@@ -42,13 +42,14 @@ function getClient(provider) {
 function _getWolverineClient() {
   if (!_wolverineClient) {
-    // Wolverine inference: direct to GPU or via proxy
-    // WOLVERINE_GPU_KEY = internal key for direct GPU access (llama.cpp --api-key)
-    // WOLVERINE_API_KEY = user key for billed proxy access (api.wolverinenode.xyz)
+    // Wolverine inference: always route through billing proxy when API key is set.
+    // WOLVERINE_API_KEY = billed API key (credits deducted per call)
+    // WOLVERINE_GPU_KEY = direct GPU access (no billing, admin/internal only)
+    // Priority: API_KEY (billed) > GPU_KEY (direct) — billing is the default path
+    const apiKey = process.env.WOLVERINE_API_KEY || process.env.WOLVERINE_GPU_KEY || "none";
     const baseURL = process.env.WOLVERINE_INFERENCE_URL
       ? process.env.WOLVERINE_INFERENCE_URL + "/v1"
       : "https://api.wolverinenode.xyz/v1";
-    const apiKey = process.env.WOLVERINE_GPU_KEY || process.env.WOLVERINE_API_KEY || "none";
     _wolverineClient = new OpenAI({ apiKey, baseURL });
   }
   return _wolverineClient;
@@ -169,7 +170,20 @@ async function _withRetry(fn, maxRetries = 3) {
     try {
       return await fn();
     } catch (err) {
-      const isRateLimit = err.status === 429 || err.code === "rate_limit_exceeded";
+      const msg = (err.message || "").toLowerCase();
+      const code = (err.code || "").toLowerCase();
+      // Permanent billing/quota errors — never retry, surface immediately
+      const isBillingError = err.status === 402
+        || /insufficient.*(quota|credits|funds)/i.test(msg)
+        || /billing_hard_limit|insufficient_quota|quota_exceeded/i.test(msg)
+        || /billing_hard_limit|insufficient_quota|quota_exceeded/i.test(code);
+      if (isBillingError) {
+        console.log(chalk.red(`  💳 Billing error (not retrying): ${err.message}`));
+        throw err;
+      }
+      const isRateLimit = err.status === 429 || code === "rate_limit_exceeded";
       const isServerError = err.status >= 500;
       if ((isRateLimit || isServerError) && attempt < maxRetries) {
         const delay = Math.min(1000 * Math.pow(2, attempt) + Math.random() * 1000, 30000);

package/src/notifications/notifier.js CHANGED Viewed

@@ -29,11 +29,17 @@ const HUMAN_REQUIRED_PATTERNS = [
   { pattern: /(api|auth|token|key|credential).*(expired|revoked|rotated|invalid)/i, category: "auth", hint: "Credential has expired or been revoked" },
   { pattern: /authentication\s+failed/i, category: "auth", hint: "Authentication failed — check credentials" },
-  // Billing/Quota
+  // Billing/Quota — covers OpenAI, Anthropic, Wolverine, and generic patterns
   { pattern: /429\s*(too many|rate limit)/i, category: "billing", hint: "Rate limit hit — may need to upgrade plan or wait" },
   { pattern: /(quota|limit|credits?)\s*(exceeded|exhausted|depleted)/i, category: "billing", hint: "Usage quota or credits exhausted" },
   { pattern: /billing.*(?:issue|error|failed|inactive)/i, category: "billing", hint: "Billing issue on the account" },
   { pattern: /insufficient.*(funds|credits|quota)/i, category: "billing", hint: "Insufficient credits or funds" },
+  { pattern: /billing_hard_limit_reached/i, category: "billing", hint: "OpenAI billing hard limit reached — add payment method or raise limit" },
+  { pattern: /insufficient_quota/i, category: "billing", hint: "API quota exhausted — check billing dashboard" },
+  { pattern: /rate_limit_exceeded/i, category: "billing", hint: "API rate limit exceeded — wait or upgrade plan" },
+  { pattern: /402\s*(payment|required)/i, category: "billing", hint: "Payment required — check billing status" },
+  { pattern: /exceeded.*(?:budget|spending|token)/i, category: "billing", hint: "Spending or token budget exceeded" },
+  { pattern: /overloaded_error/i, category: "billing", hint: "Anthropic API overloaded — retry later" },
   // External service failures
   { pattern: /ECONNREFUSED/i, category: "service", hint: "External service connection refused — is it running?" },