npm - wolverine-ai - Versions diffs - 3.7.6 → 3.7.8 - Mend

wolverine-ai 3.7.6 → 3.7.8

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (6) hide show

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "wolverine-ai",
-  "version": "3.7.6",
+  "version": "3.7.8",
   "description": "Self-healing Node.js server framework powered by AI. Catches crashes, diagnoses errors, generates fixes, verifies, and restarts — automatically.",
   "main": "src/index.js",
   "bin": {

package/src/agent/agent-engine.js CHANGED Viewed

@@ -331,6 +331,7 @@ class AgentEngine {
     this.logger = options.logger;
     this.cwd = options.cwd || process.cwd();
     this.mcp = options.mcp || null; // McpRegistry for external tools
+    this.category = options.category || "tool"; // Analytics category for token tracking
     // Budget constraints (claw-code: QueryEngineConfig)
     this.maxTurns = options.maxTurns || 15;
@@ -422,6 +423,7 @@ class AgentEngine {
             messages: this.messages,
             tools: allTools,
             maxTokens: 4096,
+            category: this.category,
           }),
           new Promise((_, reject) => setTimeout(() => reject(new Error(`AI call timed out after ${AI_CALL_TIMEOUT_MS / 1000}s`)), AI_CALL_TIMEOUT_MS)),
         ]);

package/src/agent/sub-agents.js CHANGED Viewed

@@ -97,6 +97,8 @@ async function spawnAgent(type, task, options = {}) {
     });
   }
+  // Map sub-agent type to analytics category: triage agents = classifier, fix/db = coding
+  const categoryMap = { explore: "classifier", plan: "classifier", verify: "classifier", research: "research", fix: "coding", database: "coding", security: "audit" };
   const agent = new AgentEngine({
     sandbox: options.sandbox,
     logger: options.logger,
@@ -104,6 +106,7 @@ async function spawnAgent(type, task, options = {}) {
     mcp: options.mcp,
     maxTurns: config.maxTurns,
     maxTokens: config.maxTokens,
+    category: categoryMap[type] || "tool",
   });
   // Override the system prompt for this agent type

package/src/brain/brain.js CHANGED Viewed

@@ -114,7 +114,7 @@ const SEED_DOCS = [
     metadata: { topic: "sub-agent-tools" },
   },
   {
-    text: "Heal pipeline escalation with cost optimization: Iteration 1 uses fast path (CODING_MODEL). For simple errors (TypeError/ReferenceError/SyntaxError), verifier trusts syntax+boot and skips route probe — ErrorMonitor is safety net. This prevents false-rejection cascades that waste tokens. Iteration 2 uses single agent (REASONING_MODEL, 4 turns for simple errors, 8 for complex). Iteration 3+ uses sub-agents with Haiku for triage (explore/plan/verify/research use classifier model) and only fixer uses coding model — 90% cheaper. Token budgets capped by error complexity: simple=20K, moderate=50K, complex=100K. Context compacted every 3 agent turns to prevent token blowup (95K→20K). Prior attempt summaries passed between iterations instead of full context. Brain checked for cached fix patterns before starting AI.",
+    text: "Heal pipeline escalation with cost optimization: Iteration 1 uses fast path (CODING_MODEL, tracked as 'coding' category). For simple errors (TypeError/ReferenceError/SyntaxError), verifier trusts syntax+boot and skips route probe — ErrorMonitor is safety net. Iteration 2 uses single agent (REASONING_MODEL, 4 turns for simple, 8 for complex, tracked as 'tool' category). Iteration 3+ uses sub-agents: explore/plan/verify use classifier model (tracked as 'classifier'), fixer uses coding model (tracked as 'coding'), research sub-agent tracked as 'research', security as 'audit'. All calls billed through unified credit system — framework authenticates as a normal API user via WOLVERINE_API_KEY through the billing proxy. Billing errors (402, insufficient_quota) immediately stop healing, no token waste.",
     metadata: { topic: "heal-escalation" },
   },
   {
@@ -146,7 +146,7 @@ const SEED_DOCS = [
     metadata: { topic: "fastify" },
   },
   {
-    text: "npm package: wolverine-ai on npmjs.com. Install: npm i wolverine-ai. CLI: npx wolverine server/index.js. v1.0.0, 79 files, 125KB compressed. Includes src/, bin/, server/, examples/. GitHub: https://github.com/bobbyswhip/Wolverine",
+    text: "npm package: wolverine-ai on npmjs.com (v3.7.7). Install: npm i wolverine-ai. CLI: npx wolverine server/index.js. 85 files, 190KB compressed. Includes src/, bin/, examples/. Server directory created from src/templates/server/ on first run (never overwritten). GitHub: https://github.com/bobbyswhip/Wolverine. Unified billing: all AI calls route through inference proxy with credit-based billing. WOLVERINE_API_KEY authenticates through billing proxy, WOLVERINE_GPU_KEY for direct GPU access. 3 providers: openai, anthropic, wolverine (self-hosted GPU via Vast.ai).",
     metadata: { topic: "npm-package" },
   },
   {
@@ -162,7 +162,7 @@ const SEED_DOCS = [
     metadata: { topic: "smart-edit" },
   },
   {
-    text: "Token tracking: every AI call tracked with input/output tokens, USD cost, latencyMs, and success/failure. Per-model KPIs: avgLatencyMs, minLatencyMs, maxLatencyMs, tokensPerSecond, successRate, costPerCall, successes, failures. Aggregated by model, by category, by tool, by provider (openai/anthropic). Persisted to .wolverine/usage.json + .wolverine/usage-history.jsonl. Pricing includes both OpenAI (gpt-5.x, o4, codex) and Anthropic (opus-4, sonnet-4, haiku-4) families. Customizable via .wolverine/pricing.json. Telemetry sends all per-model performance data to platform backend for fleet-wide cost:speed:reliability analysis.",
+    text: "Token tracking: every AI call tracked with input/output tokens, USD cost, latencyMs, and success/failure. Per-model KPIs: avgLatencyMs, minLatencyMs, maxLatencyMs, tokensPerSecond, successRate, costPerCall, successes, failures. Aggregated by model, by category, by tool, by provider (openai/anthropic/wolverine). 9 analytics categories match the 9 settings.json model roles: reasoning (deep debugging), coding (fast path repair + fix sub-agents), chat (dashboard), tool (main agent with tool use), classifier (triage sub-agents: explore/plan/verify), audit (injection scan + security sub-agent), compacting (brain text compression), research (research agent + research sub-agent), embedding (brain vector embeddings). All categories tracked in byModelCategory cross-reference for per-task model comparison. Persisted to .wolverine/usage.json + .wolverine/usage-history.jsonl. Telemetry sends all per-model performance data to platform backend for fleet-wide analytics.",
     metadata: { topic: "token-tracking" },
   },
   {

package/src/brain/embedder.js CHANGED Viewed

@@ -1,4 +1,4 @@
-const { getClient, aiCall, detectProvider } = require("../core/ai-client");
+const { getClient, aiCall, detectProvider, _trackEmbedding } = require("../core/ai-client");
 const { getModel } = require("../core/models");
 /**
@@ -45,12 +45,14 @@ async function embed(text) {
   const openai = getClient("openai");
   const model = getModel("embedding");
+  const startMs = Date.now();
   const response = await openai.embeddings.create({
     model,
     input: text,
   });
   const embedding = response.data[0].embedding;
+  _trackEmbedding(model, response.usage, Date.now() - startMs, true);
   _cacheSet(text, embedding);
   return embedding;
 }
@@ -83,10 +85,12 @@ async function embedBatch(texts) {
   const openai = getClient("openai");
   const model = getModel("embedding");
+  const startMs = Date.now();
   const response = await openai.embeddings.create({
     model,
     input: uncached,
   });
+  _trackEmbedding(model, response.usage, Date.now() - startMs, true);
   // Sort by index to maintain order
   const sorted = response.data.sort((a, b) => a.index - b.index);

package/src/core/ai-client.js CHANGED Viewed

@@ -32,6 +32,12 @@ function _track(model, category, usage, tool, latencyMs, success) {
   _tracker.record(model, category, input, output, tool, latencyMs, success, cacheCreation, cacheRead);
 }
+function _trackEmbedding(model, usage, latencyMs, success) { // Record one embedding call in the token tracker under the "embedding" category.
+  if (!_tracker) return; // No tracker is set, so there is nothing to record into.
+  const input = usage?.prompt_tokens || usage?.total_tokens || 0; // Input tokens: prompt_tokens, else total_tokens, else 0 (usage may be null/undefined).
+  _tracker.record(model, "embedding", input, 0, null, latencyMs, success, 0, 0); // Same positional order as _track's record() call: output=0, tool=null, cacheCreation=0, cacheRead=0.
+}
 // ── Client Management ──
 function getClient(provider) {
@@ -619,4 +625,4 @@ Include both if needed, or just one.`;
   }
 }
-module.exports = { requestRepair, getClient, tokenParam, aiCall, aiCallWithHistory, isResponsesModel, isAnthropicModel, setTokenTracker, getTrackerSnapshot, detectProvider };
+module.exports = { requestRepair, getClient, tokenParam, aiCall, aiCallWithHistory, isResponsesModel, isAnthropicModel, setTokenTracker, getTrackerSnapshot, detectProvider, _trackEmbedding };