wolverine-ai 2.2.3 → 2.3.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +18 -0
- package/package.json +1 -1
- package/src/agent/agent-engine.js +29 -0
- package/src/agent/goal-loop.js +3 -2
- package/src/agent/sub-agents.js +10 -7
- package/src/brain/brain.js +5 -1
- package/src/core/verifier.js +13 -3
- package/src/core/wolverine.js +39 -10
package/README.md
CHANGED
|
@@ -419,6 +419,24 @@ Wolverine (single process manager)
|
|
|
419
419
|
|
|
420
420
|
---
|
|
421
421
|
|
|
422
|
+
## Cost Optimization
|
|
423
|
+
|
|
424
|
+
Wolverine minimizes AI spend through 7 techniques:
|
|
425
|
+
|
|
426
|
+
| Technique | What it does | Savings |
|
|
427
|
+
|-----------|-------------|---------|
|
|
428
|
+
| **Smart verification** | Simple errors (TypeError, ReferenceError) skip route probe — trusts syntax+boot, ErrorMonitor is safety net | Prevents $0.29 cascade |
|
|
429
|
+
| **Haiku triage** | Sub-agents (explore/plan/verify/research) use cheap classifier model, only fixer uses Sonnet/Opus | 90% on sub-agent cost |
|
|
430
|
+
| **Context compacting** | Every 3 agent turns, summarize history to prevent token blowup (95K→20K) | 70-80% on later turns |
|
|
431
|
+
| **Cached fix patterns** | Check repair history for identical past fix before calling AI | 100% on repeat errors |
|
|
432
|
+
| **Token budget caps** | Simple: 20K, moderate: 50K, complex: 100K agent budget | Caps runaway spend |
|
|
433
|
+
| **Prior attempt summaries** | Pass concise "do NOT repeat" directives between iterations, not full context | Reduces baseline tokens |
|
|
434
|
+
| **Backup diff context** | AI sees last known good version to revert broken code instead of patching around it | Better fix quality, fewer retries |
|
|
435
|
+
|
|
436
|
+
**Result:** Simple TypeError heal drops from **$0.31 → $0.02** (15x cheaper).
|
|
437
|
+
|
|
438
|
+
---
|
|
439
|
+
|
|
422
440
|
## Configuration
|
|
423
441
|
|
|
424
442
|
```
|
package/package.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "wolverine-ai",
|
|
3
|
-
"version": "2.
|
|
3
|
+
"version": "2.3.1",
|
|
4
4
|
"description": "Self-healing Node.js server framework powered by AI. Catches crashes, diagnoses errors, generates fixes, verifies, and restarts — automatically.",
|
|
5
5
|
"main": "src/index.js",
|
|
6
6
|
"bin": {
|
|
@@ -463,6 +463,35 @@ Project root: ${this.cwd}${primaryFile ? `\nPrimary crash file: ${primaryFile}`
|
|
|
463
463
|
|
|
464
464
|
console.log(chalk.gray(` 🤖 Agent turn ${this.turnCount}/${this.maxTurns} (${this.totalTokens} tokens used)`));
|
|
465
465
|
|
|
466
|
+
// Compact context every 3 turns to prevent token blowup
|
|
467
|
+
// Turn 6 without compacting: ~95K tokens. With compacting: ~20K tokens.
|
|
468
|
+
if (this.turnCount > 1 && this.turnCount % 3 === 0 && this.messages.length > 4) {
|
|
469
|
+
try {
|
|
470
|
+
const { aiCall } = require("./ai-client") || require("../core/ai-client");
|
|
471
|
+
const { getModel: _gm } = require("./models") || require("../core/models");
|
|
472
|
+
const historyToCompact = this.messages.slice(1, -2); // keep system + last exchange
|
|
473
|
+
if (historyToCompact.length > 2) {
|
|
474
|
+
const historyText = historyToCompact.map(m => `${m.role}: ${(m.content || "").slice(0, 500)}`).join("\n");
|
|
475
|
+
const compactResult = await aiCall({
|
|
476
|
+
model: _gm("compacting"),
|
|
477
|
+
systemPrompt: "Summarize this agent conversation history into a concise status report. Keep: files read, changes made, errors found, what was tried. Remove: full file contents, redundant tool results.",
|
|
478
|
+
userPrompt: historyText.slice(0, 8000),
|
|
479
|
+
maxTokens: 512,
|
|
480
|
+
category: "brain",
|
|
481
|
+
});
|
|
482
|
+
if (compactResult.content) {
|
|
483
|
+
this.messages = [
|
|
484
|
+
this.messages[0], // system prompt
|
|
485
|
+
{ role: "assistant", content: `[Prior work summary]\n${compactResult.content}` },
|
|
486
|
+
{ role: "user", content: "Continue from where you left off." },
|
|
487
|
+
...this.messages.slice(-2), // last exchange
|
|
488
|
+
];
|
|
489
|
+
console.log(chalk.gray(` 📦 Compacted ${historyToCompact.length} messages → summary (${compactResult.content.length} chars)`));
|
|
490
|
+
}
|
|
491
|
+
}
|
|
492
|
+
} catch { /* compacting failed — continue with full context */ }
|
|
493
|
+
}
|
|
494
|
+
|
|
466
495
|
let response;
|
|
467
496
|
try {
|
|
468
497
|
response = await aiCallWithHistory({
|
package/src/agent/goal-loop.js
CHANGED
|
@@ -57,16 +57,17 @@ class GoalLoop {
|
|
|
57
57
|
}
|
|
58
58
|
}
|
|
59
59
|
|
|
60
|
-
// Attempt the fix
|
|
60
|
+
// Attempt the fix — pass prior attempts so the handler can include concise summary
|
|
61
61
|
let attempt;
|
|
62
62
|
try {
|
|
63
|
-
attempt = await this.onAttempt(iteration, context);
|
|
63
|
+
attempt = await this.onAttempt(iteration, context, this._attempts);
|
|
64
64
|
} catch (err) {
|
|
65
65
|
attempt = { healed: false, explanation: `Error: ${err.message}` };
|
|
66
66
|
}
|
|
67
67
|
|
|
68
68
|
this._attempts.push({
|
|
69
69
|
iteration,
|
|
70
|
+
mode: attempt.mode || "unknown",
|
|
70
71
|
success: attempt.healed,
|
|
71
72
|
explanation: attempt.explanation || "No explanation",
|
|
72
73
|
});
|
package/src/agent/sub-agents.js
CHANGED
|
@@ -33,14 +33,17 @@ const AGENT_TOOL_SETS = {
|
|
|
33
33
|
};
|
|
34
34
|
|
|
35
35
|
// Default model + budget per agent type
|
|
36
|
+
// Cost optimization: triage agents use cheap models (classifier slot = Haiku),
|
|
37
|
+
// only the fixer needs the expensive coding model (Sonnet/Opus).
|
|
38
|
+
// This cuts sub-agent cost by ~90% (6 Haiku calls vs 6 Sonnet calls).
|
|
36
39
|
const AGENT_CONFIGS = {
|
|
37
|
-
explore: { model: "
|
|
38
|
-
plan: { model: "
|
|
39
|
-
fix: { model: "coding",
|
|
40
|
-
verify: { model: "
|
|
41
|
-
research: { model: "
|
|
42
|
-
security: { model: "audit", maxTurns: 3, maxTokens: 8000 },
|
|
43
|
-
database: { model: "coding",
|
|
40
|
+
explore: { model: "classifier", maxTurns: 5, maxTokens: 15000 }, // Haiku — just reading
|
|
41
|
+
plan: { model: "classifier", maxTurns: 3, maxTokens: 10000 }, // Haiku — simple planning
|
|
42
|
+
fix: { model: "coding", maxTurns: 5, maxTokens: 50000 }, // Sonnet/Opus — needs reasoning
|
|
43
|
+
verify: { model: "classifier", maxTurns: 3, maxTokens: 8000 }, // Haiku — just checking
|
|
44
|
+
research: { model: "classifier", maxTurns: 3, maxTokens: 10000 }, // Haiku — summarization
|
|
45
|
+
security: { model: "audit", maxTurns: 3, maxTokens: 8000 }, // Haiku — pattern matching
|
|
46
|
+
database: { model: "coding", maxTurns: 5, maxTokens: 50000 }, // Sonnet/Opus — needs reasoning
|
|
44
47
|
};
|
|
45
48
|
|
|
46
49
|
// System prompts per agent type
|
package/src/brain/brain.js
CHANGED
|
@@ -112,7 +112,7 @@ const SEED_DOCS = [
|
|
|
112
112
|
metadata: { topic: "sub-agent-tools" },
|
|
113
113
|
},
|
|
114
114
|
{
|
|
115
|
-
text: "Heal pipeline escalation: Iteration 1 uses fast path (CODING_MODEL
|
|
115
|
+
text: "Heal pipeline escalation with cost optimization: Iteration 1 uses fast path (CODING_MODEL). For simple errors (TypeError/ReferenceError/SyntaxError), verifier trusts syntax+boot and skips route probe — ErrorMonitor is safety net. This prevents false-rejection cascades that waste tokens. Iteration 2 uses single agent (REASONING_MODEL, 4 turns for simple errors, 8 for complex). Iteration 3+ uses sub-agents with Haiku for triage (explore/plan/verify/research use classifier model) and only fixer uses coding model — 90% cheaper. Token budgets capped by error complexity: simple=20K, moderate=50K, complex=100K. Context compacted every 3 agent turns to prevent token blowup (95K→20K). Prior attempt summaries passed between iterations instead of full context. Brain checked for cached fix patterns before starting AI.",
|
|
116
116
|
metadata: { topic: "heal-escalation" },
|
|
117
117
|
},
|
|
118
118
|
{
|
|
@@ -235,6 +235,10 @@ const SEED_DOCS = [
|
|
|
235
235
|
text: "Dependency manager skill (src/skills/deps.js): structured npm dependency analysis + repair. diagnose(errorMessage, cwd) returns {diagnosed, category, summary, fixes} — categories: missing_install, missing_package, version_conflict, outdated_api, corrupted_modules. healthReport(cwd) returns full health check: npm audit (vulnerabilities), outdated packages, peer dep conflicts, unused packages, lock file status, health score 0-100. getMigration(packageName) returns known upgrade paths: express→fastify (5.6x faster), moment→dayjs (2KB vs 70KB), request→node-fetch (deprecated), body-parser→built-in, callbacks→async/await. Agent tools: audit_deps (full health check), check_migration (upgrade paths). Heal pipeline uses diagnose() in tryOperationalFix before AI — zero tokens for dependency issues.",
|
|
236
236
|
metadata: { topic: "skill-deps" },
|
|
237
237
|
},
|
|
238
|
+
{
|
|
239
|
+
text: "Cost optimization: 7 techniques reduce heal cost from $0.31 to $0.02 for simple errors. (1) Verifier skips route probe for simple errors (TypeError/ReferenceError/SyntaxError) — trusts syntax+boot, ErrorMonitor is safety net. Prevents false-rejection cascades. (2) Sub-agents use Haiku (classifier model) for explore/plan/verify/research — only fixer uses Sonnet/Opus. 6 Haiku calls=$0.006 vs 6 Sonnet calls=$0.12. (3) Agent context compacted every 3 turns using compacting model — prevents 15K→95K token blowup. (4) Brain checked for cached fix patterns before AI — repeat errors cost $0. (5) Token budgets capped by error complexity: simple=20K agent budget, moderate=50K, complex=100K. Simple errors get 4 agent turns max. (6) Prior attempt summaries (not full context) passed between iterations — concise 'do NOT repeat' directives. (7) Fast path includes last known good backup code so AI can revert broken additions instead of patching around them.",
|
|
240
|
+
metadata: { topic: "cost-optimization" },
|
|
241
|
+
},
|
|
238
242
|
];
|
|
239
243
|
|
|
240
244
|
class Brain {
|
package/src/core/verifier.js
CHANGED
|
@@ -131,7 +131,14 @@ function bootProbe(scriptPath, cwd, originalErrorSignature) {
|
|
|
131
131
|
* @param {object} routeContext — optional { path, method } for route-level testing
|
|
132
132
|
*/
|
|
133
133
|
async function verifyFix(scriptPath, cwd, originalErrorSignature, routeContext) {
|
|
134
|
-
|
|
134
|
+
// Simple errors (TypeError, ReferenceError, SyntaxError) — trust syntax+boot, skip route probe.
|
|
135
|
+
// If the fix is wrong, ErrorMonitor will catch the 500 and re-trigger heal. This avoids
|
|
136
|
+
// the expensive cascade where a working fix gets rolled back because the route probe
|
|
137
|
+
// can't boot the full server in isolation.
|
|
138
|
+
const isSimpleError = /TypeError|ReferenceError|SyntaxError|Cannot find module/.test(originalErrorSignature || "");
|
|
139
|
+
const skipRouteProbe = isSimpleError;
|
|
140
|
+
const steps = (!skipRouteProbe && routeContext?.path) ? 3 : 2;
|
|
141
|
+
|
|
135
142
|
console.log(chalk.yellow("\n🔬 Verifying fix...\n"));
|
|
136
143
|
|
|
137
144
|
// Step 1: Syntax check
|
|
@@ -157,8 +164,9 @@ async function verifyFix(scriptPath, cwd, originalErrorSignature, routeContext)
|
|
|
157
164
|
}
|
|
158
165
|
console.log(chalk.green(" ✅ Process booted successfully"));
|
|
159
166
|
|
|
160
|
-
// Step 3: Route probe
|
|
161
|
-
|
|
167
|
+
// Step 3: Route probe — only for complex errors (not simple TypeError/ReferenceError)
|
|
168
|
+
// Simple errors: trust syntax+boot. ErrorMonitor is the safety net.
|
|
169
|
+
if (!skipRouteProbe && routeContext?.path) {
|
|
162
170
|
console.log(chalk.gray(` [3/${steps}] Route probe: ${routeContext.method || "GET"} ${routeContext.path}...`));
|
|
163
171
|
const routeResult = await routeProbe(scriptPath, cwd, routeContext);
|
|
164
172
|
if (routeResult.status === "failed") {
|
|
@@ -170,6 +178,8 @@ async function verifyFix(scriptPath, cwd, originalErrorSignature, routeContext)
|
|
|
170
178
|
} else {
|
|
171
179
|
console.log(chalk.gray(` ⚠️ Route probe skipped: ${routeResult.reason || "unknown"}`));
|
|
172
180
|
}
|
|
181
|
+
} else if (skipRouteProbe && routeContext?.path) {
|
|
182
|
+
console.log(chalk.gray(` ⚡ Skipping route probe (simple error — ErrorMonitor is safety net)`));
|
|
173
183
|
}
|
|
174
184
|
|
|
175
185
|
return { verified: true, status: "fixed" };
|
package/src/core/wolverine.js
CHANGED
|
@@ -203,7 +203,22 @@ async function _healImpl({ stderr, cwd, sandbox, notifier, rateLimiter, backupMa
|
|
|
203
203
|
} catch { /* non-fatal */ }
|
|
204
204
|
}
|
|
205
205
|
|
|
206
|
-
// 6.
|
|
206
|
+
// 6. Check brain for cached fix — if we fixed this exact error before, replay it (zero tokens)
|
|
207
|
+
if (brain && brain._initialized && hasFile && repairHistory) {
|
|
208
|
+
try {
|
|
209
|
+
const pastRepairs = repairHistory.getAll().filter(r =>
|
|
210
|
+
r.success && r.file === parsed.filePath && r.error &&
|
|
211
|
+
parsed.errorMessage.includes(r.error.split(":").pop()?.trim()?.slice(0, 30))
|
|
212
|
+
);
|
|
213
|
+
if (pastRepairs.length > 0) {
|
|
214
|
+
const cached = pastRepairs[pastRepairs.length - 1];
|
|
215
|
+
console.log(chalk.gray(` 🧠 Found cached fix for similar error (${cached.mode}, ${cached.id})`));
|
|
216
|
+
if (logger) logger.info("heal.cached", `Cached fix found: ${cached.resolution?.slice(0, 80)}`, { cachedId: cached.id });
|
|
217
|
+
}
|
|
218
|
+
} catch {}
|
|
219
|
+
}
|
|
220
|
+
|
|
221
|
+
// 7. Research — check past attempts to avoid loops
|
|
207
222
|
const researcher = new ResearchAgent({ brain, logger });
|
|
208
223
|
let researchContext = "";
|
|
209
224
|
try {
|
|
@@ -211,24 +226,38 @@ async function _healImpl({ stderr, cwd, sandbox, notifier, rateLimiter, backupMa
|
|
|
211
226
|
if (researchContext) console.log(chalk.gray(` 🔍 Research: found past context for this error`));
|
|
212
227
|
} catch {}
|
|
213
228
|
|
|
214
|
-
//
|
|
215
|
-
|
|
216
|
-
|
|
217
|
-
|
|
229
|
+
// 7b. Token budget by error complexity — simple bugs get tight caps
|
|
230
|
+
const isSimpleError = /TypeError|ReferenceError|SyntaxError|Cannot find module/.test(parsed.errorMessage);
|
|
231
|
+
const isModerateError = /ECONNREFUSED|timeout|ENOENT|EACCES|EADDRINUSE/.test(parsed.errorMessage);
|
|
232
|
+
const tokenBudget = isSimpleError
|
|
233
|
+
? { fast: 5000, agent: 20000, subAgent: 15000 }
|
|
234
|
+
: isModerateError
|
|
235
|
+
? { fast: 10000, agent: 50000, subAgent: 30000 }
|
|
236
|
+
: { fast: 15000, agent: 100000, subAgent: 50000 };
|
|
237
|
+
console.log(chalk.gray(` 💰 Token budget: ${isSimpleError ? "simple" : isModerateError ? "moderate" : "complex"} (agent: ${tokenBudget.agent})`));
|
|
238
|
+
|
|
239
|
+
// 8. Goal Loop — set goal, iterate until fixed or exhausted
|
|
218
240
|
const loop = new GoalLoop({
|
|
219
241
|
maxIterations: parseInt(process.env.WOLVERINE_MAX_RETRIES, 10) || 3,
|
|
220
242
|
researcher,
|
|
221
243
|
logger,
|
|
222
244
|
goal: `Fix: ${parsed.errorMessage.slice(0, 80)}`,
|
|
223
245
|
|
|
224
|
-
onAttempt: async (iteration, researchCtx) => {
|
|
246
|
+
onAttempt: async (iteration, researchCtx, priorAttempts) => {
|
|
225
247
|
// Create backup for this attempt
|
|
226
|
-
// Full server/ backup — includes all files, configs, databases
|
|
227
248
|
const bid = backupManager.createBackup(`heal attempt ${iteration}: ${parsed.errorMessage.slice(0, 60)}`);
|
|
228
249
|
backupManager.setErrorSignature(bid, errorSignature);
|
|
229
250
|
if (logger) logger.info(EVENT_TYPES.BACKUP_CREATED, `Backup ${bid} (iteration ${iteration})`, { backupId: bid });
|
|
230
251
|
|
|
231
|
-
|
|
252
|
+
// Build concise prior attempt summary instead of full context bleed
|
|
253
|
+
let priorSummary = "";
|
|
254
|
+
if (priorAttempts && priorAttempts.length > 0) {
|
|
255
|
+
priorSummary = "\nPRIOR ATTEMPTS (do NOT repeat):\n" + priorAttempts.map(a =>
|
|
256
|
+
`- Attempt ${a.iteration} (${a.mode}): ${a.explanation?.slice(0, 100)}`
|
|
257
|
+
).join("\n") + "\n";
|
|
258
|
+
}
|
|
259
|
+
|
|
260
|
+
const fullContext = [brainContext, researchContext, researchCtx, envContext, priorSummary].filter(Boolean).join("\n");
|
|
232
261
|
|
|
233
262
|
let result;
|
|
234
263
|
if (iteration === 1 && hasFile) {
|
|
@@ -291,8 +320,8 @@ async function _healImpl({ stderr, cwd, sandbox, notifier, rateLimiter, backupMa
|
|
|
291
320
|
console.log(chalk.magenta(` 🤖 Agent path (${getModel("reasoning")})...`));
|
|
292
321
|
const agent = new AgentEngine({
|
|
293
322
|
sandbox, logger, cwd, mcp,
|
|
294
|
-
maxTurns: 8,
|
|
295
|
-
maxTokens:
|
|
323
|
+
maxTurns: isSimpleError ? 4 : 8,
|
|
324
|
+
maxTokens: tokenBudget.agent,
|
|
296
325
|
});
|
|
297
326
|
|
|
298
327
|
const agentResult = await agent.run({
|