npm - daemora - Versions diffs - 1.0.0 - Mend

daemora 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (115) hide show

package/README.md +666 -0
package/SOUL.md +104 -0
package/config/hooks.json +14 -0
package/config/mcp.json +145 -0
package/package.json +86 -0
package/skills/.gitkeep +0 -0
package/skills/apple-notes.md +193 -0
package/skills/apple-reminders.md +189 -0
package/skills/camsnap.md +162 -0
package/skills/coding.md +14 -0
package/skills/documents.md +13 -0
package/skills/email.md +13 -0
package/skills/gif-search.md +196 -0
package/skills/healthcheck.md +225 -0
package/skills/image-gen.md +147 -0
package/skills/model-usage.md +182 -0
package/skills/obsidian.md +207 -0
package/skills/pdf.md +211 -0
package/skills/research.md +13 -0
package/skills/skill-creator.md +142 -0
package/skills/spotify.md +149 -0
package/skills/summarize.md +230 -0
package/skills/things.md +199 -0
package/skills/tmux.md +204 -0
package/skills/trello.md +183 -0
package/skills/video-frames.md +202 -0
package/skills/weather.md +127 -0
package/src/a2a/A2AClient.js +136 -0
package/src/a2a/A2AServer.js +316 -0
package/src/a2a/AgentCard.js +79 -0
package/src/agents/SubAgentManager.js +369 -0
package/src/agents/Supervisor.js +192 -0
package/src/channels/BaseChannel.js +104 -0
package/src/channels/DiscordChannel.js +288 -0
package/src/channels/EmailChannel.js +172 -0
package/src/channels/GoogleChatChannel.js +316 -0
package/src/channels/HttpChannel.js +26 -0
package/src/channels/LineChannel.js +168 -0
package/src/channels/SignalChannel.js +186 -0
package/src/channels/SlackChannel.js +329 -0
package/src/channels/TeamsChannel.js +272 -0
package/src/channels/TelegramChannel.js +347 -0
package/src/channels/WhatsAppChannel.js +219 -0
package/src/channels/index.js +198 -0
package/src/cli.js +1267 -0
package/src/config/agentProfiles.js +120 -0
package/src/config/channels.js +32 -0
package/src/config/default.js +206 -0
package/src/config/models.js +123 -0
package/src/config/permissions.js +167 -0
package/src/core/AgentLoop.js +446 -0
package/src/core/Compaction.js +143 -0
package/src/core/CostTracker.js +116 -0
package/src/core/EventBus.js +46 -0
package/src/core/Task.js +67 -0
package/src/core/TaskQueue.js +206 -0
package/src/core/TaskRunner.js +226 -0
package/src/daemon/DaemonManager.js +301 -0
package/src/hooks/HookRunner.js +230 -0
package/src/index.js +482 -0
package/src/mcp/MCPAgentRunner.js +112 -0
package/src/mcp/MCPClient.js +186 -0
package/src/mcp/MCPManager.js +412 -0
package/src/models/ModelRouter.js +180 -0
package/src/safety/AuditLog.js +135 -0
package/src/safety/CircuitBreaker.js +126 -0
package/src/safety/FilesystemGuard.js +169 -0
package/src/safety/GitRollback.js +139 -0
package/src/safety/HumanApproval.js +156 -0
package/src/safety/InputSanitizer.js +72 -0
package/src/safety/PermissionGuard.js +83 -0
package/src/safety/Sandbox.js +70 -0
package/src/safety/SecretScanner.js +100 -0
package/src/safety/SecretVault.js +250 -0
package/src/scheduler/Heartbeat.js +115 -0
package/src/scheduler/Scheduler.js +228 -0
package/src/services/models/outputSchema.js +15 -0
package/src/services/openai.js +25 -0
package/src/services/sessions.js +65 -0
package/src/setup/theme.js +110 -0
package/src/setup/wizard.js +788 -0
package/src/skills/SkillLoader.js +168 -0
package/src/storage/TaskStore.js +69 -0
package/src/systemPrompt.js +526 -0
package/src/tenants/TenantContext.js +19 -0
package/src/tenants/TenantManager.js +379 -0
package/src/tools/ToolRegistry.js +141 -0
package/src/tools/applyPatch.js +144 -0
package/src/tools/browserAutomation.js +223 -0
package/src/tools/createDocument.js +265 -0
package/src/tools/cronTool.js +105 -0
package/src/tools/editFile.js +139 -0
package/src/tools/executeCommand.js +123 -0
package/src/tools/glob.js +67 -0
package/src/tools/grep.js +121 -0
package/src/tools/imageAnalysis.js +120 -0
package/src/tools/index.js +173 -0
package/src/tools/listDirectory.js +47 -0
package/src/tools/manageAgents.js +47 -0
package/src/tools/manageMCP.js +159 -0
package/src/tools/memory.js +478 -0
package/src/tools/messageChannel.js +45 -0
package/src/tools/projectTracker.js +259 -0
package/src/tools/readFile.js +52 -0
package/src/tools/screenCapture.js +112 -0
package/src/tools/searchContent.js +76 -0
package/src/tools/searchFiles.js +75 -0
package/src/tools/sendEmail.js +118 -0
package/src/tools/sendFile.js +63 -0
package/src/tools/textToSpeech.js +161 -0
package/src/tools/transcribeAudio.js +82 -0
package/src/tools/useMCP.js +29 -0
package/src/tools/webFetch.js +150 -0
package/src/tools/webSearch.js +134 -0
package/src/tools/writeFile.js +26 -0

package/src/core/AgentLoop.js ADDED Viewed

@@ -0,0 +1,446 @@
+import { generateObject } from "ai";
+import { getModelWithFallback } from "../models/ModelRouter.js";
+import { compactIfNeeded, estimateTokens } from "./Compaction.js";
+import { config } from "../config/default.js";
+import eventBus from "./EventBus.js";
+import outputSchema from "../services/models/outputSchema.js";
+import hookRunner from "../hooks/HookRunner.js";
+import secretScanner from "../safety/SecretScanner.js";
+import sandbox from "../safety/Sandbox.js";
+import circuitBreaker from "../safety/CircuitBreaker.js";
+import permissionGuard from "../safety/PermissionGuard.js";
+import supervisor from "../agents/Supervisor.js";
+import gitRollback from "../safety/GitRollback.js";
+/**
+ * Core agent loop — model-agnostic via Vercel AI SDK.
+ *
+ * Extracted from the original openai.js. This is the brain of the agent:
+ * 1. Send messages to model (any provider)
+ * 2. If model returns tool_call → execute tool → feed result back → loop
+ * 3. If model returns text + finalResponse → return to caller
+ * 4. Compaction when approaching context limit
+ * 5. Repeat detection, max loop safety, stuck agent recovery
+ *
+ * Every tool call passes through these gates, in this order, before it runs:
+ * PermissionGuard → CircuitBreaker → Sandbox (executeCommand only) →
+ * PreToolUse hooks → Git snapshot (first write tool only). A gate that blocks
+ * pushes its reason back to the model as a role "user" message and continues
+ * with the next iteration; it does not throw.
+ *
+ * Message conventions used by the loop: the model's tool calls are stored as
+ * role "assistant" messages holding the JSON-stringified model output, while
+ * tool results, gate rejections, steering instructions and retry nudges are
+ * all stored as role "user" messages.
+ *
+ * Two "lazy model" safeguards can reject a final answer and force another
+ * iteration: (1) no tool was used at all within the first 2 iterations and the
+ * last user message is not a short acknowledgement, (2) the answer contains an
+ * action word (fixed, updated, created, …) within the first 4 iterations but
+ * no tool from WRITE_TOOLS completed successfully.
+ *
+ * NOTE(review): the outer try/catch wraps the whole iteration body, so an
+ * exception thrown by a gate or hook (anything outside the inner tool
+ * try/catch) is counted and logged as a failed model call.
+ *
+ * @param {object} options
+ * @param {Array} options.messages - Conversation history
+ * @param {object} options.systemPrompt - System prompt { role, content }
+ * @param {object} options.tools - Tool functions map { name: fn }
+ * @param {string} [options.modelId] - Model to use (e.g. "openai:gpt-4.1-mini"); falls back to config.defaultModel
+ * @param {string} [options.taskId] - Task ID for tracking
+ * @param {string} [options.approvalMode] - "auto" | "dangerous-only" | "every-tool". NOTE(review): accepted but never read inside this function — confirm where approval is enforced
+ * @param {object} [options.channelMeta] - Channel metadata. NOTE(review): likewise never read inside this function
+ * @param {AbortSignal} [options.signal] - Checked at the top of every iteration, forwarded to generateObject as abortSignal, and checked again when an iteration throws
+ * @param {Array} [options.steerQueue] - Shared mutable queue, drained with shift() at the top of every iteration. { type: "user", content } items become plain user messages; strings (and anything else, JSON-stringified) become "[Supervisor instruction]: …" user messages
+ * @param {object} [options.apiKeys] - Passed to getModelWithFallback; its values (when 8+ characters long) are also redacted from tool outputs
+ * @returns {{ text: string, messages: Array, cost: object }} Resolved value of the returned promise. messages excludes the system prompt; cost is { inputTokens, outputTokens, estimatedCost, modelCalls, model }, where modelCalls is the iteration count and estimatedCost is 0 on the abort, supervisor-kill and repeated-failure exits
+ */
+export async function runAgentLoop({
+  messages: msgs,
+  systemPrompt,
+  tools,
+  modelId = null,
+  taskId = null,
+  approvalMode = "auto",   // "auto" | "dangerous-only" | "every-tool"
+  channelMeta = null,      // passed through to HumanApproval so channel can notify user
+  signal = null,           // AbortController.signal — hard-kills the loop mid-call
+  steerQueue = null,       // shared mutable array — push strings here to steer the agent
+  apiKeys = {},            // per-tenant API key overlay — passed through to provider factory
+}) {
+  const selectedModelId = modelId || config.defaultModel;
+  const { model, meta, modelId: resolvedModelId } = getModelWithFallback(selectedModelId, apiKeys);
+  // Build set of known secret values to redact from tool outputs (dynamic — catches tenant keys)
+  const _knownSecrets = new Set([
+    ...Object.values(apiKeys),
+    process.env.OPENAI_API_KEY,
+    process.env.ANTHROPIC_API_KEY,
+    process.env.GOOGLE_AI_API_KEY,
+  ].filter((s) => s && s.length >= 8)); // drops unset values and anything shorter than 8 characters
+  function _redactKnownSecrets(text) {
+    let out = text;
+    for (const secret of _knownSecrets) {
+      if (out.includes(secret)) out = out.replaceAll(secret, "[REDACTED:API_KEY]");
+    }
+    return out;
+  }
+  let messages = [systemPrompt, ...msgs];
+  let stepCount = 0; // number of tool_call responses handled (including blocked ones)
+  let writeToolUsed = false;  // Track if model actually modified anything
+  let loopCount = 0; // iterations started; reported as cost.modelCalls
+  let lastToolCall = null; // JSON of the previous { tool_name, params }, for repeat detection
+  let repeatCount = 0;
+  let totalInputTokens = 0;
+  let totalOutputTokens = 0;
+  let consecutiveErrors = 0; // reset after each successful generateObject call
+  const WRITE_TOOLS = new Set(["writeFile", "editFile", "applyPatch", "executeCommand", "sendEmail", "createDocument", "browserAction", "messageChannel"]);
+  let gitSnapshotDone = false; // Only snapshot once per task
+  const ACTION_WORDS = /\b(fixed|updated|created|added|modified|changed|removed|deleted|wrote|edited|replaced|refactored|implemented|styled|applied)\b/i;
+  console.log(`\n--- AGENT LOOP STARTED ---`);
+  console.log(`Model: ${resolvedModelId}`);
+  console.log(`User message: "${msgs[msgs.length - 1]?.content?.slice(0, 120)}"`);
+  console.log(`Conversation history: ${msgs.length} message(s)`);
+  while (true) {
+    loopCount++;
+    // ── Break point 1: AbortController signal (hard kill, works mid-API-call) ──
+    if (signal?.aborted) {
+      console.log(`[AgentLoop] Task ${taskId?.slice(0, 8)} aborted via AbortController.`);
+      return {
+        text: "Agent was stopped by the supervisor.",
+        messages: messages.slice(1),
+        cost: { inputTokens: totalInputTokens, outputTokens: totalOutputTokens, estimatedCost: 0, modelCalls: loopCount, model: resolvedModelId },
+      };
+    }
+    // ── Break point 2: Supervisor kill flag (checked each iteration) ──────────
+    if (supervisor.isKilled(taskId)) {
+      console.log(`[AgentLoop] Task ${taskId?.slice(0, 8)} was killed by Supervisor. Stopping.`);
+      return {
+        text: "Task was stopped by the safety supervisor due to excessive tool usage or a dangerous pattern.",
+        messages: messages.slice(1),
+        cost: { inputTokens: totalInputTokens, outputTokens: totalOutputTokens, estimatedCost: 0, modelCalls: loopCount, model: resolvedModelId },
+      };
+    }
+    // ── Steering: drain steerQueue between tool calls ────────────────────────
+    // Items can be plain strings (supervisor/parent instructions) or
+    // objects { type: "user", content } for live follow-up messages injected
+    // from the same session while this loop is mid-flight.
+    if (steerQueue?.length > 0) {
+      while (steerQueue.length > 0) {
+        const item = steerQueue.shift();
+        if (item && typeof item === "object" && item.type === "user") {
+          // User sent a follow-up mid-task — inject as a natural user turn
+          console.log(`[AgentLoop] User follow-up injected: "${item.content.slice(0, 80)}"`);
+          messages.push({ role: "user", content: item.content });
+        } else {
+          const text = typeof item === "string" ? item : JSON.stringify(item);
+          console.log(`[AgentLoop] Steering instruction received: "${text.slice(0, 80)}"`);
+          messages.push({ role: "user", content: `[Supervisor instruction]: ${text}` });
+        }
+      }
+    }
+    if (loopCount > config.maxLoops) { // NOTE(review): this only asks the model to stop (again on every later iteration); nothing in this branch ends the loop by itself
+      console.log(`[WARN] Hit max loop limit (${config.maxLoops}). Forcing agent to stop.`);
+      messages.push({
+        role: "user",
+        content: `You have used ${config.maxLoops} iterations. You must stop now. Summarize what you have done so far. Set type to "text", finalResponse to true, and put your summary in text_content.`,
+      });
+    }
+    // Compaction check before model call
+    messages = await compactIfNeeded(messages, meta, taskId);
+    console.log(`\n[Loop ${loopCount}] Sending ${messages.length} messages (~${estimateTokens(messages)} tokens) to ${resolvedModelId}...`);
+    const startTime = Date.now();
+    try {
+      const response = await generateObject({
+        model,
+        schema: outputSchema,
+        messages,
+        maxTokens: 4096,
+        abortSignal: signal || undefined,
+      });
+      const elapsed = Date.now() - startTime;
+      consecutiveErrors = 0; // Reset on success
+      // Track token usage
+      if (response.usage) {
+        totalInputTokens += response.usage.promptTokens || 0;
+        totalOutputTokens += response.usage.completionTokens || 0;
+      }
+      eventBus.emitEvent("model:called", {
+        modelId: resolvedModelId,
+        loopCount,
+        elapsed,
+        inputTokens: response.usage?.promptTokens || 0,
+        outputTokens: response.usage?.completionTokens || 0,
+      });
+      const parsedOutput = response.object;
+      console.log(
+        `[Loop ${loopCount}] Model responded in ${elapsed}ms | type=${parsedOutput.type} | final=${parsedOutput.finalResponse}`
+      );
+      // --- Tool call handling ---
+      if (parsedOutput.type === "tool_call" && parsedOutput.tool_call) {
+        // Save the model's tool call as an assistant message so the conversation is properly structured
+        messages.push({ role: "assistant", content: JSON.stringify(parsedOutput) });
+        stepCount++;
+        const { tool_name, params } = parsedOutput.tool_call;
+        // Repeat detection: the third identical call in a row is not executed; the model is told to change approach instead
+        const currentCall = JSON.stringify({ tool_name, params });
+        if (currentCall === lastToolCall) {
+          repeatCount++;
+          console.log(`[WARN] Same tool call repeated ${repeatCount + 1} times in a row`);
+          if (repeatCount >= 2) {
+            console.log(`[WARN] Agent stuck repeating "${tool_name}". Forcing it to move on.`);
+            messages.push({
+              role: "user",
+              content: `You are calling ${tool_name} with the same params repeatedly. This is not working. Try a different approach or give the user your final answer. Set type to "text" and finalResponse to true.`,
+            });
+            lastToolCall = null;
+            repeatCount = 0;
+            continue;
+          }
+        } else {
+          repeatCount = 0;
+        }
+        lastToolCall = currentCall;
+        console.log(`[Step ${stepCount}] Tool: ${tool_name}`);
+        console.log(`[Step ${stepCount}] Params: ${JSON.stringify(params)}`);
+        eventBus.emitEvent("tool:before", { tool_name, params, stepCount, taskId });
+        // Permission guard check
+        const permCheck = permissionGuard.check(tool_name, params);
+        if (!permCheck.allowed) {
+          console.log(`[Step ${stepCount}] BLOCKED by PermissionGuard: ${permCheck.reason}`);
+          eventBus.emitEvent("audit:permission_denied", { tool_name, reason: permCheck.reason, taskId });
+          messages.push({
+            role: "user",
+            content: JSON.stringify({ tool_name, params, output: permCheck.reason }),
+          });
+          continue;
+        }
+        // Circuit breaker check
+        if (circuitBreaker.isToolDisabled(tool_name)) {
+          console.log(`[Step ${stepCount}] Tool "${tool_name}" temporarily disabled by circuit breaker`);
+          messages.push({
+            role: "user",
+            content: JSON.stringify({
+              tool_name, params,
+              output: `Tool "${tool_name}" is temporarily disabled due to repeated failures. Try a different approach.`,
+            }),
+          });
+          continue;
+        }
+        // Sandbox check for executeCommand
+        if (tool_name === "executeCommand" && params[0]) { // assumes params is an array of positional arguments — TODO confirm against outputSchema
+          const sandboxResult = sandbox.check(params[0]);
+          if (!sandboxResult.safe) {
+            console.log(`[Step ${stepCount}] BLOCKED by sandbox: ${sandboxResult.reason}`);
+            eventBus.emitEvent("audit:sandbox_blocked", { command: params[0], reason: sandboxResult.reason, taskId });
+            messages.push({
+              role: "user",
+              content: JSON.stringify({
+                tool_name, params,
+                output: `${sandboxResult.reason}. This command is not allowed for safety reasons.`,
+              }),
+            });
+            continue;
+          }
+        }
+        // Run PreToolUse hooks
+        const hookResult = await hookRunner.preToolUse(tool_name, params, taskId);
+        if (hookResult.decision === "block") {
+          console.log(`[Step ${stepCount}] BLOCKED by hook: ${hookResult.reason}`);
+          eventBus.emitEvent("audit:hook_blocked", { tool_name, reason: hookResult.reason, taskId });
+          messages.push({
+            role: "user",
+            content: JSON.stringify({
+              tool_name, params,
+              output: `Tool blocked by safety hook: ${hookResult.reason}. Try a different approach.`,
+            }),
+          });
+          continue;
+        }
+        // Git snapshot — before the first write tool in this task
+        if (!gitSnapshotDone && WRITE_TOOLS.has(tool_name)) {
+          gitRollback.snapshot(taskId);
+          gitSnapshotDone = true;
+        }
+        if (tools[tool_name]) {
+          try {
+            const toolStart = Date.now();
+            const toolOutput = await Promise.resolve(tools[tool_name](...params)); // params are spread as positional arguments; sync and async tools are both awaited
+            const toolElapsed = Date.now() - toolStart;
+            const outputStr = typeof toolOutput === "string" ? toolOutput : JSON.stringify(toolOutput);
+            const preview = outputStr.slice(0, 300) + (outputStr.length > 300 ? "..." : "");
+            // Track if a write tool was successfully used
+            if (WRITE_TOOLS.has(tool_name)) {
+              writeToolUsed = true;
+            }
+            console.log(`[Step ${stepCount}] Done in ${toolElapsed}ms`);
+            console.log(`[Step ${stepCount}] Output: ${preview}`);
+            eventBus.emitEvent("tool:after", {
+              tool_name,
+              params,
+              stepCount,
+              taskId,
+              duration: toolElapsed,
+              outputLength: outputStr.length,
+            });
+            // Run PostToolUse hooks
+            await hookRunner.postToolUse(tool_name, params, outputStr, taskId); // hooks receive the raw output, before any redaction
+            // Scan output for secrets and redact (double layer: static patterns + dynamic tenant keys)
+            const safeOutput = _redactKnownSecrets(secretScanner.redactOutput(outputStr));
+            const secretsFound = (outputStr.match(/\[REDACTED\]/g) || []).length - (safeOutput.match(/\[REDACTED\]/g) || []).length; // NOTE(review): the regex matches only the literal "[REDACTED]" (not "[REDACTED:API_KEY]") and subtracts the redacted count from the raw count; the emitted count is clamped to at least 1 below — confirm intent
+            if (safeOutput !== outputStr) {
+              eventBus.emitEvent("audit:secret_detected", { tool_name, taskId, count: Math.max(1, secretsFound) });
+            }
+            // Record success for circuit breaker
+            circuitBreaker.recordSuccess(taskId); // NOTE(review): success is keyed by taskId while failure (below) is keyed by tool_name — confirm against CircuitBreaker
+            messages.push({
+              role: "user",
+              content: JSON.stringify({ tool_name, params, output: safeOutput }),
+            });
+          } catch (error) {
+            console.log(`[Step ${stepCount}] FAILED: ${error.message}`);
+            // Record failure for circuit breaker
+            circuitBreaker.recordToolFailure(tool_name);
+            eventBus.emitEvent("tool:after", {
+              tool_name,
+              params,
+              stepCount,
+              taskId,
+              error: error.message,
+            });
+            messages.push({
+              role: "user",
+              content: JSON.stringify({
+                tool_name,
+                params,
+                output: `Error executing tool: ${error.message}`,
+              }),
+            });
+          }
+        } else {
+          console.log(`[Step ${stepCount}] Unknown tool: ${tool_name} — skipping`);
+          messages.push({
+            role: "user",
+            content: JSON.stringify({
+              tool_name,
+              params,
+              output: `Unknown tool: ${tool_name}. Available tools: ${Object.keys(tools).join(", ")}`,
+            }),
+          });
+        }
+        continue;
+      }
+      // --- Final response handling ---
+      if (parsedOutput.finalResponse || parsedOutput.type === "text") {
+        if (!parsedOutput.text_content) {
+          console.log(`[Loop ${loopCount}] Model signaled done but text_content is null — asking for summary`);
+          messages.push({
+            role: "user",
+            content:
+              "Provide a text summary of what you did. Set type to 'text', finalResponse to true, and text_content to your summary.",
+          });
+          continue;
+        }
+        // --- Lazy model safeguard ---
+        // SAFEGUARD 1: Model claimed done but used ZERO tools
+        // If the user's message is a real request (not just "ok"/"yes"), force tool use.
+        if (stepCount === 0 && loopCount <= 2) {
+          const lastUserMsg = msgs[msgs.length - 1]?.content?.toLowerCase() || "";
+          const isAck = /^(ok|okay|yes|yeah|sure|thanks|thank you|no|nah|k|yep|yup|got it|cool|nice|great|good|alright|👍)\.?$/i.test(lastUserMsg.trim());
+          if (!isAck && lastUserMsg.length > 5) {
+            console.log(`[Loop ${loopCount}] LAZY MODEL DETECTED — claimed done but used 0 tools. Forcing tool use.`);
+            messages.push({
+              role: "user",
+              content: `You responded without using any tools. You MUST actually use tools (readFile, editFile, writeFile, executeCommand, etc.) to complete the task. Do NOT claim you fixed or changed something without actually doing it. Use your tools NOW to fulfill the request.`,
+            });
+            continue;
+          }
+        }
+        // SAFEGUARD 2: Model used only READ tools but claims it modified/fixed something
+        // If the response contains action words but no write tool was ever called, push back.
+        if (!writeToolUsed && stepCount > 0 && loopCount <= 4 && ACTION_WORDS.test(parsedOutput.text_content)) {
+          console.log(`[Loop ${loopCount}] PHANTOM WRITE DETECTED — model claims "${parsedOutput.text_content.slice(0, 80)}..." but only used read tools. Forcing actual writes.`);
+          messages.push({
+            role: "user",
+            content: `You claim to have made changes but you only used read tools — you never called writeFile or editFile to actually modify any file. The files are UNCHANGED. You must use writeFile or editFile to actually make the changes. Do it now.`,
+          });
+          continue;
+        }
+        const cost = {
+          inputTokens: totalInputTokens,
+          outputTokens: totalOutputTokens,
+          estimatedCost:
+            (totalInputTokens / 1000) * meta.costPer1kInput +
+            (totalOutputTokens / 1000) * meta.costPer1kOutput,
+          modelCalls: loopCount,
+          model: resolvedModelId,
+        };
+        console.log(`\n--- AGENT LOOP FINISHED ---`);
+        console.log(`Stats: ${loopCount} loops | ${stepCount} tool calls | ~$${cost.estimatedCost.toFixed(4)}`);
+        console.log(
+          `Response: "${parsedOutput.text_content.slice(0, 150)}${parsedOutput.text_content.length > 150 ? "..." : ""}"`
+        );
+        // Add assistant's final response to conversation history
+        messages.push({ role: "assistant", content: parsedOutput.text_content });
+        const conversationMessages = messages.slice(1); // drop the system prompt before handing history back
+        return { text: parsedOutput.text_content, messages: conversationMessages, cost };
+      }
+    } catch (error) {
+      // Abort signal fires as an error — exit cleanly
+      if (signal?.aborted || error.name === "AbortError") {
+        console.log(`[Loop ${loopCount}] Aborted mid-call.`);
+        return {
+          text: "Agent was stopped by the supervisor.",
+          messages: messages.slice(1),
+          cost: { inputTokens: totalInputTokens, outputTokens: totalOutputTokens, estimatedCost: 0, modelCalls: loopCount, model: resolvedModelId },
+        };
+      }
+      consecutiveErrors++;
+      console.log(`[Loop ${loopCount}] Model call failed (${consecutiveErrors}/3): ${error.message}`);
+      // Give up after 3 consecutive failures
+      if (consecutiveErrors >= 3) {
+        console.log(`[FATAL] 3 consecutive model failures. Stopping.`);
+        return {
+          text: `I encountered an error while processing your request: ${error.message}`,
+          messages: messages.slice(1),
+          cost: {
+            inputTokens: totalInputTokens,
+            outputTokens: totalOutputTokens,
+            estimatedCost: 0,
+            modelCalls: loopCount,
+            model: resolvedModelId,
+          },
+        };
+      }
+      // Retry with a user-role nudge (compatible with all providers)
+      messages.push({
+        role: "user",
+        content: `[System: previous call failed: ${error.message}] Please provide your final answer. Set type to "text" and finalResponse to true.`,
+      });
+      continue;
+    }
+  }
+}

package/src/core/Compaction.js ADDED Viewed

@@ -0,0 +1,143 @@
+import { generateText } from "ai";
+import { getCheapModel } from "../models/ModelRouter.js";
+import { writeFileSync, mkdirSync } from "fs";
+import { config } from "../config/default.js";
+import eventBus from "./EventBus.js";
+/**
+ * Context compaction system.
+ *
+ * When conversation history approaches the model's context window:
+ * 1. Estimate token count
+ * 2. If over threshold → summarize older messages
+ * 3. Prune verbose tool outputs
+ * 4. Persist large outputs to disk
+ * 5. Continue with compressed context
+ */
+/**
+ * Rough token estimate: ~4 chars per token for English text.
+ *
+ * String content is measured directly; any other content is measured by the
+ * length of its JSON serialization. A message with no content (or content
+ * that JSON.stringify maps to undefined) counts as zero tokens instead of
+ * throwing, and a missing message list yields 0.
+ *
+ * @param {Array<{content?: *}>} messages - Messages to measure
+ * @returns {number} Sum of ceil(chars / 4) over all messages
+ */
+export function estimateTokens(messages) {
+  let total = 0;
+  for (const msg of messages ?? []) {
+    const raw = msg?.content;
+    // JSON.stringify(undefined) returns undefined, so fall back to "" before reading .length
+    const content = typeof raw === "string" ? raw : (JSON.stringify(raw) ?? "");
+    total += Math.ceil(content.length / 4);
+  }
+  return total;
+}
+/**
+ * Prune a single tool output — truncate if too long.
+ *
+ * Keeps the first 60% and the last 30% of the maxChars budget and replaces
+ * the middle with a marker stating how many characters were dropped.
+ * Non-string content is JSON-serialized first.
+ *
+ * @param {*} content - Tool output (a string, or any JSON-serializable value)
+ * @param {number} [maxChars=5000] - Outputs up to this length are returned unchanged
+ * @returns {string} The original text, or head + truncation marker + tail
+ */
+function pruneToolOutput(content, maxChars = 5000) {
+  // JSON.stringify(undefined) returns undefined, so fall back to an empty string
+  const text = typeof content === "string" ? content : (JSON.stringify(content) ?? "");
+  if (text.length <= maxChars) return text;
+  const headSize = Math.floor(maxChars * 0.6);
+  const tailSize = Math.floor(maxChars * 0.3);
+  // Slice from an explicit start index: slice(-tailSize) would return the
+  // whole string when tailSize rounds down to 0, because -0 is treated as 0.
+  const tail = text.slice(text.length - tailSize);
+  return (
+    text.slice(0, headSize) +
+    `\n\n[... truncated ${text.length - headSize - tailSize} chars ...]\n\n` +
+    tail
+  );
+}
+/**
+ * Write an oversized tool output to `<config.dataDir>/tool-outputs` and hand
+ * back a short placeholder string that names the file and the original size.
+ *
+ * The directory is created on demand. The file name combines the task ID
+ * ("unknown" when none is given), the step index and the current timestamp.
+ *
+ * @param {string} content - Full tool output to store
+ * @param {string|null} taskId - Task the output belongs to
+ * @param {number} stepIndex - Index of the message being replaced
+ * @returns {string} Placeholder text to use in place of the original output
+ */
+function persistLargeOutput(content, taskId, stepIndex) {
+  const outputDir = `${config.dataDir}/tool-outputs`;
+  mkdirSync(outputDir, { recursive: true });
+
+  const owner = taskId || "unknown";
+  const target = `${outputDir}/${owner}-step${stepIndex}-${Date.now()}.txt`;
+  writeFileSync(target, content);
+
+  const size = content.length;
+  return `[Output saved to disk: ${target} — ${size} chars]`;
+}
+/**
+ * Check if compaction is needed and perform it.
+ *
+ * Below modelMeta.compactAt (estimated tokens) the input array is returned
+ * untouched. Otherwise the system prompt (messages[0]) and the last 6 messages
+ * are kept verbatim, oversized tool outputs among the older messages are
+ * truncated (over 5000 chars) or moved to disk (over 50000 chars), and the
+ * older messages are replaced by a summary written by the cheap model. If
+ * summarization fails, the pruned older messages are kept in place of the
+ * summary.
+ *
+ * @param {Array} messages - Current message history
+ * @param {object} modelMeta - Model metadata (from models.js) with compactAt threshold
+ * @param {string} taskId - Current task ID for file persistence
+ * @returns {Promise<Array>} Possibly compacted messages
+ */
+export async function compactIfNeeded(messages, modelMeta, taskId = null) {
+  const tokenCount = estimateTokens(messages);
+  if (tokenCount < modelMeta.compactAt) {
+    return messages;
+  }
+  console.log(
+    `[Compaction] Triggered: ~${tokenCount} tokens exceeds threshold ${modelMeta.compactAt}`
+  );
+  eventBus.emitEvent("compact:triggered", { tokenCount, threshold: modelMeta.compactAt });
+  // Step 1: Identify protected messages (system prompt + last 3 exchanges)
+  const systemMsg = messages[0]; // always protect system prompt
+  const recentCount = 6; // last 3 user+assistant pairs
+  const recentMessages = messages.slice(-recentCount);
+  const oldMessages = messages.slice(1, -recentCount);
+  if (oldMessages.length === 0) {
+    // Nothing to compact — all messages are recent
+    return messages;
+  }
+  // Step 2: Prune verbose tool outputs in old messages
+  // Tool output arrives in two shapes: role "developer"/"tool" messages, and
+  // the role "user" JSON envelopes ({"tool_name":...,"params":...,"output":...})
+  // that the agent loop appends after each tool call. Checking the role alone
+  // misses the second shape, so the envelope prefix is checked as well.
+  const toolEnvelopePrefix = '{"tool_name":';
+  const isToolOutput = (msg) =>
+    msg.role === "developer" ||
+    msg.role === "tool" ||
+    (msg.role === "user" &&
+      typeof msg.content === "string" &&
+      msg.content.startsWith(toolEnvelopePrefix));
+  const prunedOld = oldMessages.map((msg, i) => {
+    if (isToolOutput(msg)) {
+      const content = typeof msg.content === "string" ? msg.content : JSON.stringify(msg.content);
+      if (content.length > 50000) {
+        return { ...msg, content: persistLargeOutput(content, taskId, i) };
+      }
+      if (content.length > 5000) {
+        return { ...msg, content: pruneToolOutput(content) };
+      }
+    }
+    return msg;
+  });
+  // Step 3: Summarize old messages using a cheap model
+  try {
+    const { model } = getCheapModel();
+    // Each message contributes at most 2000 chars to the summarization prompt
+    const summaryPrompt = `Summarize the following conversation history concisely. Preserve:
+- Key decisions made
+- File paths mentioned and their purpose
+- Task progress and what was accomplished
+- Any errors encountered and how they were resolved
+- User preferences or instructions
+Conversation to summarize:
+${prunedOld.map((m) => `[${m.role}]: ${typeof m.content === "string" ? m.content.slice(0, 2000) : JSON.stringify(m.content).slice(0, 2000)}`).join("\n")}`;
+    const { text: summary } = await generateText({
+      model,
+      messages: [{ role: "user", content: summaryPrompt }],
+      maxTokens: 1000,
+    });
+    // NOTE(review): the summary is injected with role "developer" — confirm
+    // that the message schema of the model SDK in use accepts this role.
+    const compactedMessages = [
+      systemMsg,
+      {
+        role: "developer",
+        content: `<conversation-summary>\nThe following is a summary of earlier conversation that was compacted to save context space:\n\n${summary}\n</conversation-summary>`,
+      },
+      ...recentMessages,
+    ];
+    const newTokenCount = estimateTokens(compactedMessages);
+    console.log(
+      `[Compaction] Done: ${tokenCount} → ~${newTokenCount} tokens (saved ~${tokenCount - newTokenCount})`
+    );
+    return compactedMessages;
+  } catch (error) {
+    console.log(`[Compaction] Summarization failed: ${error.message}. Falling back to pruning only.`);
+    // Fallback: just prune tool outputs without summarization
+    return [systemMsg, ...prunedOld, ...recentMessages];
+  }
+}