npm - tsunami-code - Versions diffs - 2.8.0 → 3.0.0 - Mend

tsunami-code 2.8.0 → 3.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (5) hide show

package/index.js CHANGED Viewed

@@ -4,7 +4,8 @@ import chalk from 'chalk';
 import { existsSync, readFileSync, writeFileSync, mkdirSync } from 'fs';
 import { join } from 'path';
 import os from 'os';
-import { agentLoop, quickCompletion, setModel, getModel } from './lib/loop.js';
+import { agentLoop, quickCompletion, setModel, getModel, tokenStats } from './lib/loop.js';
+import { injectServerContext } from './lib/tools.js';
 import { buildSystemPrompt } from './lib/prompt.js';
 import { runPreflight, checkServer } from './lib/preflight.js';
 import { setSession, undo, undoStackSize } from './lib/tools.js';
@@ -20,7 +21,7 @@ import {
   getSessionContext
 } from './lib/memory.js';
-const VERSION = '2.8.0';
+const VERSION = '3.0.0';
 const CONFIG_DIR = join(os.homedir(), '.tsunami-code');
 const CONFIG_FILE = join(CONFIG_DIR, 'config.json');
 const DEFAULT_SERVER = 'https://radiometric-reita-amuck.ngrok-free.dev';
@@ -131,7 +132,7 @@ if (setServerIdx !== -1 && argv[setServerIdx + 1]) {
 // ── Confirm Callback (dangerous command prompt) ─────────────────────────────
 function makeConfirmCallback(rl) {
-  return async (cmd) => {
+  const cb = async (cmd) => {
     return new Promise((resolve) => {
       rl.pause();
       process.stdout.write(`\n  ${yellow('⚠  Dangerous:')} ${dim(cmd.slice(0, 120))}\n`);
@@ -145,6 +146,20 @@ function makeConfirmCallback(rl) {
       process.stdin.once('data', handler);
     });
   };
+  cb._askUser = (question, resolve) => {
+    rl.pause();
+    process.stdout.write(`\n  ${cyan('?')} ${question}\n  ${dim('> ')}`);
+    const handler = (data) => {
+      process.stdin.removeListener('data', handler);
+      rl.resume();
+      process.stdout.write('\n');
+      resolve(data.toString().trim());
+    };
+    process.stdin.once('data', handler);
+  };
+  return cb;
 }
 // ── Main ──────────────────────────────────────────────────────────────────────
@@ -158,8 +173,31 @@ async function run() {
   initProjectMemory(cwd);
   setSession({ sessionDir, cwd });
+  // Inject server context into AgentTool
+  injectServerContext(serverUrl, buildSystemPrompt());
   printBanner(serverUrl);
+  // Persistent history — load previous commands
+  const HISTORY_FILE = join(CONFIG_DIR, 'history.jsonl');
+  function appendHistory(line) {
+    try {
+      const entry = JSON.stringify({ cmd: line, ts: Date.now(), cwd }) + '\n';
+      import('fs').then(({ appendFileSync }) => { try { appendFileSync(HISTORY_FILE, entry, 'utf8'); } catch {} });
+    } catch {}
+  }
+  function loadHistory() {
+    try {
+      if (!existsSync(HISTORY_FILE)) return [];
+      return readFileSync(HISTORY_FILE, 'utf8')
+        .trim().split('\n').filter(Boolean)
+        .map(l => { try { return JSON.parse(l).cmd; } catch { return null; } })
+        .filter(Boolean).reverse().slice(0, 200);
+    } catch { return []; }
+  }
+  const historyEntries = loadHistory();
+  let historyIdx = -1;
   // Preflight checks
   process.stdout.write(dim('  Checking server connection...'));
   const { errors, warnings } = await runPreflight(serverUrl);
@@ -342,10 +380,28 @@ async function run() {
     console.log(red(`  Unknown memory subcommand: ${sub}\n  Try: /memory, /memory files, /memory view <file>, /memory clear\n`));
   }
+  /* Frustration detection — from leaked userPromptKeywords.ts pattern.
+   * Heuristic patterns; detectFrustration() reports true as soon as any one of them matches.
+   * None of the regexes carries the g or y flag, so test() keeps no state between calls.
+   * NOTE(review): several alternatives are everyday words ("again", "wrong", "stop", "broken"),
+   * so a neutral request such as "run the tests again" is flagged too — confirm that is intended.
+   */
+  const FRUSTRATION_PATTERNS = [
+    /\b(wtf|fuck|shit|damn|idiot|stupid|useless|broken|wrong|garbage|trash|terrible|awful|hate)\b/i, // profanity and negative judgements
+    /\b(not working|still broken|still wrong|same error|again|ugh|argh)\b/i, // repeated-failure phrases
+    /!{2,}/, // two or more consecutive exclamation marks
+    /\b(why (would|did|is|are|does|do) you|you (keep|always|never|can't|cannot|won't|don't))\b/i, // complaints addressed to the assistant
+    /\b(i (said|told|asked)|stop|listen|pay attention)\b/i // the user repeating an instruction
+  ];
+  function detectFrustration(text) { // text: the trimmed input line; returns a boolean
+    return FRUSTRATION_PATTERNS.some(p => p.test(text));
+  }
   rl.on('line', async (input) => {
     const line = input.trim();
     if (!line) { rl.prompt(); return; }
+    // Append to persistent history
+    if (!line.startsWith('/')) {
+      appendHistory(line);
+      historyIdx = -1;
+    }
     if (line.startsWith('/')) {
       const parts = line.slice(1).split(' ');
       const cmd = parts[0].toLowerCase();
@@ -370,6 +426,7 @@ async function run() {
               ['/status',          'Show context size and server'],
               ['/server <url>',    'Change model server URL'],
               ['/model [name]',    'Show or change active model (default: local)'],
+              ['/history',         'Show recent command history'],
               ['/exit',            'Exit'],
             ];
             for (const [c, desc] of cmds) {
@@ -416,13 +473,22 @@ async function run() {
           console.log(dim(`  CWD     : ${cwd}\n`));
           break;
         }
-        case 'cost':
-          console.log(blue('\n  Session Token Estimate'));
-          console.log(dim(`  Input  : ~${_inputTokens.toLocaleString()}`));
-          console.log(dim(`  Output : ~${_outputTokens.toLocaleString()}`));
-          console.log(dim(`  Total  : ~${(_inputTokens + _outputTokens).toLocaleString()}`));
-          console.log(dim('  (Estimates only)\n'));
+        case 'cost': {
+          const hasReal = tokenStats.requests > 0;
+          console.log(blue('\n  Session Token Usage'));
+          if (hasReal) {
+            console.log(dim(`  Input  : ${tokenStats.input.toLocaleString()} tokens (actual)`));
+            console.log(dim(`  Output : ${tokenStats.output.toLocaleString()} tokens (actual)`));
+            console.log(dim(`  Total  : ${(tokenStats.input + tokenStats.output).toLocaleString()} tokens`));
+            console.log(dim(`  Requests: ${tokenStats.requests}`));
+          } else {
+            console.log(dim(`  Input  : ~${_inputTokens.toLocaleString()} (estimated)`));
+            console.log(dim(`  Output : ~${_outputTokens.toLocaleString()} (estimated)`));
+            console.log(dim(`  Total  : ~${(_inputTokens + _outputTokens).toLocaleString()} (estimated)`));
+          }
+          console.log();
           break;
+        }
         case 'clear':
           resetSession();
           console.log(green('  Session cleared.\n'));
@@ -449,6 +515,14 @@ async function run() {
         case 'memory':
           await handleMemoryCommand(rest);
           break;
+        case 'history': {
+          const recent = historyEntries.slice(0, 20);
+          if (recent.length === 0) { console.log(dim('  No history yet.\n')); break; }
+          console.log(blue(`\n  Recent commands (${recent.length}):`));
+          recent.forEach((h, i) => console.log(dim(`  ${String(i + 1).padStart(2)}  ${h.slice(0, 100)}`)));
+          console.log();
+          break;
+        }
         case 'exit': case 'quit':
           gracefulExit(0);
           return;
@@ -465,6 +539,11 @@ async function run() {
       userContent = `[Previous session summary]\n${lastSessionSummary}\n\n---\n\n${line}`;
     }
+    // Frustration injection — tell the model to acknowledge and course-correct
+    if (detectFrustration(line)) {
+      userContent += '\n\n[system: User appears frustrated. Acknowledge the issue directly, do not repeat the same approach. Be concise and action-focused.]';
+    }
     const fullMessages = [
       { role: 'system', content: systemPrompt },
       ...messages,

package/lib/loop.js CHANGED Viewed

@@ -1,5 +1,5 @@
 import fetch from 'node-fetch';
-import { ALL_TOOLS } from './tools.js';
+import { ALL_TOOLS, injectAgentLoop, injectServerContext } from './tools.js';
 import {
   assembleContext,
   extractFilePaths,
@@ -29,6 +29,9 @@ function isDangerous(cmd) {
 // Skip waitForServer after first successful connection
 let _serverVerified = false;
+/* Real token tracking from API responses.
+ * input / output accumulate the usage.prompt_tokens / usage.completion_tokens values read while
+ * streaming a completion, and requests counts the responses that carried a usage field.
+ * Exported as a single mutable object, so every importer reads the same running totals.
+ */
+export const tokenStats = { input: 0, output: 0, requests: 0 };
 // Current model identifier — changeable at runtime via /model command
 let _currentModel = 'local';
 export function setModel(model) { _currentModel = model; }
@@ -234,6 +237,12 @@ async function streamCompletion(serverUrl, messages, onToken, memoryContext = ''
         fullContent += token;
         onToken(token);
       }
+      // Capture real token counts from usage field (sent on final chunk by llama.cpp)
+      if (parsed.usage) {
+        tokenStats.input += parsed.usage.prompt_tokens || 0;
+        tokenStats.output += parsed.usage.completion_tokens || 0;
+        tokenStats.requests++;
+      }
     }
   }
@@ -278,6 +287,12 @@ export async function quickCompletion(serverUrl, systemPrompt, userMessage) {
   }
 }
+// Self-register into tools.js so AgentTool can call back into us
+/* (done here at module load time to avoid circular import at parse time)
+ * agentLoop is a function declaration further down in this module, so it is already defined when
+ * the callback runs.
+ * NOTE(review): this file's static import line also pulls injectAgentLoop from './tools.js', which
+ * makes the dynamic import look redundant — confirm whether a real import cycle exists before
+ * simplifying.
+ * NOTE(review): a failed import is swallowed here; AgentTool then answers "not initialized" when
+ * it is called.
+ */
+import('./tools.js').then(m => {
+  m.injectAgentLoop(agentLoop);
+}).catch(() => {});
 export async function agentLoop(serverUrl, messages, onToken, onToolCall, sessionInfo = null, confirmCallback = null, maxIterations = 15) {
   const lastUserMsg = [...messages].reverse().find(m => m.role === 'user');
   const currentTask = typeof lastUserMsg?.content === 'string' ? lastUserMsg.content : '';
@@ -317,6 +332,20 @@ export async function agentLoop(serverUrl, messages, onToken, onToolCall, sessio
         continue;
       }
+      // AskUser: intercept and surface the question to the user
+      if (tc.name === 'AskUser' && confirmCallback) {
+        const parsed = typeof tc.arguments === 'string' ? JSON.parse(tc.arguments) : tc.arguments;
+        const normalized = normalizeArgs(parsed);
+        onToolCall(tc.name, typeof tc.arguments === 'string' ? tc.arguments : JSON.stringify(tc.arguments));
+        // Reuse confirmCallback channel but pass question back as answer
+        const answer = await new Promise(resolve => confirmCallback._askUser
+          ? confirmCallback._askUser(normalized.question, resolve)
+          : resolve('[No answer provided]')
+        );
+        results.push(`[AskUser result]\nUser answered: ${answer}`);
+        continue;
+      }
       // Dangerous command confirmation
       if (tc.name === 'Bash' && confirmCallback) {
         const parsed = typeof tc.arguments === 'string' ? JSON.parse(tc.arguments) : tc.arguments;
@@ -333,7 +362,26 @@ export async function agentLoop(serverUrl, messages, onToken, onToolCall, sessio
       onToolCall(tc.name, typeof tc.arguments === 'string' ? tc.arguments : JSON.stringify(tc.arguments));
       const result = await runTool(tc.name, tc.arguments, sessionInfo, sessionFiles);
-      results.push(`[${tc.name} result]\n${String(result).slice(0, 8000)}`);
+      const resultStr = String(result);
+      // Handle Snip signal — surgically remove message indices from context
+      if (tc.name === 'Snip') {
+        try {
+          const sig = JSON.parse(resultStr);
+          if (sig.__snip__ && Array.isArray(sig.indices)) {
+            const toRemove = new Set(sig.indices.map(Number));
+            // messages[0] is taken to be the system prompt and is always kept; sig.indices are 0-based positions counted after it (index k refers to messages[k + 1])
+            const kept = messages.filter((_, i) => i === 0 || !toRemove.has(i - 1));
+            const removed = messages.length - kept.length;
+            messages.length = 0;
+            kept.forEach(m => messages.push(m));
+            results.push(`[Snip result]\nRemoved ${removed} messages from context. Reason: ${sig.reason}`);
+            continue;
+          }
+        } catch {}
+      }
+      results.push(`[${tc.name} result]\n${resultStr.slice(0, 8000)}`);
     }
     messages.push({

package/lib/prompt.js CHANGED Viewed

@@ -1,6 +1,21 @@
 import { existsSync, readFileSync } from 'fs';
 import { join } from 'path';
 import os from 'os';
+import { execSync } from 'child_process';
+function getGitContext() {
+  try {
+    const branch = execSync('git rev-parse --abbrev-ref HEAD', { stdio: ['ignore', 'pipe', 'ignore'] }).toString().trim();
+    const status = execSync('git status --short', { stdio: ['ignore', 'pipe', 'ignore'] }).toString().trim();
+    const log = execSync('git log --oneline -5', { stdio: ['ignore', 'pipe', 'ignore'] }).toString().trim();
+    const parts = [`Branch: ${branch}`];
+    if (status) parts.push(`Changed files:\n${status}`);
+    if (log) parts.push(`Recent commits:\n${log}`);
+    return `\n\n<git>\n${parts.join('\n\n')}\n</git>`;
+  } catch {
+    return '';
+  }
+}
 function loadContextFile() {
   const locations = [
@@ -23,6 +38,8 @@ export function buildSystemPrompt(memoryContext = '') {
   const cwd = process.cwd();
   const context = loadContextFile();
+  const gitContext = getGitContext();
   return `You are an expert software engineer and technical assistant operating as a CLI agent. You think deeply before acting, trace data flow before changing code, and verify your work.
 To use a tool, output ONLY this format — nothing else before or after the tool call block:
@@ -38,7 +55,7 @@ Available tools: Bash, Read, Write, Edit, Glob, Grep, Note, Checkpoint. Use them
 - Platform: ${process.platform}
 - Shell: ${process.platform === 'win32' ? 'cmd/powershell' : 'bash'}
 - Date: ${new Date().toISOString().split('T')[0]}
-</environment>
+</environment>${gitContext}
 <tools>
 - **Bash**: Run shell commands. Never use for grep/find/cat — use dedicated tools.
@@ -49,6 +66,13 @@ Available tools: Bash, Read, Write, Edit, Glob, Grep, Note, Checkpoint. Use them
 - **Grep**: Search file contents by regex. Always use instead of grep in Bash.
 - **Note**: Save a permanent discovery to project memory (.tsunami/). Use liberally for traps, patterns, architectural decisions.
 - **Checkpoint**: Save current task progress to session memory so work is resumable if the session ends.
+- **WebFetch**: Fetch any URL and get the page content as text. Use for docs, GitHub files, APIs.
+- **WebSearch**: Search the web via DuckDuckGo. Returns titles, URLs, snippets. Follow up with WebFetch.
+- **TodoWrite**: Manage a persistent task list (add/complete/delete/list). Use for any multi-step task.
+- **AskUser**: Ask the user a clarifying question when genuinely blocked. Use sparingly.
+- **Agent**: Spawn a sub-agent to handle an independent task. Call multiple times in one response for parallel execution.
+- **Snip**: Surgically remove specific messages from context to free space without losing everything.
+- **Brief**: Write a working-memory note to yourself. Injected into next turn — ensures nothing is forgotten on long tasks.
 </tools>
 <reasoning_protocol>

package/lib/tools.js CHANGED Viewed

@@ -4,6 +4,7 @@ import { glob } from 'glob';
 import { promisify } from 'util';
 import { getRgPath } from './preflight.js';
 import { addFileNote, updateContext, appendDecision } from './memory.js';
+import fetch from 'node-fetch';
 const execAsync = promisify(exec);
@@ -324,4 +325,327 @@ EXAMPLE:
   }
 };
-export const ALL_TOOLS = [BashTool, ReadTool, WriteTool, EditTool, GlobTool, GrepTool, NoteTool, CheckpointTool];
+// ── WEB FETCH ─────────────────────────────────────────────────────────────────
+export const WebFetchTool = {
+  name: 'WebFetch',
+  description: `Fetches content from a URL and returns it as text. Use for reading documentation, API references, GitHub files, or any web resource needed to complete a task.
+- Returns page content as plain text (HTML stripped)
+- Max ~50KB returned; large pages are truncated
+- Do not use for downloading binaries`,
+  input_schema: {
+    type: 'object',
+    properties: {
+      url: { type: 'string', description: 'The URL to fetch' },
+      prompt: { type: 'string', description: 'What to extract or summarize from the page (optional — returns raw text if omitted)' }
+    },
+    required: ['url']
+  },
+  async run({ url, prompt: _prompt }) {
+    try {
+      const controller = new AbortController();
+      const timer = setTimeout(() => controller.abort(), 15000);
+      const res = await fetch(url, {
+        signal: controller.signal,
+        headers: { 'User-Agent': 'Mozilla/5.0 (compatible; TsunamiCode/2.9)' }
+      });
+      clearTimeout(timer);
+      if (!res.ok) return `Error: HTTP ${res.status} ${res.statusText}`;
+      const raw = await res.text();
+      // Strip HTML tags, collapse whitespace
+      const text = raw
+        .replace(/<script[\s\S]*?<\/script>/gi, '')
+        .replace(/<style[\s\S]*?<\/style>/gi, '')
+        .replace(/<[^>]+>/g, ' ')
+        .replace(/&nbsp;/g, ' ')
+        .replace(/&amp;/g, '&')
+        .replace(/&lt;/g, '<')
+        .replace(/&gt;/g, '>')
+        .replace(/&quot;/g, '"')
+        .replace(/\s{3,}/g, '\n\n')
+        .trim();
+      return text.slice(0, 50000) + (text.length > 50000 ? '\n\n[truncated]' : '');
+    } catch (e) {
+      if (e.name === 'AbortError') return 'Error: Request timed out after 15s';
+      return `Error fetching URL: ${e.message}`;
+    }
+  }
+};
+// ── TODO WRITE ────────────────────────────────────────────────────────────────
+/* In-memory todo list — persists for the session, visible to the model.
+ * _todos holds { id, text, status } records and _todoId is the last id handed out; ids only grow,
+ * so a deleted id is never reused. Both live at module level and nothing here writes them to disk.
+ * run() returns either an "Error: …" string or the rendered list, one line per todo.
+ * NOTE(review): the description asks the model to mark items in_progress, yet the only path to that
+ * state is op "complete" with status "in_progress"; status is stored without validation.
+ * NOTE(review): ids are matched with ===, so an id that arrives as the string "2" finds nothing —
+ * confirm that arguments are normalized to numbers before they reach run().
+ */
+const _todos = [];
+let _todoId = 0;
+export const TodoWriteTool = {
+  name: 'TodoWrite',
+  description: `Manage a persistent task list for the current session. Use this to track multi-step work so nothing gets lost.
+Operations:
+- add: Add a new todo item
+- complete: Mark a todo as done (by id)
+- delete: Remove a todo (by id)
+- list: Show all todos (also happens automatically)
+WHEN TO USE:
+- Any task with 3+ steps — create the list upfront
+- After completing a step — mark it done immediately
+- When starting work on a step — mark it in_progress
+The list is shown to the user after every update.`,
+  input_schema: {
+    type: 'object',
+    properties: {
+      op: { type: 'string', enum: ['add', 'complete', 'delete', 'list'], description: 'Operation to perform' },
+      text: { type: 'string', description: 'Todo text (for add)' },
+      id: { type: 'number', description: 'Todo ID (for complete/delete)' },
+      status: { type: 'string', enum: ['pending', 'in_progress', 'done'], description: 'Status for complete op (default: done)' }
+    },
+    required: ['op']
+  },
+  async run({ op, text, id, status = 'done' }) {
+    if (op === 'add') {
+      if (!text) return 'Error: text required for add';
+      _todoId++;
+      _todos.push({ id: _todoId, text, status: 'pending' }); // new items always start as pending
+    } else if (op === 'complete') {
+      const todo = _todos.find(t => t.id === id);
+      if (!todo) return `Error: todo #${id} not found`;
+      todo.status = status; // "complete" sets whatever status was passed, not only 'done'
+    } else if (op === 'delete') {
+      const idx = _todos.findIndex(t => t.id === id);
+      if (idx === -1) return `Error: todo #${id} not found`;
+      _todos.splice(idx, 1);
+    }
+    // Always return current list — 'list' and any unrecognized op fall through to here unchanged
+    if (_todos.length === 0) return 'Todo list is empty.';
+    const icons = { pending: '○', in_progress: '◉', done: '✓' };
+    return _todos.map(t => `${icons[t.status] || '○'} [${t.id}] ${t.text}`).join('\n'); // an unknown status renders as pending
+  }
+};
+// ── ASK USER ──────────────────────────────────────────────────────────────────
+/* This tool is a signal — agentLoop in lib/loop.js intercepts the call and prompts the user.
+ * The interception only happens when the loop was given a confirm callback; the prompt itself is
+ * that callback's _askUser hook, which index.js attaches in makeConfirmCallback. Without a
+ * callback (sub-agents started by AgentTool pass null) the call reaches run() below instead.
+ */
+export const AskUserTool = {
+  name: 'AskUser',
+  description: `Ask the user a clarifying question and wait for their answer. Use this when you are genuinely blocked and need input that cannot be inferred.
+Only use when:
+- Multiple valid approaches exist with meaningfully different outcomes
+- Required information cannot be found in the codebase, env, or context
+- A destructive or irreversible action needs explicit confirmation
+Do NOT use for:
+- Things you can infer from context
+- Choices that don't materially affect the outcome
+- Asking if you should proceed (just proceed)`,
+  input_schema: {
+    type: 'object',
+    properties: {
+      question: { type: 'string', description: 'The question to ask the user' }
+    },
+    required: ['question']
+  },
+  async run({ question }) {
+    // Fallback only: reached when the agent loop did not intercept the call.
+    // No user input is collected here; the question is returned with an [AskUser] prefix.
+    return `[AskUser] ${question}`;
+  }
+};
+// ── WEB SEARCH ────────────────────────────────────────────────────────────────
+export const WebSearchTool = {
+  name: 'WebSearch',
+  description: `Search the web and return results. Use when you need current information, documentation, error solutions, or anything not in the codebase.
+Returns titles, URLs, and snippets for the top results. Follow up with WebFetch on a specific result to get the full content.`,
+  input_schema: {
+    type: 'object',
+    properties: {
+      query: { type: 'string', description: 'Search query' },
+      num_results: { type: 'number', description: 'Number of results to return (default 8, max 20)' }
+    },
+    required: ['query']
+  },
+  async run({ query, num_results = 8 }) {
+    try {
+      const n = Math.min(num_results, 20);
+      const url = `https://html.duckduckgo.com/html/?q=${encodeURIComponent(query)}`;
+      const controller = new AbortController();
+      const timer = setTimeout(() => controller.abort(), 12000);
+      const res = await fetch(url, {
+        signal: controller.signal,
+        headers: {
+          'User-Agent': 'Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36',
+          'Accept': 'text/html'
+        }
+      });
+      clearTimeout(timer);
+      if (!res.ok) return `Error: HTTP ${res.status}`;
+      const html = await res.text();
+      // Parse results from DuckDuckGo HTML
+      const results = [];
+      const resultBlocks = html.match(/<div class="result[^"]*"[\s\S]*?<\/div>\s*<\/div>/g) || [];
+      for (const block of resultBlocks.slice(0, n)) {
+        const titleMatch = block.match(/<a[^>]+class="result__a"[^>]*>([\s\S]*?)<\/a>/);
+        const urlMatch = block.match(/href="([^"]+)"/);
+        const snippetMatch = block.match(/<a[^>]+class="result__snippet"[^>]*>([\s\S]*?)<\/a>/);
+        const title = titleMatch ? titleMatch[1].replace(/<[^>]+>/g, '').trim() : '';
+        const href = urlMatch ? urlMatch[1] : '';
+        const snippet = snippetMatch ? snippetMatch[1].replace(/<[^>]+>/g, '').trim() : '';
+        // DuckDuckGo uses redirect URLs — extract the actual URL
+        const actualUrl = href.includes('uddg=')
+          ? decodeURIComponent(href.match(/uddg=([^&]+)/)?.[1] || href)
+          : href;
+        if (title && actualUrl) {
+          results.push(`${results.length + 1}. ${title}\n   ${actualUrl}\n   ${snippet}`);
+        }
+      }
+      if (results.length === 0) return `No results found for: ${query}`;
+      return `Search results for "${query}":\n\n${results.join('\n\n')}`;
+    } catch (e) {
+      if (e.name === 'AbortError') return 'Error: Search timed out';
+      return `Error: ${e.message}`;
+    }
+  }
+};
+// ── AGENT TOOL ────────────────────────────────────────────────────────────────
+// Circular import prevention — agentLoop is injected at runtime by loop.js
+let _agentLoopRef = null;
+export function injectAgentLoop(fn) { _agentLoopRef = fn; }
+export const AgentTool = {
+  name: 'Agent',
+  description: `Launch a sub-agent to handle an independent task in parallel. The sub-agent has access to all the same tools (Bash, Read, Write, Edit, Glob, Grep, WebFetch, WebSearch, etc.) and works autonomously until done.
+USE THIS FOR:
+- Independent subtasks that don't depend on each other (run multiple Agents in one response)
+- Long-running research tasks you don't want in the main context
+- Isolated operations (e.g. "analyze file A" + "analyze file B" simultaneously)
+The agent returns a summary of what it did and what it found. Keep the task description specific and self-contained — the sub-agent has no knowledge of the current conversation.
+IMPORTANT: You can call Agent multiple times in one response to run tasks truly in parallel.`,
+  input_schema: {
+    type: 'object',
+    properties: {
+      task: { type: 'string', description: 'Complete, self-contained task description for the sub-agent' },
+      serverUrl: { type: 'string', description: 'Override server URL (optional)' }
+    },
+    required: ['task']
+  },
+  async run({ task, serverUrl }) {
+    if (!_agentLoopRef) return 'Error: AgentTool not initialized (no agent loop reference)';
+    if (!_currentServerUrl) return 'Error: AgentTool not initialized (no server URL)';
+    const url = serverUrl || _currentServerUrl;
+    const subMessages = [
+      { role: 'system', content: _agentSystemPrompt || 'You are a capable software engineering sub-agent. Complete the given task fully and return a summary of what you did.' },
+      { role: 'user', content: task }
+    ];
+    const outputTokens = [];
+    let done = false;
+    try {
+      await _agentLoopRef(
+        url,
+        subMessages,
+        (token) => { outputTokens.push(token); },
+        () => {}, // tool call display — silent in sub-agent
+        null, // no session info for sub-agents
+        null, // no confirm callback
+        10    // max iterations
+      );
+      done = true;
+    } catch (e) {
+      return `Sub-agent error: ${e.message}`;
+    }
+    // Find the last assistant message as the result
+    const lastAssistant = [...subMessages].reverse().find(m => m.role === 'assistant');
+    const result = lastAssistant?.content || outputTokens.join('');
+    return `[Sub-agent result]\n${String(result).slice(0, 6000)}`;
+  }
+};
+/* Server URL + system prompt that AgentTool uses for sub-agents.
+ * Both stay null until injectServerContext() is called; index.js does that from run() at startup,
+ * passing the server URL and the result of buildSystemPrompt(). AgentTool reads them at call
+ * time, so declaring them after the tool object is fine.
+ */
+let _currentServerUrl = null;
+let _agentSystemPrompt = null;
+export function injectServerContext(serverUrl, systemPrompt) { // overwrites both values on every call
+  _currentServerUrl = serverUrl;
+  _agentSystemPrompt = systemPrompt;
+}
+// ── SNIP TOOL ─────────────────────────────────────────────────────────────────
+// The model calls this to surgically remove specific turns from context
+/* loop.js handles the actual splice — this is a signal tool.
+ * run() only serializes the request as { __snip__: true, indices, reason }. agentLoop parses that
+ * string, removes the matching entries from its messages array in place (element 0 is always
+ * kept, index k refers to element k + 1) and reports how many were removed.
+ */
+export const SnipTool = {
+  name: 'Snip',
+  description: `Remove specific conversation turns from context to free up space, without losing the whole conversation like /compact does.
+Use when:
+- A specific tool result was very large and is no longer needed (e.g. a full file read you've already processed)
+- An early exploration phase produced lots of output that's no longer relevant
+- You want to keep recent context but drop stale earlier parts
+The 'indices' are 0-based positions in the conversation (0 = first user message after system prompt).
+Use /status to see current message count, then pick which to snip.`,
+  input_schema: {
+    type: 'object',
+    properties: {
+      indices: {
+        type: 'array',
+        items: { type: 'number' },
+        description: 'Array of 0-based message indices to remove from context'
+      },
+      reason: { type: 'string', description: 'Why you are snipping these (logged for transparency)' }
+    },
+    required: ['indices']
+  },
+  async run({ indices, reason }) {
+    // Actual snipping happens in agentLoop — this signals intent; reason defaults to 'context management'
+    return JSON.stringify({ __snip__: true, indices, reason: reason || 'context management' });
+  }
+};
+/* ── BRIEF TOOL ────────────────────────────────────────────────────────────────
+ * Stores a working-memory note through updateContext() (imported from memory.js), prefixed with a
+ * [BRIEF] header. run() never throws: it returns a status string in every case, including when
+ * no session directory is set and when the write fails.
+ * NOTE(review): _sessionDir is not defined in the part of the file shown here — presumably it is
+ * set by setSession(); confirm.
+ * NOTE(review): the description says the note is injected into the next turn; that depends on
+ * how the session context is read back, which this block does not show.
+ */
+export const BriefTool = {
+  name: 'Brief',
+  description: `Write a self-briefing note to yourself about the current task state. This gets injected into context on the next turn, ensuring nothing is forgotten even if context is trimmed.
+Use after major milestones in long tasks. Different from Checkpoint — Brief is for your own working memory, not user-visible progress.
+Example:
+  Brief({ content: "Working on auth refactor. Done: DB schema updated, sessions table migrated. Current: updating login route. Not done: logout, password reset. Key discovery: sessions table uses TEXT not UUID for user_id — do not cast." })`,
+  input_schema: {
+    type: 'object',
+    properties: {
+      content: { type: 'string', description: 'Your working memory note — what you know, what is done, what is next, what to watch out for' }
+    },
+    required: ['content']
+  },
+  async run({ content }) {
+    try {
+      if (!_sessionDir) return 'Brief recorded (no session initialized)'; // nothing is written in this case
+      // Reuse checkpoint mechanism — both go to session context
+      updateContext(_sessionDir, `[BRIEF]\n${content}`);
+      return 'Brief saved to working memory.';
+    } catch (e) {
+      return `Brief recorded (write failed: ${e.message})`; // the failure is reported, not rethrown
+    }
+  }
+};
+export const ALL_TOOLS = [ // every tool object this module exports; loop.js imports this list
+  BashTool, ReadTool, WriteTool, EditTool, GlobTool, GrepTool, // shell, file and search tools
+  NoteTool, CheckpointTool, // project and session memory
+  WebFetchTool, WebSearchTool, // network access
+  TodoWriteTool, AskUserTool, // task list and user interaction
+  AgentTool, SnipTool, BriefTool // sub-agents and context management
+];

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "tsunami-code",
-  "version": "2.8.0",
+  "version": "3.0.0",
   "description": "Tsunami Code CLI — AI coding agent by Keystone World Management Navy Seal Unit XI3",
   "type": "module",
   "bin": {