npm - @hasna/terminal - Versions diffs - 2.3.2 → 3.1.0 - Mend

@hasna/terminal 2.3.2 → 3.1.0

This diff compares the contents of two publicly available versions of a package, as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in the public registry.

Files changed (50)

package/dist/ai.js +78 -85
package/dist/cache.js +3 -2
package/dist/cli.js +1 -1
package/dist/compression.js +8 -30
package/dist/context-hints.js +20 -10
package/dist/diff-cache.js +1 -1
package/dist/discover.js +1 -1
package/dist/economy.js +37 -5
package/dist/expand-store.js +7 -1
package/dist/mcp/server.js +44 -68
package/dist/output-processor.js +10 -7
package/dist/providers/anthropic.js +6 -2
package/dist/providers/cerebras.js +6 -93
package/dist/providers/groq.js +6 -93
package/dist/providers/index.js +85 -36
package/dist/providers/openai-compat.js +93 -0
package/dist/providers/xai.js +6 -93
package/dist/tokens.js +17 -0
package/dist/tool-profiles.js +9 -2
package/package.json +1 -1
package/src/ai.ts +83 -94
package/src/cache.ts +3 -2
package/src/cli.tsx +1 -1
package/src/compression.ts +8 -35
package/src/context-hints.ts +20 -10
package/src/diff-cache.ts +1 -1
package/src/discover.ts +1 -1
package/src/economy.ts +37 -5
package/src/expand-store.ts +8 -1
package/src/mcp/server.ts +45 -73
package/src/output-processor.ts +11 -8
package/src/providers/anthropic.ts +6 -2
package/src/providers/base.ts +2 -0
package/src/providers/cerebras.ts +6 -105
package/src/providers/groq.ts +6 -105
package/src/providers/index.ts +84 -33
package/src/providers/openai-compat.ts +109 -0
package/src/providers/xai.ts +6 -105
package/src/tokens.ts +18 -0
package/src/tool-profiles.ts +9 -2
package/src/compression.test.ts +0 -49
package/src/output-router.ts +0 -56
package/src/parsers/base.ts +0 -72
package/src/parsers/build.ts +0 -73
package/src/parsers/errors.ts +0 -107
package/src/parsers/files.ts +0 -91
package/src/parsers/git.ts +0 -101
package/src/parsers/index.ts +0 -66
package/src/parsers/parsers.test.ts +0 -153
package/src/parsers/tests.ts +0 -98

package/dist/providers/openai-compat.js ADDED

@@ -0,0 +1,93 @@
+// Shared base class for OpenAI-compatible providers (Cerebras, Groq, xAI)
+// Eliminates ~200 lines of duplicated streaming SSE parsing
+export class OpenAICompatibleProvider {
+    get apiKey() {
+        return process.env[this.apiKeyEnvVar] ?? "";
+    }
+    isAvailable() {
+        return !!process.env[this.apiKeyEnvVar];
+    }
+    async complete(prompt, options) {
+        const res = await fetch(`${this.baseUrl}/chat/completions`, {
+            method: "POST",
+            headers: {
+                "Content-Type": "application/json",
+                Authorization: `Bearer ${this.apiKey}`,
+            },
+            body: JSON.stringify({
+                model: options.model ?? this.defaultModel,
+                max_tokens: options.maxTokens ?? 256,
+                temperature: options.temperature ?? 0,
+                ...(options.stop ? { stop: options.stop } : {}),
+                messages: [
+                    { role: "system", content: options.system },
+                    { role: "user", content: prompt },
+                ],
+            }),
+        });
+        if (!res.ok) {
+            const text = await res.text();
+            throw new Error(`${this.name} API error ${res.status}: ${text}`);
+        }
+        const json = (await res.json());
+        return (json.choices?.[0]?.message?.content ?? "").trim();
+    }
+    async stream(prompt, options, callbacks) {
+        const res = await fetch(`${this.baseUrl}/chat/completions`, {
+            method: "POST",
+            headers: {
+                "Content-Type": "application/json",
+                Authorization: `Bearer ${this.apiKey}`,
+            },
+            body: JSON.stringify({
+                model: options.model ?? this.defaultModel,
+                max_tokens: options.maxTokens ?? 256,
+                temperature: options.temperature ?? 0,
+                stream: true,
+                ...(options.stop ? { stop: options.stop } : {}),
+                messages: [
+                    { role: "system", content: options.system },
+                    { role: "user", content: prompt },
+                ],
+            }),
+        });
+        if (!res.ok) {
+            const text = await res.text();
+            throw new Error(`${this.name} API error ${res.status}: ${text}`);
+        }
+        let result = "";
+        const reader = res.body?.getReader();
+        if (!reader)
+            throw new Error("No response body");
+        const decoder = new TextDecoder();
+        let buffer = "";
+        while (true) {
+            const { done, value } = await reader.read();
+            if (done)
+                break;
+            buffer += decoder.decode(value, { stream: true });
+            const lines = buffer.split("\n");
+            buffer = lines.pop() ?? "";
+            for (const line of lines) {
+                const trimmed = line.trim();
+                if (!trimmed.startsWith("data: "))
+                    continue;
+                const data = trimmed.slice(6);
+                if (data === "[DONE]")
+                    break;
+                try {
+                    const parsed = JSON.parse(data);
+                    const delta = parsed.choices?.[0]?.delta?.content;
+                    if (delta) {
+                        result += delta;
+                        callbacks.onToken(result.trim());
+                    }
+                }
+                catch {
+                    // skip malformed chunks
+                }
+            }
+        }
+        return result.trim();
+    }
+}

package/dist/providers/xai.js CHANGED

@@ -1,95 +1,8 @@
-// xAI/Grok provider — uses OpenAI-compatible API
-// grok-code-fast-1 for code tasks, grok-4-fast for general queries.
-const XAI_BASE_URL = "https://api.x.ai/v1";
-const DEFAULT_MODEL = "grok-code-fast-1";
-export class XaiProvider {
+// xAI/Grok provider — code-optimized models
+import { OpenAICompatibleProvider } from "./openai-compat.js";
+export class XaiProvider extends OpenAICompatibleProvider {
     name = "xai";
-    apiKey;
-    constructor() {
-        this.apiKey = process.env.XAI_API_KEY ?? "";
-    }
-    isAvailable() {
-        return !!process.env.XAI_API_KEY;
-    }
-    async complete(prompt, options) {
-        const model = options.model ?? DEFAULT_MODEL;
-        const res = await fetch(`${XAI_BASE_URL}/chat/completions`, {
-            method: "POST",
-            headers: {
-                "Content-Type": "application/json",
-                Authorization: `Bearer ${this.apiKey}`,
-            },
-            body: JSON.stringify({
-                model,
-                max_tokens: options.maxTokens ?? 256,
-                messages: [
-                    { role: "system", content: options.system },
-                    { role: "user", content: prompt },
-                ],
-            }),
-        });
-        if (!res.ok) {
-            const text = await res.text();
-            throw new Error(`xAI API error ${res.status}: ${text}`);
-        }
-        const json = (await res.json());
-        return (json.choices?.[0]?.message?.content ?? "").trim();
-    }
-    async stream(prompt, options, callbacks) {
-        const model = options.model ?? DEFAULT_MODEL;
-        const res = await fetch(`${XAI_BASE_URL}/chat/completions`, {
-            method: "POST",
-            headers: {
-                "Content-Type": "application/json",
-                Authorization: `Bearer ${this.apiKey}`,
-            },
-            body: JSON.stringify({
-                model,
-                max_tokens: options.maxTokens ?? 256,
-                stream: true,
-                messages: [
-                    { role: "system", content: options.system },
-                    { role: "user", content: prompt },
-                ],
-            }),
-        });
-        if (!res.ok) {
-            const text = await res.text();
-            throw new Error(`xAI API error ${res.status}: ${text}`);
-        }
-        let result = "";
-        const reader = res.body?.getReader();
-        if (!reader)
-            throw new Error("No response body");
-        const decoder = new TextDecoder();
-        let buffer = "";
-        while (true) {
-            const { done, value } = await reader.read();
-            if (done)
-                break;
-            buffer += decoder.decode(value, { stream: true });
-            const lines = buffer.split("\n");
-            buffer = lines.pop() ?? "";
-            for (const line of lines) {
-                const trimmed = line.trim();
-                if (!trimmed.startsWith("data: "))
-                    continue;
-                const data = trimmed.slice(6);
-                if (data === "[DONE]")
-                    break;
-                try {
-                    const parsed = JSON.parse(data);
-                    const delta = parsed.choices?.[0]?.delta?.content;
-                    if (delta) {
-                        result += delta;
-                        callbacks.onToken(result.trim());
-                    }
-                }
-                catch {
-                    // skip malformed chunks
-                }
-            }
-        }
-        return result.trim();
-    }
+    baseUrl = "https://api.x.ai/v1";
+    defaultModel = "grok-code-fast-1";
+    apiKeyEnvVar = "XAI_API_KEY";
 }

package/dist/tokens.js ADDED

@@ -0,0 +1,17 @@
+// Token estimation utility — shared across all modules
+// Uses content-aware heuristic: code/JSON averages ~3.3 chars/token,
+// English prose averages ~4.2 chars/token.
+/** Detect if content is primarily code/JSON vs English prose */
+function isCodeLike(text) {
+    // Count structural characters common in code/JSON
+    const structural = (text.match(/[{}[\]();:=<>,"'`|&\\/@#$%^*+~!?]/g) || []).length;
+    const ratio = structural / Math.max(text.length, 1);
+    return ratio > 0.08; // >8% structural chars = code-like
+}
+/** Estimate token count for a string with content-aware heuristic */
+export function estimateTokens(text) {
+    if (!text)
+        return 0;
+    const charsPerToken = isCodeLike(text) ? 3.3 : 4.2;
+    return Math.ceil(text.length / charsPerToken);
+}

package/dist/tool-profiles.js CHANGED

@@ -88,12 +88,19 @@ function loadUserProfiles() {
     catch { }
     return profiles;
 }
-/** Get all profiles — user profiles override builtins by name */
+/** Get all profiles — user profiles override builtins by name (cached 30s) */
+let _cachedProfiles = null;
+let _cachedProfilesAt = 0;
 export function getProfiles() {
+    const now = Date.now();
+    if (_cachedProfiles && now - _cachedProfilesAt < 30_000)
+        return _cachedProfiles;
     const user = loadUserProfiles();
     const userNames = new Set(user.map(p => p.name));
     const builtins = BUILTIN_PROFILES.filter(p => !userNames.has(p.name));
-    return [...user, ...builtins];
+    _cachedProfiles = [...user, ...builtins];
+    _cachedProfilesAt = now;
+    return _cachedProfiles;
 }
 /** Find the matching profile for a command */
 export function matchProfile(command) {

package/package.json CHANGED

@@ -1,6 +1,6 @@
 {
   "name": "@hasna/terminal",
-  "version": "2.3.2",
+  "version": "3.1.0",
   "description": "Smart terminal wrapper for AI agents and humans — structured output, token compression, MCP server, natural language",
   "type": "module",
   "files": [

package/src/ai.ts CHANGED

@@ -26,16 +26,25 @@ const MODEL_DEFAULTS: Record<string, { fast: string; smart: string }> = {
   anthropic: { fast: "claude-haiku-4-5-20251001",       smart: "claude-sonnet-4-6" },
 };
-/** Load user model overrides from ~/.terminal/config.json */
+/** Load user model overrides from ~/.terminal/config.json (cached 30s) */
+let _modelOverrides: Record<string, { fast?: string; smart?: string }> | null = null;
+let _modelOverridesAt = 0;
 function loadModelOverrides(): Record<string, { fast?: string; smart?: string }> {
+  const now = Date.now();
+  if (_modelOverrides && now - _modelOverridesAt < 30_000) return _modelOverrides;
   try {
     const configPath = join(process.env.HOME ?? "~", ".terminal", "config.json");
     if (existsSync(configPath)) {
       const config = JSON.parse(readFileSync(configPath, "utf8"));
-      return config.models ?? {};
+      _modelOverrides = config.models ?? {};
+      _modelOverridesAt = now;
+      return _modelOverrides!;
     }
   } catch {}
-  return {};
+  _modelOverrides = {};
+  _modelOverridesAt = now;
+  return _modelOverrides;
 }
 /** Model routing per provider — config-driven with defaults */
@@ -148,6 +157,8 @@ function detectProjectContext(): string {
 // ── system prompt ─────────────────────────────────────────────────────────────
 function buildSystemPrompt(perms: Permissions, sessionEntries: SessionEntry[], currentPrompt?: string): string {
+  const nl = currentPrompt?.toLowerCase() ?? "";
   const restrictions: string[] = [];
   if (!perms.destructive)
     restrictions.push("- NEVER generate commands that delete, remove, or overwrite files/data");
@@ -178,7 +189,6 @@ function buildSystemPrompt(perms: Permissions, sessionEntries: SessionEntry[], c
   const projectContext = detectProjectContext();
-  // Inject safety hints for the command being generated (AI sees what's risky)
   const safetyBlock = sessionEntries.length > 0
     ? (() => {
         const lastCmd = sessionEntries[sessionEntries.length - 1]?.cmd;
@@ -190,72 +200,53 @@ function buildSystemPrompt(perms: Permissions, sessionEntries: SessionEntry[], c
       })()
     : "";
-  return `You are a terminal assistant. Output ONLY the exact shell command — no explanation, no markdown, no backticks.
-The user describes what they want in plain English. You translate to the exact shell command.
-RULES:
-- SIMPLICITY FIRST: Use the simplest command that works. Prefer grep | sort | head over 10-pipe chains. Complex pipelines are OK when needed, but NEVER pass file:line output to wc or xargs without cleaning it first.
-- ALWAYS use grep -rn (with -r) when searching directories. NEVER use grep without -r on src/ or any directory.
-- When user refers to items from previous output, use the EXACT names shown (e.g., "feature/auth" not "auth", "open-skills" not "open_skills")
-- When user says "the largest/smallest/first/second", look at the previous output to identify the correct item
-- When user says "them all" or "combine them", refer to items from the most recent command output
-- For "show who changed each line" use git blame, for "show remote urls" use git remote -v
-- For text search in code, use grep -rn, NOT nm or objdump (those are for compiled binaries)
-- On macOS: for memory use vm_stat or top -l 1, for disk use df -h, for processes use ps aux
-- macOS uses BSD tools, NOT GNU. Use: du -d 1 (not --max-depth), ls (not ls --color), sort -r (not sort --reverse), ps aux (not ps --sort)
-- NEVER use grep -P (PCRE). macOS grep has NO -P flag. Use grep -E for extended regex, or sed/awk for complex extraction.
-- NEVER invent commands that don't exist. Stick to standard Unix/macOS commands.
-- NEVER install packages (npx, npm install, pip install, brew install). This is a READ-ONLY terminal.
-- NEVER modify source code (sed -i, codemod, awk with redirect). Only observe, never change.
-- Search src/ directory, NOT dist/ or node_modules/ for code queries.
-- Use exact file paths from the project context below. Do NOT guess paths.
-- For "what would break if I deleted X": use grep -rn "from.*X\\|import.*X\\|require.*X" src/ to find all importers.
-- For "find where X is defined": use grep -rn "export.*function X\\|export.*class X\\|export.*const X" src/
-- For "show me the code of function X": if you know the file, use grep -A 30 "function X" src/file.ts. If not, use grep -rn -A 30 "function X" src/ --include="*.ts"
-- ALWAYS use grep -rn (recursive) when searching directories. NEVER use grep without -r on a directory — it will fail.
-- For conceptual questions about what code does: use cat on the relevant file, the AI summary will explain it.
-- For DESTRUCTIVE requests (delete, remove, install, push): output BLOCKED: <reason>. NEVER try to execute destructive commands.
-AST-POWERED QUERIES: For code STRUCTURE questions, use the built-in AST tool instead of grep:
-- "find all exported functions" → terminal symbols src/ (lists all functions, classes, interfaces with line numbers)
-- "show all interfaces" → terminal symbols src/ | grep interface
-- "what does file X export" → terminal symbols src/file.ts
-- "show me the class hierarchy" → terminal symbols src/
-The "terminal symbols" command uses AST parsing (not regex) — it understands TypeScript, Python, Go, Rust code structure.
-For TEXT search (TODO, string matches, imports) → use grep as normal.
-COMPOUND QUESTIONS: For questions asking multiple things, prefer ONE command that captures all info. Extract multiple answers from a single output.
-- "how many tests and do they pass" → bun test (extract count AND pass/fail from output)
-- "what files changed and how many lines" → git log --stat -3 (shows files AND line counts)
-- "what version of node and bun" → node -v && bun -v (only use && for trivial non-failing commands)
-NEVER split into separate test runs or expensive commands chained with &&.
-BLOCKED ALTERNATIVES: If your preferred command would require installing packages (npx, npm install), ALWAYS try a READ-ONLY alternative:
-- Code quality analysis → grep -rn "TODO\\|FIXME\\|HACK\\|XXX" src/
-- Linting → check if "lint" or "typecheck" exists in package.json scripts, run that
-- Security scan → grep -rn "eval\\|exec\\|spawn\\|password\\|secret" src/
-- Dependency audit → cat package.json | grep -A 50 dependencies
-- Test coverage → bun test --coverage (or npm run test:coverage if available)
-NEVER give up. NEVER output BLOCKED for analysis questions. Always try a grep/find/cat/wc/awk read-only alternative.
-- Cyclomatic complexity → grep -rn "if\\|else\\|for\\|while\\|switch\\|case\\|catch\\|&&\\|||" src/ --include="*.ts" | wc -l
-- Unused exports → grep -rn "export function\|export const\|export class" src/ --include="*.ts" | sed 's/.*export [a-z]* //' | sed 's/[(<:].*//' | sort -u
-- Dead code → for each exported name, grep -rn "name" src/ --include="*.ts" | wc -l (if only 1 match = unused)
-- Dependency graph → grep -rn "from " src/ --include="*.ts" | sed 's/:.*from "/→/' | sed 's/".*//' | sort -u
-- Most parameters → grep -rn "function " src/ --include="*.ts" | awk -F'[()]' '{print gsub(/,/,",",$2)+1, $0}' | sort -nr | head -10
-ALWAYS try a heuristic shell approach before giving up. NEVER say BLOCKED for analysis questions.
-SEMANTIC MAPPING: When the user references a concept, search the file tree for RELATED terms:
-- Look at directory names: src/agent/ likely contains "agentic" code
-- Look at file names: lazy-executor.ts likely handles "lazy mode"
-- When uncertain: grep -rn "keyword" src/ --include="*.ts" -l (list matching files)
-ACTION vs CONCEPTUAL: If the prompt starts with "run", "execute", "check", "test", "build", "show output of" — ALWAYS generate an executable command. NEVER read README for action requests. Only read docs for "explain why", "what does X mean", "how was X designed".
-EXISTENCE CHECKS: If the prompt starts with "is there", "does this have", "do we have", "does X exist" — NEVER run/start/launch anything. Use ls, find, or test -d to CHECK existence. These are READ-ONLY questions.
-MONOREPO: If the project context says "MONOREPO", search packages/ or apps/ NOT src/. Use: grep -rn "pattern" packages/ --include="*.ts". For specific packages, use packages/PKGNAME/src/.
+  // ── Conditional sections (only included when relevant) ──
+  const wantsStructure = /\b(function|class|interface|export|symbol|structure|hierarchy|outline)\b/i.test(nl);
+  const astBlock = wantsStructure ? `\nAST-POWERED QUERIES: For code STRUCTURE questions, use "terminal symbols" instead of grep. It uses AST parsing for TypeScript, Python, Go, Rust.` : "";
+  const wantsMultiple = /\b(and|both|also|plus|as well)\b/i.test(nl);
+  const compoundBlock = wantsMultiple ? `\nCOMPOUND QUESTIONS: Prefer ONE command that captures all info. NEVER split into separate expensive commands.` : "";
+  const wantsAnalysis = /\b(quality|lint|coverage|complexity|unused|dead code|security|audit|scan|dependency)\b/i.test(nl);
+  const blockedAltBlock = wantsAnalysis ? `\nBLOCKED ALTERNATIVES: If your preferred command needs installing packages, try READ-ONLY alternatives (grep, cat, wc, awk). NEVER give up on analysis questions.` : "";
+  return `Translate to bash. One command. Simplest form. No explanation.
+list files in current directory → ls
+list all files including hidden → ls -a
+show open files → lsof
+create copy of a.txt as b.txt → cp a.txt b.txt
+create file test.txt → touch test.txt
+make directory testdir → mkdir testdir
+display routing table → route
+show last logged in users → last
+show file stats → stat file
+print directory tree 2 levels → tree -L 2
+count word occurrences in file → grep -c "word" file
+print number of files in dir → ls -1 | wc -l
+print first line of file → head -1 file
+print last line of file → tail -1 file
+print lines 3 to 5 of file → sed -n '3,5p' file
+print every other line → awk 'NR%2==1' file
+count words in file → wc -w file
+find empty files not in subdirs → find . -maxdepth 1 -type f -empty
+show system load → w
+system utilization stats → vmstat
+DNS servers → cat /etc/resolv.conf | grep nameserver
+long integer size → getconf LONG_BIT
+base64 decode string → echo 'str' | base64 -d
+change owner to nobody → chown nobody file
+unique lines in file → uniq file
+max cpu time → ulimit -t
+memory info → lsmem
+process priority → nice
+bash profile → cat ~/.bashrc
+search recursively → grep -rn "pattern" src/
+${astBlock}${compoundBlock}${blockedAltBlock}
 cwd: ${process.cwd()}
-shell: zsh / macOS${projectContext}${safetyBlock}${restrictionBlock}${contextBlock}${currentPrompt ? loadCorrectionHints(currentPrompt) : ""}`;
+shell: zsh / macOS${projectContext}${safetyBlock}${restrictionBlock}${contextBlock}${currentPrompt ? loadCorrectionHints(currentPrompt) : ""}
+Q:`;
 }
 // ── streaming translate ───────────────────────────────────────────────────────
@@ -280,11 +271,11 @@ export async function translateToCommand(
   let text: string;
   if (onToken) {
-    text = await provider.stream(nl, { model, maxTokens: 256, system }, {
+    text = await provider.stream(nl, { model, maxTokens: 256, temperature: 0, stop: ["\n"], system }, {
       onToken: (partial) => onToken(partial),
     });
   } else {
-    text = await provider.complete(nl, { model, maxTokens: 256, system });
+    text = await provider.complete(nl, { model, maxTokens: 256, temperature: 0, stop: ["\n"], system });
   }
   if (text.startsWith("BLOCKED:")) throw new Error(text);
@@ -334,6 +325,7 @@ export async function explainCommand(command: string): Promise<string> {
   return provider.complete(command, {
     model: routing.fast,
     maxTokens: 128,
+    temperature: 0,
     system: "Explain what this shell command does in one plain English sentence. No markdown, no code blocks.",
   });
 }
@@ -345,37 +337,34 @@ export async function fixCommand(
   failedCommand: string,
   errorOutput: string,
   perms: Permissions,
-  sessionEntries: SessionEntry[]
+  _sessionEntries: SessionEntry[]
 ): Promise<string> {
   const provider = getProvider();
   const routing = pickModel(originalNl);
+  // Lightweight fix prompt — no full project context, just rules + restrictions
+  const restrictions: string[] = [];
+  if (!perms.destructive) restrictions.push("- NEVER delete/remove/overwrite files");
+  if (!perms.network) restrictions.push("- NEVER make network requests");
+  if (!perms.install) restrictions.push("- NEVER install packages");
+  const fixSystem = `You are a terminal assistant. Output ONLY the corrected shell command — no explanation.
+macOS/BSD tools. NEVER use grep -P. Use grep -E for extended regex.
+NEVER install packages. READ-ONLY terminal.
+cwd: ${process.cwd()}${restrictions.length > 0 ? `\nRESTRICTIONS:\n${restrictions.join("\n")}` : ""}`;
   const text = await provider.complete(
-    `I wanted to: ${originalNl}\nI ran: ${failedCommand}\nError:\n${errorOutput}\n\nGive me the corrected command only.`,
+    `I wanted to: ${originalNl}\nI ran: ${failedCommand}\nError:\n${errorOutput.slice(0, 2000)}\n\nGive me the corrected command only.`,
     {
-      model: routing.smart, // always use smart model for fixes
+      model: routing.smart,
       maxTokens: 256,
-      system: buildSystemPrompt(perms, sessionEntries, originalNl),
+      temperature: 0,
+      stop: ["\n"],
+      system: fixSystem,
     }
   );
   if (text.startsWith("BLOCKED:")) throw new Error(text);
-  return text;
+  return text.trim();
 }
-// ── summarize output (for MCP/agent use) ──────────────────────────────────────
-export async function summarizeOutput(
-  command: string,
-  output: string,
-  maxTokens: number = 200
-): Promise<string> {
-  const provider = getProvider();
-  const routing = pickModel("summarize");
-  return provider.complete(
-    `Command: ${command}\nOutput:\n${output}\n\nSummarize this output concisely for an AI agent. Focus on: status, key results, errors. Be terse.`,
-    {
-      model: routing.fast,
-      maxTokens,
-      system: "You summarize command output for AI agents. Be extremely concise. Return structured info. No prose.",
-    }
-  );
-}
+// summarizeOutput() removed — all output processing goes through processOutput() in output-processor.ts

package/src/cache.ts CHANGED

@@ -20,12 +20,13 @@ function persistCache() {
   try { writeFileSync(CACHE_FILE, JSON.stringify(mem)); } catch {}
 }
-/** Normalize a natural language query for cache lookup */
+/** Normalize a natural language query for cache lookup.
+ *  Keeps . / - _ which are meaningful in file paths and shell context. */
 export function normalizeNl(nl: string): string {
   return nl
     .toLowerCase()
     .trim()
-    .replace(/[^a-z0-9\s]/g, "")   // strip punctuation
+    .replace(/[^a-z0-9\s.\/_-]/g, "")   // keep meaningful shell chars
     .replace(/\s+/g, " ");
 }

package/src/cli.tsx CHANGED

@@ -446,7 +446,7 @@ else if (args.length > 0) {
   const { rewriteCommand } = await import("./command-rewriter.js");
   const { shouldBeLazy, toLazy } = await import("./lazy-executor.js");
   const { saveOutput, formatOutputHint } = await import("./output-store.js");
-  const { parseOutput, estimateTokens } = await import("./parsers/index.js");
+  const { estimateTokens } = await import("./tokens.js");
   const { recordSaving, recordUsage } = await import("./economy.js");
   const { isTestOutput, trackTests, formatWatchResult } = await import("./test-watchlist.js");
   const { detectLoop } = await import("./loop-detector.js");

package/src/compression.ts CHANGED

@@ -1,19 +1,18 @@
 // Token compression engine — reduces CLI output to fit within token budgets
+// No regex parsing — just ANSI stripping, deduplication, and smart truncation.
+// All intelligent output processing goes through AI via processOutput().
-import { parseOutput, estimateTokens, tokenSavings } from "./parsers/index.js";
+import { estimateTokens } from "./tokens.js";
 export interface CompressOptions {
   /** Max tokens for the output (default: unlimited) */
   maxTokens?: number;
-  /** Output format */
-  format?: "text" | "json" | "summary";
   /** Strip ANSI escape codes (default: true) */
   stripAnsi?: boolean;
 }
 export interface CompressedOutput {
   content: string;
-  format: "text" | "json" | "summary";
   originalTokens: number;
   compressedTokens: number;
   tokensSaved: number;
@@ -36,7 +35,6 @@ function deduplicateLines(lines: string[]): string[] {
   for (let i = 0; i < lines.length; i++) {
     const line = lines[i];
-    // Extract a "pattern" — the line without numbers, paths, specific identifiers
     const pattern = line.replace(/[0-9]+/g, "N").replace(/\/\S+/g, "/PATH").replace(/\s+/g, " ").trim();
     if (pattern === repeatPattern) {
@@ -45,7 +43,6 @@ function deduplicateLines(lines: string[]): string[] {
       if (repeatCount > 2) {
         result.push(`  ... (${repeatCount} similar lines)`);
       } else if (repeatCount > 0) {
-        // Push the skipped lines back
         for (let j = i - repeatCount; j < i; j++) {
           result.push(lines[j]);
         }
@@ -67,14 +64,13 @@ function deduplicateLines(lines: string[]): string[] {
   return result;
 }
-/** Smart truncation: keep first N + last M lines */
+/** Smart truncation: keep first 60% + last 40% of lines */
 function smartTruncate(text: string, maxTokens: number): string {
   const lines = text.split("\n");
   const currentTokens = estimateTokens(text);
   if (currentTokens <= maxTokens) return text;
-  // Keep proportional first/last, with first getting more
   const targetLines = Math.floor((maxTokens * lines.length) / currentTokens);
   const firstCount = Math.ceil(targetLines * 0.6);
   const lastCount = Math.floor(targetLines * 0.4);
@@ -88,42 +84,20 @@ function smartTruncate(text: string, maxTokens: number): string {
   return [...first, `\n--- ${hiddenCount} lines hidden ---\n`, ...last].join("\n");
 }
-/** Compress command output to fit within a token budget */
+/** Compress command output — ANSI strip, dedup, truncate. No parsing. */
 export function compress(command: string, output: string, options: CompressOptions = {}): CompressedOutput {
-  const { maxTokens, format = "text", stripAnsi: doStrip = true } = options;
+  const { maxTokens, stripAnsi: doStrip = true } = options;
   const originalTokens = estimateTokens(output);
   // Step 1: Strip ANSI codes
   let text = doStrip ? stripAnsi(output) : output;
-  // Step 2: Try structured parsing (format=json or when it saves tokens)
-  if (format === "json" || format === "summary") {
-    const parsed = parseOutput(command, text);
-    if (parsed) {
-      const json = JSON.stringify(parsed.data, null, format === "summary" ? 0 : 2);
-      const savings = tokenSavings(output, parsed.data);
-      const compressedTokens = estimateTokens(json);
-      // ONLY use JSON if it actually saves tokens (never return larger output)
-      if (savings.saved > 0 && (!maxTokens || compressedTokens <= maxTokens)) {
-        return {
-          content: json,
-          format: "json",
-          originalTokens,
-          compressedTokens,
-          tokensSaved: savings.saved,
-          savingsPercent: savings.percent,
-        };
-      }
-    }
-  }
-  // Step 3: Deduplicate similar lines
+  // Step 2: Deduplicate similar lines
   const lines = text.split("\n");
   const deduped = deduplicateLines(lines);
   text = deduped.join("\n");
-  // Step 4: Smart truncation if over budget
+  // Step 3: Smart truncation if over budget
   if (maxTokens) {
     text = smartTruncate(text, maxTokens);
   }
@@ -131,7 +105,6 @@ export function compress(command: string, output: string, options: CompressOptio
   const compressedTokens = estimateTokens(text);
   return {
     content: text,
-    format: "text",
     originalTokens,
     compressedTokens,
     tokensSaved: Math.max(0, originalTokens - compressedTokens),