npm - agent-sh - Versions diffs - 0.14.1 → 0.14.2 - Mend

agent-sh 0.14.1 → 0.14.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (55) hide show

package/dist/agent/agent-loop.d.ts +1 -1
package/dist/agent/agent-loop.js +42 -31
package/dist/agent/conversation-state.d.ts +3 -2
package/dist/agent/conversation-state.js +20 -3
package/dist/agent/events.d.ts +2 -0
package/dist/agent/host-types.d.ts +3 -0
package/dist/agent/index.js +2 -1
package/dist/agent/subagent.d.ts +1 -1
package/dist/agent/subagent.js +5 -1
package/dist/agent/tool-protocol.d.ts +2 -2
package/dist/agent/tool-protocol.js +5 -4
package/dist/agent/tools/glob.d.ts +1 -1
package/dist/agent/tools/glob.js +4 -2
package/dist/agent/tools/grep.d.ts +1 -1
package/dist/agent/tools/grep.js +4 -2
package/dist/agent/tools/ls.d.ts +1 -1
package/dist/agent/tools/ls.js +4 -2
package/dist/agent/tools/read-file.d.ts +1 -1
package/dist/agent/tools/read-file.js +30 -2
package/dist/agent/types.d.ts +11 -1
package/dist/agent/types.js +6 -1
package/dist/cli/index.js +0 -0
package/dist/core/index.d.ts +1 -1
package/dist/core/settings.d.ts +3 -0
package/dist/core/settings.js +2 -2
package/dist/shell/index.d.ts +6 -0
package/dist/shell/index.js +10 -10
package/dist/shell/shell.d.ts +4 -0
package/dist/shell/shell.js +15 -29
package/dist/shell/terminal.d.ts +33 -0
package/dist/shell/terminal.js +62 -0
package/examples/extensions/ash-scheme/index.ts +2170 -0
package/examples/extensions/ash-scheme/package.json +11 -0
package/examples/extensions/ash-scheme-render.ts +58 -0
package/examples/extensions/ashi/README.md +36 -26
package/examples/extensions/ashi/package.json +9 -1
package/examples/extensions/ashi/src/capture.ts +1 -0
package/examples/extensions/ashi/src/cli.ts +21 -7
package/examples/extensions/ashi/src/compaction.ts +25 -96
package/examples/extensions/ashi/src/components.ts +64 -166
package/examples/extensions/ashi/src/default-schema-renderers.ts +229 -0
package/examples/extensions/ashi/src/display-config.ts +21 -22
package/examples/extensions/ashi/src/frontend.ts +64 -65
package/examples/extensions/ashi/src/hooks.ts +47 -63
package/examples/extensions/ashi/src/multi-session-store.ts +44 -3
package/examples/extensions/ashi/src/schema.ts +407 -0
package/examples/extensions/ashi/src/session-store.ts +55 -4
package/examples/extensions/ashi/src/status-footer.ts +27 -6
package/examples/extensions/ashi-compact-llm.ts +93 -0
package/examples/extensions/claude-code-bridge/index.ts +2 -0
package/examples/extensions/opencode-bridge/index.ts +3 -0
package/examples/extensions/opencode-provider.ts +252 -0
package/examples/extensions/pi-bridge/index.ts +1 -0
package/package.json +12 -1
package/examples/extensions/ashi/src/default-renderers.ts +0 -171

package/dist/agent/agent-loop.d.ts CHANGED Viewed

@@ -15,7 +15,7 @@ import type { EventBus } from "../core/event-bus.js";
 import type { AgentMode } from "./host-types.js";
 import type { LlmClient } from "./llm-client.js";
 import type { HandlerFunctions } from "../utils/handler-registry.js";
-import type { AgentBackend, ToolDefinition } from "./types.js";
+import { type AgentBackend, type ToolDefinition } from "./types.js";
 import { type HistoryAdapter } from "./history-file.js";
 import type { Compositor } from "../utils/compositor.js";
 export interface AgentLoopConfig {

package/dist/agent/agent-loop.js CHANGED Viewed

@@ -1,5 +1,6 @@
 import { setMaxListeners } from "node:events";
 import * as path from "node:path";
+import { contentText } from "./types.js";
 import { ToolRegistry } from "./tool-registry.js";
 import { normalizeToolArgs } from "./normalize-args.js";
 import { ConversationState } from "./conversation-state.js";
@@ -244,9 +245,9 @@ export class AgentLoop {
             this.conversation = new ConversationState(this.handlers, this.instanceId);
             this.lastProjectSkillNames.clear();
         });
-        on("agent:compact-request", () => {
+        on("agent:compact-request", async () => {
             // Force compaction. Strategy lives behind `conversation:compact`.
-            const stats = this.compactWithHooks(0, 0, true);
+            const stats = await this.compactWithHooks(0, 0, true);
             if (stats) {
                 this.bus.emit("ui:info", {
                     message: `(compacted: ~${stats.before.toLocaleString()} → ~${stats.after.toLocaleString()} tokens)`,
@@ -454,13 +455,13 @@ export class AgentLoop {
      * compaction, emit `conversation:after-compact` so listeners
      * (metrics, UI, agent-awareness notes) can react.
      */
-    compactWithHooks(target, keepRecent, force, strategy) {
-        const stats = this.handlers.call("conversation:compact", {
+    async compactWithHooks(target, keepRecent, force, strategy) {
+        const stats = (await this.handlers.call("conversation:compact", {
             target,
             keepRecent,
             force: !!force,
             strategy,
-        });
+        }));
         if (stats) {
             this.bus.emit("conversation:after-compact", {
                 beforeTokens: stats.before,
@@ -597,7 +598,7 @@ export class AgentLoop {
             },
             formatResult: (args, result) => {
                 const action = args.action;
-                const text = result.content;
+                const text = contentText(result.content);
                 if (result.isError)
                     return { summary: "error" };
                 if (action === "search") {
@@ -658,6 +659,13 @@ export class AgentLoop {
             if (extensionSections.length > 0) {
                 parts.push("# Extension Instructions\n\n" + extensionSections.join("\n\n"));
             }
+            if (this.currentMode.modalities?.includes("image")) {
+                parts.push("# Image Support\n\n"
+                    + "This model supports image input. When you need visual information, "
+                    + "you can read image files (PNG, JPEG, GIF, WebP) with read_file — "
+                    + "they will be shown to you directly. Use this to inspect screenshots, "
+                    + "diagrams, UI mockups, charts, or any visual content relevant to the task.");
+            }
             return parts.join("\n\n");
         });
         // ── Orthogonal core-state accessors ──────────────────────────
@@ -838,6 +846,7 @@ export class AgentLoop {
             const label = tool.displayName ?? name;
             this.bus.emit("agent:tool-started", {
                 title: typeof args.description === "string" ? `${label}: ${args.description}` : label,
+                name,
                 toolCallId: id,
                 kind: display.kind, icon: display.icon, locations: display.locations, rawInput: args,
                 displayDetail: tool.formatCall?.(args),
@@ -878,7 +887,7 @@ export class AgentLoop {
                 resultDisplay,
             });
             this.bus.emit("agent:tool-output", {
-                tool: name, output: result.content, exitCode: result.exitCode,
+                tool: name, output: contentText(result.content), exitCode: result.exitCode,
             });
             return result;
         });
@@ -959,7 +968,7 @@ export class AgentLoop {
                 // Compact deeply — shallow targets buy only 1–2 turns of runway on
                 // tool-heavy workloads.
                 const target = Math.floor(threshold * 0.25);
-                const result = this.compactWithHooks(target, 1);
+                const result = await this.compactWithHooks(target, 1);
                 if (!result) {
                     // Auto-compact fired but nothing was evictable. This can happen
                     // in short conversations with heavy tool output where the pin
@@ -1081,6 +1090,7 @@ export class AgentLoop {
                         const display = tool.getDisplayInfo?.(args) ?? { kind: "execute" };
                         this.bus.emit("agent:tool-started", {
                             title: tool.displayName ?? tc.name,
+                            name: tc.name,
                             toolCallId: tc.id,
                             kind: display.kind, icon: display.icon, locations: display.locations, rawInput: args,
                             displayDetail: tool.formatCall?.(args),
@@ -1097,7 +1107,7 @@ export class AgentLoop {
                             resultDisplay,
                         });
                         this.bus.emit("agent:tool-output", {
-                            tool: tc.name, output: cached.content, exitCode: 0,
+                            tool: tc.name, output: contentText(cached.content), exitCode: 0,
                         });
                         collectedResults.push({
                             callId: tc.id, toolName: tc.name,
@@ -1114,29 +1124,30 @@ export class AgentLoop {
                 const result = await this.handlers.call("tool:execute", { name: tc.name, id: tc.id, args, tool, onChunk: defaultOnChunk,
                     batchIndex, batchTotal: batchTotal > 1 ? batchTotal : undefined,
                     signal });
-                // Truncate large outputs to avoid blowing context.
                 let content = result.content;
-                const maxBytes = tool.maxResultBytes ?? 100_000; // ~25k tokens
-                if (content.length > maxBytes) {
-                    const headBytes = Math.floor(maxBytes * 0.6);
-                    const tailBytes = maxBytes - headBytes;
-                    const lines = content.split("\n");
-                    let headEnd = 0, headLen = 0;
-                    for (let i = 0; i < lines.length && headLen + lines[i].length + 1 <= headBytes; i++) {
-                        headLen += lines[i].length + 1;
-                        headEnd = i + 1;
-                    }
-                    let tailStart = lines.length, tailLen = 0;
-                    for (let i = lines.length - 1; i >= headEnd && tailLen + lines[i].length + 1 <= tailBytes; i--) {
-                        tailLen += lines[i].length + 1;
-                        tailStart = i;
+                if (typeof content === "string") {
+                    const maxBytes = tool.maxResultBytes ?? 100_000; // ~25k tokens
+                    if (content.length > maxBytes) {
+                        const headBytes = Math.floor(maxBytes * 0.6);
+                        const tailBytes = maxBytes - headBytes;
+                        const lines = content.split("\n");
+                        let headEnd = 0, headLen = 0;
+                        for (let i = 0; i < lines.length && headLen + lines[i].length + 1 <= headBytes; i++) {
+                            headLen += lines[i].length + 1;
+                            headEnd = i + 1;
+                        }
+                        let tailStart = lines.length, tailLen = 0;
+                        for (let i = lines.length - 1; i >= headEnd && tailLen + lines[i].length + 1 <= tailBytes; i--) {
+                            tailLen += lines[i].length + 1;
+                            tailStart = i;
+                        }
+                        const omitted = tailStart - headEnd;
+                        content = [
+                            ...lines.slice(0, headEnd),
+                            `\n[… ${omitted} lines omitted (output truncated to ${Math.round(maxBytes / 1024)}KB) …]\n`,
+                            ...lines.slice(tailStart),
+                        ].join("\n");
                     }
-                    const omitted = tailStart - headEnd;
-                    content = [
-                        ...lines.slice(0, headEnd),
-                        `\n[… ${omitted} lines omitted (output truncated to ${Math.round(maxBytes / 1024)}KB) …]\n`,
-                        ...lines.slice(tailStart),
-                    ].join("\n");
                 }
                 const finalResult = {
                     callId: tc.id, toolName: tc.name,
@@ -1347,7 +1358,7 @@ export class AgentLoop {
                 if (this.isContextOverflow(e)) {
                     const contextWindow = this.currentMode.contextWindow ?? DEFAULT_CONTEXT_WINDOW;
                     const target = Math.floor((contextWindow - RESPONSE_RESERVE) * 0.6);
-                    const stats = this.compactWithHooks(target, 1);
+                    const stats = await this.compactWithHooks(target, 1);
                     // If compaction freed nothing, retrying will hit the same error.
                     // Surface the real failure instead of looping until exhaustion.
                     if (!stats || stats.after >= stats.before) {

package/dist/agent/conversation-state.d.ts CHANGED Viewed

@@ -1,4 +1,5 @@
 import type { ChatCompletionMessageParam } from "./llm-client.js";
+import type { ImageContent } from "./types.js";
 import { type NuclearEntry } from "./nuclear-form.js";
 import type { HandlerFunctions } from "../utils/handler-registry.js";
 /** Search hit shape returned by the `history:search` handler. */
@@ -51,7 +52,7 @@ export declare class ConversationState {
             arguments: string;
         };
     }[], extras?: Record<string, unknown>): void;
-    addToolResult(toolCallId: string, content: string, isError?: boolean): void;
+    addToolResult(toolCallId: string, content: string | ImageContent[], isError?: boolean): void;
     /** Add tool results as a user message (for inline tool protocol). */
     addToolResultInline(content: string): void;
     /** Safe from any context: queues if mid-tool-pair, appends otherwise. */
@@ -91,7 +92,7 @@ export declare class ConversationState {
     eagerNucleateTools(results: Array<{
         toolName: string;
         args: Record<string, unknown>;
-        content: string;
+        content: string | ImageContent[];
         isError: boolean;
     }>): void;
     /** Track an entry in memory (nuclear list + recall archive). */

package/dist/agent/conversation-state.js CHANGED Viewed

@@ -123,7 +123,23 @@ export class ConversationState {
         this.invalidateMessagesCache();
     }
     addToolResult(toolCallId, content, isError = false) {
-        this.messages.push({ role: "tool", tool_call_id: toolCallId, content });
+        if (typeof content === "string") {
+            this.messages.push({ role: "tool", tool_call_id: toolCallId, content });
+        }
+        else {
+            // Assembles OpenAI vision content parts for multimodal tool results.
+            // This format (array of text + image_url blocks on a tool message) is
+            // supported by OpenAI and most OpenAI-compatible providers. Providers
+            // that don't support it should not declare image modalities, so this
+            // path is only reached for providers known to handle it.
+            const parts = [];
+            for (const img of content) {
+                parts.push({ type: "image_url", image_url: { url: `data:${img.mimeType};base64,${img.data}` } });
+            }
+            const label = isError ? `Error: [${content.length} image(s)]` : `[${content.length} image(s)]`;
+            parts.unshift({ type: "text", text: label });
+            this.messages.push({ role: "tool", tool_call_id: toolCallId, content: parts });
+        }
         if (isError)
             this.toolErrors.add(toolCallId);
         this.invalidateMessagesCache();
@@ -311,11 +327,12 @@ export class ConversationState {
         const entries = [];
         for (const r of results) {
             const seq = this.nextSeq++;
-            const entry = this.handlers.call("conversation:nucleate-tool", r.toolName, r.args, r.content, r.isError, this.instanceId, seq);
+            const text = typeof r.content === "string" ? r.content : `[${r.content.length} image(s)]`;
+            const entry = this.handlers.call("conversation:nucleate-tool", r.toolName, r.args, text, r.isError, this.instanceId, seq);
             entries.push(entry);
             this.recordNuclearEntry(entry, [
                 { role: "assistant", content: null, tool_calls: [{ id: `seq_${seq}`, type: "function", function: { name: r.toolName, arguments: JSON.stringify(r.args) } }] },
-                { role: "tool", tool_call_id: `seq_${seq}`, content: r.content },
+                { role: "tool", tool_call_id: `seq_${seq}`, content: text },
             ]);
         }
         this.appendToHistory(entries);

package/dist/agent/events.d.ts CHANGED Viewed

@@ -99,6 +99,8 @@ declare module "../core/event-bus.js" {
         };
         "agent:tool-started": {
             title: string;
+            /** Canonical tool name; `title` is the display label and may differ. */
+            name?: string;
             toolCallId?: string;
             kind?: string;
             icon?: string;

package/dist/agent/host-types.d.ts CHANGED Viewed

@@ -51,6 +51,7 @@ export interface ProviderRegistration {
         contextWindow?: number;
         maxTokens?: number;
         echoReasoning?: boolean;
+        modalities?: ("text" | "image")[];
     })[];
     supportsReasoningEffort?: boolean;
     /** Local daemons etc. — `auth list/login` shows "no auth required". */
@@ -77,6 +78,8 @@ export interface AgentMode {
     /** Echo reasoning_content back on assistant turns. Required by DeepSeek;
      *  default off (leaky shims may forward it to the model as OOD input). */
     echoReasoning?: boolean;
+    /** Input modalities the model supports. Defaults to ["text"]. */
+    modalities?: ("text" | "image")[];
     buildReasoningParams?: (level: string) => Record<string, unknown>;
 }
 /**

package/dist/agent/index.js CHANGED Viewed

@@ -61,7 +61,7 @@ function splitRegistration(p) {
         }
         else {
             ids.push(m.id);
-            caps.set(m.id, { reasoning: m.reasoning, contextWindow: m.contextWindow, maxTokens: m.maxTokens, echoReasoning: m.echoReasoning });
+            caps.set(m.id, { reasoning: m.reasoning, contextWindow: m.contextWindow, maxTokens: m.maxTokens, echoReasoning: m.echoReasoning, modalities: m.modalities });
         }
     }
     return { ids, caps };
@@ -287,6 +287,7 @@ export default function agentBackend(ctx) {
                     reasoning: mc?.reasoning,
                     supportsReasoningEffort: p.supportsReasoningEffort,
                     echoReasoning: mc?.echoReasoning,
+                    modalities: mc?.modalities,
                     buildReasoningParams: bindReasoning(shapeId, model),
                 });
             }

package/dist/agent/subagent.d.ts CHANGED Viewed

@@ -11,7 +11,7 @@
  */
 import type { EventBus } from "../core/event-bus.js";
 import type { LlmClient } from "./llm-client.js";
-import type { ToolDefinition } from "./types.js";
+import { type ToolDefinition } from "./types.js";
 export interface SubagentOptions {
     /** LLM client to use. */
     llmClient: LlmClient;

package/dist/agent/subagent.js CHANGED Viewed

@@ -1,3 +1,4 @@
+import { contentText } from "./types.js";
 import { ConversationState } from "./conversation-state.js";
 import { normalizeToolArgs } from "./normalize-args.js";
 import { wrapTrailingWithDynamicContext } from "../utils/message-utils.js";
@@ -63,6 +64,7 @@ export async function runSubagent(opts) {
                 const display = tool.getDisplayInfo?.(args) ?? { kind: "execute" };
                 bus.emit("agent:tool-started", {
                     title: tc.name,
+                    name: tc.name,
                     toolCallId: tc.id,
                     kind: display.kind,
                     locations: display.locations,
@@ -84,7 +86,9 @@ export async function runSubagent(opts) {
                     resultDisplay,
                 });
             }
-            const content = result.isError ? `Error: ${result.content}` : result.content;
+            const content = result.isError
+                ? `Error: ${contentText(result.content)}`
+                : result.content;
             conversation.addToolResult(tc.id, content, !!result.isError);
         }
     }

package/dist/agent/tool-protocol.d.ts CHANGED Viewed

@@ -10,7 +10,7 @@
  * doesn't need to know which mode is active.
  */
 import type { ChatCompletionTool } from "./llm-client.js";
-import type { ToolDefinition } from "./types.js";
+import { type ToolDefinition } from "./types.js";
 import type { ConversationState } from "./conversation-state.js";
 export interface PendingToolCall {
     id: string;
@@ -20,7 +20,7 @@ export interface PendingToolCall {
 export interface ToolResult {
     callId: string;
     toolName: string;
-    content: string;
+    content: string | import("./types.js").ImageContent[];
     isError: boolean;
 }
 /** Streaming filter — strips tool calls from display output. */

package/dist/agent/tool-protocol.js CHANGED Viewed

@@ -1,3 +1,4 @@
+import { contentText } from "./types.js";
 // ── API mode (current behavior) ──────────────────────────────────
 export class ApiToolProtocol {
     mode = "api";
@@ -33,7 +34,7 @@ export class ApiToolProtocol {
     }
     recordResults(conv, results) {
         for (const r of results) {
-            const content = r.isError ? `Error: ${r.content}` : r.content;
+            const content = r.isError ? `Error: ${contentText(r.content)}` : r.content;
             conv.addToolResult(r.callId, content, r.isError);
         }
     }
@@ -105,7 +106,7 @@ export class InlineToolProtocol {
             return;
         const parts = results.map((r) => {
             const status = r.isError ? "error" : "ok";
-            return `[${r.toolName} ${r.callId} ${status}]\n${r.content}`;
+            return `[${r.toolName} ${r.callId} ${status}]\n${contentText(r.content)}`;
         });
         conv.addToolResultInline(parts.join("\n\n"));
     }
@@ -362,7 +363,7 @@ export class DeferredToolProtocol {
     }
     recordResults(conv, results) {
         for (const r of results) {
-            const content = r.isError ? `Error: ${r.content}` : r.content;
+            const content = r.isError ? `Error: ${contentText(r.content)}` : r.content;
             conv.addToolResult(r.callId, content, r.isError);
         }
     }
@@ -455,7 +456,7 @@ export class DeferredLookupProtocol {
     }
     recordResults(conv, results) {
         for (const r of results) {
-            const content = r.isError ? `Error: ${r.content}` : r.content;
+            const content = r.isError ? `Error: ${contentText(r.content)}` : r.content;
             conv.addToolResult(r.callId, content, r.isError);
         }
     }

package/dist/agent/tools/glob.d.ts CHANGED Viewed

@@ -1,2 +1,2 @@
-import type { ToolDefinition } from "../types.js";
+import { type ToolDefinition } from "../types.js";
 export declare function createGlobTool(getCwd: () => string): ToolDefinition;

package/dist/agent/tools/glob.js CHANGED Viewed

@@ -2,6 +2,7 @@ import * as fs from "node:fs/promises";
 import * as path from "node:path";
 import { executeArgv } from "../../utils/executor.js";
 import { resolveRgPath } from "../../utils/ripgrep-path.js";
+import { contentText } from "../types.js";
 import { expandHome } from "./expand-home.js";
 export function createGlobTool(getCwd) {
     return {
@@ -27,9 +28,10 @@ export function createGlobTool(getCwd) {
         },
         showOutput: false,
         formatResult: (_args, result) => {
-            if (result.isError || result.content === "No files matched.")
+            const text = contentText(result.content);
+            if (result.isError || text === "No files matched.")
                 return { summary: "0 files" };
-            const lines = result.content.split("\n").filter(l => l && !l.startsWith("["));
+            const lines = text.split("\n").filter(l => l && !l.startsWith("["));
             return { summary: `${lines.length} files` };
         },
         getDisplayInfo: (args) => ({

package/dist/agent/tools/grep.d.ts CHANGED Viewed

@@ -1,2 +1,2 @@
-import type { ToolDefinition } from "../types.js";
+import { type ToolDefinition } from "../types.js";
 export declare function createGrepTool(getCwd: () => string): ToolDefinition;

package/dist/agent/tools/grep.js CHANGED Viewed

@@ -1,5 +1,6 @@
 import { executeArgv } from "../../utils/executor.js";
 import { resolveRgPath } from "../../utils/ripgrep-path.js";
+import { contentText } from "../types.js";
 import { expandHome } from "./expand-home.js";
 export function createGrepTool(getCwd) {
     return {
@@ -58,9 +59,10 @@ export function createGrepTool(getCwd) {
         },
         showOutput: false,
         formatResult: (args, result) => {
-            if (result.isError || result.content === "No matches found.")
+            const text = contentText(result.content);
+            if (result.isError || text === "No matches found.")
                 return { summary: "0 matches" };
-            const lines = result.content.split("\n").filter(Boolean);
+            const lines = text.split("\n").filter(Boolean);
             // Strip pagination info line from count
             const resultLines = lines.filter(l => !l.startsWith("[Showing "));
             const mode = args.output_mode ?? "files_with_matches";

package/dist/agent/tools/ls.d.ts CHANGED Viewed

@@ -1,2 +1,2 @@
-import type { ToolDefinition } from "../types.js";
+import { type ToolDefinition } from "../types.js";
 export declare function createLsTool(getCwd: () => string): ToolDefinition;

package/dist/agent/tools/ls.js CHANGED Viewed

@@ -1,5 +1,6 @@
 import * as fs from "node:fs/promises";
 import * as path from "node:path";
+import { contentText } from "../types.js";
 import { expandHome } from "./expand-home.js";
 function formatSize(bytes) {
     if (bytes < 1024)
@@ -33,9 +34,10 @@ export function createLsTool(getCwd) {
                 : [],
         }),
         formatResult: (_args, result) => {
-            if (result.isError || result.content === "(empty directory)")
+            const text = contentText(result.content);
+            if (result.isError || text === "(empty directory)")
                 return { summary: "0 entries" };
-            const lines = result.content.split("\n").filter(Boolean);
+            const lines = text.split("\n").filter(Boolean);
             return { summary: `${lines.length} entries` };
         },
         async execute(args) {

package/dist/agent/tools/read-file.d.ts CHANGED Viewed

@@ -1,4 +1,4 @@
-import type { ToolDefinition } from "../types.js";
+import { type ToolDefinition } from "../types.js";
 /** Tracks the last-read state of a file for deduplication. */
 export interface FileReadState {
     mtimeMs: number;

package/dist/agent/tools/read-file.js CHANGED Viewed

@@ -1,6 +1,14 @@
 import * as fs from "node:fs/promises";
 import * as path from "node:path";
+import { contentText } from "../types.js";
 import { expandHome } from "./expand-home.js";
+const IMAGE_MIME_TYPES = {
+    ".png": "image/png",
+    ".jpg": "image/jpeg",
+    ".jpeg": "image/jpeg",
+    ".gif": "image/gif",
+    ".webp": "image/webp",
+};
 export function createReadFileTool(getCwd, cache) {
     return {
         name: "read_file",
@@ -32,11 +40,12 @@ export function createReadFileTool(getCwd, cache) {
             locations: [{ path: args.path }],
         }),
         formatResult: (_args, result) => {
+            const text = contentText(result.content);
             if (result.isError)
                 return {};
-            if (result.content.startsWith("File unchanged"))
+            if (text.startsWith("File unchanged"))
                 return { summary: "cached" };
-            const lines = result.content.split("\n").filter(l => !l.startsWith("["));
+            const lines = text.split("\n").filter(l => !l.startsWith("["));
             return { summary: `${lines.length} lines` };
         },
         async execute(args) {
@@ -72,6 +81,25 @@ export function createReadFileTool(getCwd, cache) {
                         isError: true,
                     };
                 }
+                const ext = path.extname(absPath).toLowerCase();
+                const mimeType = IMAGE_MIME_TYPES[ext];
+                if (mimeType) {
+                    const MAX_IMAGE_BYTES = 5 * 1024 * 1024; // 5MB — base64 adds ~33%
+                    if (stat.size > MAX_IMAGE_BYTES) {
+                        return {
+                            content: `Image is ${(stat.size / (1024 * 1024)).toFixed(1)}MB — too large. Images are capped at 5MB.`,
+                            exitCode: 1,
+                            isError: true,
+                        };
+                    }
+                    const buf = await fs.readFile(absPath);
+                    const data = buf.toString("base64");
+                    return {
+                        content: [{ type: "image", data, mimeType }],
+                        exitCode: 0,
+                        isError: false,
+                    };
+                }
                 const content = await fs.readFile(absPath, "utf-8");
                 const lines = content.split("\n");
                 const start = reqOffset - 1; // 1-indexed → 0-indexed

package/dist/agent/types.d.ts CHANGED Viewed

@@ -15,8 +15,18 @@ export interface AgentBackend {
     start?(): Promise<void>;
     kill(): void;
 }
+/** Image content block for multimodal tool results. */
+export interface ImageContent {
+    type: "image";
+    /** Base64-encoded image data (no data: URL prefix). */
+    data: string;
+    /** MIME type (e.g. "image/png", "image/jpeg"). */
+    mimeType: string;
+}
+/** Text representation of a tool result's content: strings pass through unchanged; each image becomes an "[image: <mimeType>]" placeholder line. */
+export declare function contentText(content: string | ImageContent[]): string;
 export interface ToolResult {
-    content: string;
+    content: string | ImageContent[];
     exitCode: number | null;
     isError: boolean;
     /** When set, takes precedence over `tool.formatResult()`. */

package/dist/agent/types.js CHANGED Viewed

@@ -1 +1,6 @@
-export {};
+/** Text representation of a tool result's content: strings pass through unchanged; each image becomes an "[image: <mimeType>]" placeholder line. */
+export function contentText(content) {
+    if (typeof content === "string")
+        return content;
+    return content.map(c => `[image: ${c.mimeType}]`).join("\n");
+}

package/dist/cli/index.js CHANGED Viewed

File without changes

package/dist/core/index.d.ts CHANGED Viewed

@@ -17,7 +17,7 @@ export type { AgentContext, AgentConfig, AgentSurface, AgentConfigSurface, Agent
 export type { ShellContext, ShellConfig, ShellSurface, ShellConfigSurface, ExtensionContext, RemoteSession, RemoteSessionOptions, RenderSurface, InputModeConfig, TerminalSession, BlockTransformOptions, FencedBlockTransformOptions, AppConfig } from "../shell/host-types.js";
 export { palette, setPalette, resetPalette } from "../utils/palette.js";
 export type { ColorPalette } from "../utils/palette.js";
-export type { AgentBackend, ToolDefinition } from "../agent/types.js";
+export type { AgentBackend, ToolDefinition, ImageContent } from "../agent/types.js";
 export { runSubagent, type SubagentOptions } from "../agent/subagent.js";
 export { LlmClient } from "../agent/llm-client.js";
 export { HistoryFile, InMemoryHistory, NoopHistory, type HistoryAdapter } from "../agent/history-file.js";

package/dist/core/settings.d.ts CHANGED Viewed

@@ -13,6 +13,8 @@ export interface ModelCapabilityConfig {
     maxTokens?: number;
     /** Echo reasoning_content back on assistant turns. Required by DeepSeek. */
     echoReasoning?: boolean;
+    /** Content modalities the model supports (e.g. ["text", "image"]). */
+    modalities?: ("text" | "image")[];
 }
 /** Provider profile — a named LLM configuration. */
 export interface ProviderConfig {
@@ -163,6 +165,7 @@ export interface ResolvedProvider {
         contextWindow?: number;
         maxTokens?: number;
         echoReasoning?: boolean;
+        modalities?: ("text" | "image")[];
     }>;
     /** Borrow another registered provider's reasoning request shape by id. */
     reasoningShape?: string;

package/dist/core/settings.js CHANGED Viewed

@@ -150,8 +150,8 @@ export function resolveProvider(name) {
         }
         else {
             modelIds.push(m.id);
-            if (m.reasoning !== undefined || m.contextWindow !== undefined || m.maxTokens !== undefined || m.echoReasoning !== undefined) {
-                caps.set(m.id, { reasoning: m.reasoning, contextWindow: m.contextWindow, maxTokens: m.maxTokens, echoReasoning: m.echoReasoning });
+            if (m.reasoning !== undefined || m.contextWindow !== undefined || m.maxTokens !== undefined || m.echoReasoning !== undefined || m.modalities !== undefined) {
+                caps.set(m.id, { reasoning: m.reasoning, contextWindow: m.contextWindow, maxTokens: m.maxTokens, echoReasoning: m.echoReasoning, modalities: m.modalities });
             }
         }
     }

package/dist/shell/index.d.ts CHANGED Viewed

@@ -5,6 +5,7 @@
  */
 import "./events.js";
 import type { ExtensionContext } from "./host-types.js";
+import { type Terminal } from "./terminal.js";
 export interface ShellActivateOptions {
     cols: number;
     rows: number;
@@ -16,6 +17,11 @@ export interface ShellActivateOptions {
         info: string;
         model?: string;
     };
+    /**
+     * Host-side I/O endpoint. Defaults to processTerminal() so the CLI
+     * works unchanged; headless callers (web hubs, tests) supply their own.
+     */
+    terminal?: Terminal;
 }
 export interface ShellHandle {
     /** Terminate the PTY. */