npm - agent-sh - Versions diffs - 0.14.9 → 0.14.11 - Mend

agent-sh 0.14.9 → 0.14.11

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (68)

package/README.md +47 -20
package/dist/agent/agent-loop.js +20 -15
package/dist/agent/events.d.ts +2 -1
package/dist/agent/index.js +44 -7
package/dist/agent/live-view.d.ts +3 -3
package/dist/agent/live-view.js +15 -7
package/dist/agent/providers/ollama.d.ts +11 -0
package/dist/agent/providers/ollama.js +72 -0
package/dist/agent/providers/opencode.d.ts +10 -0
package/dist/agent/providers/opencode.js +112 -0
package/dist/agent/providers/openrouter.js +9 -0
package/dist/agent/providers/zai-coding-plan.d.ts +5 -0
package/dist/agent/providers/zai-coding-plan.js +26 -0
package/dist/agent/subagent.js +1 -1
package/dist/cli/args.js +2 -2
package/dist/cli/install.js +10 -1
package/dist/shell/events.d.ts +3 -0
package/dist/shell/shell.js +3 -0
package/dist/utils/diff-renderer.d.ts +4 -0
package/dist/utils/diff-renderer.js +15 -20
package/examples/extensions/ads/SKILL.md +170 -0
package/examples/extensions/ads/index.ts +695 -0
package/examples/extensions/ash-scheme/index.ts +339 -605
package/examples/extensions/ash-scheme/package.json +1 -1
package/examples/extensions/ashi/EXTENDING.md +116 -0
package/examples/extensions/ashi/README.md +10 -54
package/examples/extensions/ashi/package.json +6 -2
package/examples/extensions/ashi/src/autocomplete-controller.ts +95 -0
package/examples/extensions/ashi/src/autocomplete.ts +1 -23
package/examples/extensions/ashi/src/capture.ts +9 -3
package/examples/extensions/ashi/src/chat/assistant.ts +87 -0
package/examples/extensions/ashi/src/chat/lines.ts +20 -0
package/examples/extensions/ashi/src/chat/thinking.ts +42 -0
package/examples/extensions/ashi/src/chat/tool-group.ts +84 -0
package/examples/extensions/ashi/src/chat/user-message.ts +20 -0
package/examples/extensions/ashi/src/cli.ts +58 -12
package/examples/extensions/ashi/src/clipboard-image.ts +41 -0
package/examples/extensions/ashi/src/commands.ts +11 -1
package/examples/extensions/ashi/src/display-config.ts +9 -1
package/examples/extensions/ashi/src/frontend.ts +340 -259
package/examples/extensions/ashi/src/hooks.ts +33 -40
package/examples/extensions/ashi/src/renderer.ts +222 -0
package/examples/extensions/ashi/src/renderers/pi-tui/app.ts +122 -0
package/examples/extensions/ashi/src/renderers/pi-tui/index.ts +23 -0
package/examples/extensions/ashi/src/renderers/pi-tui/nodes.ts +133 -0
package/examples/extensions/ashi/src/renderers/pi-tui/schema-mount.ts +193 -0
package/examples/extensions/ashi/src/renderers/pi-tui/theme-adapters.ts +48 -0
package/examples/extensions/ashi/src/renderers/pi-tui/tool-group.ts +21 -0
package/examples/extensions/ashi/src/schema.ts +43 -205
package/examples/extensions/ashi/src/status-footer.ts +15 -23
package/examples/extensions/ashi/src/terminal-mode.ts +9 -0
package/examples/extensions/ashi/src/theme.ts +1 -47
package/examples/extensions/ashi-ink/README.md +59 -0
package/examples/extensions/ashi-ink/package.json +30 -0
package/examples/extensions/ashi-ink/src/index.ts +6 -0
package/examples/extensions/ashi-ink/src/ink-renderer.tsx +865 -0
package/examples/extensions/ashi-ink/src/shims.d.ts +5 -0
package/examples/extensions/ashi-ink/test/render.test.tsx +408 -0
package/examples/extensions/ashi-ink/tsconfig.json +14 -0
package/examples/extensions/ashi-scheme-render.ts +4 -10
package/examples/extensions/ashi-shell-passthrough.ts +95 -0
package/examples/extensions/latex-images.ts +22 -19
package/examples/extensions/terminal-buffer.ts +4 -2
package/package.json +3 -9
package/examples/extensions/ashi/src/components.ts +0 -238
package/examples/extensions/ollama.ts +0 -108
package/examples/extensions/opencode-provider.ts +0 -251
package/examples/extensions/zai-coding-plan.ts +0 -35

package/README.md CHANGED Viewed

@@ -1,15 +1,19 @@
 # agent-sh
-A real shell with an AI agent one keystroke away.
 [![npm version](https://img.shields.io/npm/v/agent-sh.svg)](https://www.npmjs.com/package/agent-sh)
 [![license](https://img.shields.io/npm/l/agent-sh.svg)](https://github.com/guanyilun/agent-sh/blob/main/LICENSE)
-![demo](assets/demo.gif)
+A composable agent runtime — pair any frontend with any agent backend, over one shared extension layer.
+## Three example apps built on agent-sh
-I live in my terminal. A lot of the time I'm not coding — I'm deploying something, poking at a failing `rsync`, figuring out why `docker build` won't start, fixing a one-liner. And very often I need an AI agent to help. Spinning up a full coding agent for this stuff is overkill, and I got tired of copy-pasting errors into a chat window every time.
+agent-sh is small at its core and does its real work through extensions, so the same runtime drives very different apps. Three to start with — all sharing the same agent backends, tools, providers, and `~/.agent-sh/settings.json`:
-So I built agent-sh. Under the hood it's a normal shell on top of node-pty — your rc config, your aliases, vim and tmux all just work. But at the start of any line, type `>` and you're talking to a small agent that already sees your cwd, your last command, and its output. Nothing to set up, no project to explain.
+### 1. A shell with the agent one keystroke away — bundled with agent-sh
+A normal shell on top of node-pty — your rc config, your aliases, vim and tmux all just work. But at the start of any line, type `>` and you're talking to a small agent that already sees your cwd, your last command, and its output. Nothing to set up, no project to explain.
+![demo](assets/demo.gif)
 ```
 ~ $ ls -la                       # real shell command
@@ -19,10 +23,47 @@ So I built agent-sh. Under the hood it's a normal shell on top of node-pty — y
 ~ $ > draft a commit message     # agent reads your diff and shell history
 ```
-agent-sh is built to be agent-agnostic. The recommended path is the built-in agent `ash` — a lightweight agent designed so extensions can plug into the same tool surface. If you'd rather host an existing coding agent (pi, claude-code, opencode), you can [bring your own](#bring-your-own-agent) — with the trade-off that it manages its own separate tools.
+```bash
+npm install -g agent-sh
+```
+[Quick Start ↓](#quick-start)
+### 2. ashi — a standalone coding agent
+[**`@guanyilun/ashi`**](examples/extensions/ashi/) is the same `ash` agent in a chat-style TUI, with no shell underneath — just the agent. Installed separately, it reuses agent-sh's backend, tools, slash commands, providers, and skills, and adds session history, in-session branching, and LLM-driven compaction.
+```bash
+npm install -g @guanyilun/ashi
+ashi
+```
+ashi makes the runtime's **decoupled rendering** concrete: the frontend is itself an extension, and even *how* it draws tool calls and results is a swappable render extension. Same agent backend, same conversation — load a different render extension and the whole TUI restyles, no code changes:
+| pi-style rendering | claude-code-style rendering |
+|---|---|
+| ![ashi rendering tool calls pi-style](assets/ashi-pi-style.png) | ![ashi rendering tool calls claude-code-style](assets/ashi-claude-code-style.png) |
+### 3. asHub — a GUI coding agent
+[**firslov/asHub**](https://github.com/firslov/asHub) is a third-party cross-platform desktop app (Electron) built on the agent-sh runtime: a multi-session sidebar, persistence across restarts, and a live-streaming interface with Markdown, syntax-highlighted code, diffs, and tool-call rendering. macOS / Windows / Linux.
+It pushes the same decoupling one step further — the frontend isn't a terminal at all, but a full desktop GUI on the same runtime, backends, and tools:
+![asHub desktop GUI](assets/ashub.png)
+## How it works
+agent-sh is a **composable agent runtime**. At its center is a pure kernel — a typed event bus, a named-handler registry, and an extension loader — that knows nothing about terminals, LLMs, shells, or rendering. Everything else plugs into it: the agent backend, its tools, provider management, and the frontend that drives it.
+The frontend and the agent backend are both just components on the bus, so you **mix and match** them freely — wire several frontends to one backend, or keep one frontend and swap the backend underneath — all sharing the **same extension layer** of tools, content transforms, slash commands, and themes. `import { createCore } from "agent-sh"` gives you the headless kernel; load the pieces you want and wire your own I/O.
+For the kernel design in full — the bus, handlers, the compositor, and the shell ↔ agent boundary — see [Architecture](docs/architecture.md). To embed the runtime in your own frontend, see the [Library Guide](docs/library.md). The rest of this README covers the bundled shell.
 ## Quick Start
+**This sets up the agent-sh shell** — the frontend bundled in the `agent-sh` package. (For the other frontends, install [ashi](examples/extensions/ashi/) or [asHub](https://github.com/firslov/asHub) instead.)
 ### Installation
 Install from npm:
@@ -139,20 +180,6 @@ All three bridges receive agent-sh's per-query shell context (`<shell_events>`)
 **Caveat:** pi, claude-code, and opencode each manage their own tool surfaces, so agent-sh extensions that register tools (or skills, instructions, etc.) for the built-in `ash` agent generally won't be visible to a hosted backend. Frontend extensions (themes, content transforms, slash commands, the TUI renderer) keep working — only the agent-side capabilities differ. Use the bridges when you want that agent's toolset; stay on `ash` when you want agent-sh's extension ecosystem.
-## Key Features
-**Real terminal, zero compromise.** Full PTY with your shell config, aliases, and environment. Shell starts instantly — the agent connects asynchronously in the background.
-**One entry point, smart tool selection.** Type `>` and agent-sh figures out how to help. Scratchpad tools (`bash`, `read_file`, `grep`, `glob`) for investigation. Extensions add capabilities like running commands in your live shell. No modes to pick — the agent reasons about which tools to use based on your intent.
-**Context that just works.** Every query includes your cwd, recent commands, and their output. Run a failing test, type `> fix this`, and agent-sh knows exactly what happened. Context management works like shell history — continuous, persistent across restarts, no sessions to manage. See [Context Management](docs/context-management.md).
-**Any LLM, any backend.** agent-sh works with any OpenAI-compatible API out of the box. Define multiple providers in settings and switch models at runtime with `/model <name>`. Or swap in a completely different agent — bundled bridges run [pi](examples/extensions/pi-bridge/), [claude-code](examples/extensions/claude-code-bridge/), or [opencode](examples/extensions/opencode-bridge/) as a drop-in backend (see [Bring your own agent](#bring-your-own-agent)).
-**Extensible by design.** The entire system is built on a typed event bus. Extensions can add custom input modes, content transforms (render LaTeX as images, Mermaid as diagrams), themes, slash commands, or replace the agent backend entirely. The built-in TUI renderer is itself just an extension.
-**Embeddable as a library.** The core is a headless kernel — `import { createCore } from "agent-sh"` to build WebSocket servers, REST APIs, Electron apps, or test harnesses. No terminal required.
 ## Documentation
 Start with **Usage** to get running, then **Architecture** for the mental model.

package/dist/agent/agent-loop.js CHANGED Viewed

@@ -135,8 +135,8 @@ export class AgentLoop {
             }
             return acc;
         });
-        on("agent:submit", ({ query }) => {
-            this.handleQuery(query).catch(() => { });
+        on("agent:submit", ({ query, images }) => {
+            this.handleQuery(query, images).catch(() => { });
         });
         on("agent:cancel-request", (e) => {
             this.abortController?.abort(e.silent ? "silent" : undefined);
@@ -260,7 +260,7 @@ export class AgentLoop {
             budgetTokens: this.currentMode.contextWindow ?? DEFAULT_CONTEXT_WINDOW,
         }));
         onPipe("context:snapshot", (payload) => {
-            payload.messages = this.conversation.getMessages();
+            payload.messages = this.conversation.get();
             payload.contextWindow = this.currentMode.contextWindow ?? DEFAULT_CONTEXT_WINDOW;
             payload.activeTokens = this.conversation.estimateTokens();
             return payload;
@@ -657,12 +657,10 @@ export class AgentLoop {
         // filter, reorder, inject — whatever strategy fits.
         h.define("conversation:prepare", (messages) => messages);
         // ── Conversation primitives for compaction strategies ─────────
-        // Read messages (for inspection / computing new arrays) and replace
-        // the whole array (write side). Extensions implementing
-        // `conversation:compact` use these to observe and mutate.
-        h.define("conversation:get-messages", () => this.conversation.getMessages());
+        // Canonical array (link/replace index space), not forLLM().
+        h.define("conversation:get-messages", () => this.conversation.get());
         h.define("conversation:replace-messages", (msgs) => {
-            this.conversation.replaceMessages(msgs);
+            this.conversation.replace(msgs);
         });
         h.define("conversation:estimate-tokens", () => this.conversation.estimateTokens());
         h.define("conversation:estimate-prompt-tokens", () => this.conversation.estimatePromptTokens());
@@ -671,13 +669,13 @@ export class AgentLoop {
             const strategy = opts.strategy;
             if (strategy?.kind === "rewind" || strategy?.kind === "replace") {
                 const before = this.conversation.estimatePromptTokens();
-                const beforeLen = this.conversation.getMessages().length;
+                const beforeLen = this.conversation.get().length;
                 const next = strategy.kind === "rewind"
-                    ? this.conversation.getMessages().slice(0, strategy.toIndex)
+                    ? this.conversation.get().slice(0, strategy.toIndex)
                     : strategy.messages;
-                this.conversation.replaceMessages(next);
+                this.conversation.replace(next);
                 const after = this.conversation.estimatePromptTokens();
-                const afterLen = this.conversation.getMessages().length;
+                const afterLen = this.conversation.get().length;
                 return { before, after, evictedCount: Math.max(0, beforeLen - afterLen) };
             }
             return null;
@@ -755,7 +753,7 @@ export class AgentLoop {
             return result;
         });
     }
-    async handleQuery(query) {
+    async handleQuery(query, images) {
         // Cancel any in-flight loop (concurrent prompt handling)
         if (this.abortController) {
             this.abortController.abort();
@@ -778,7 +776,14 @@ export class AgentLoop {
             const userContent = queryContext
                 ? `<query_context>\n${queryContext}\n</query_context>\n\n${query}`
                 : query;
-            this.conversation.addUserMessage(userContent);
+            // Fail closed: an image sent to a non-vision model errors and leaves an
+            // unsendable message poisoning history, so require declared image support.
+            let userImages = images?.length ? images : undefined;
+            if (userImages && !this.currentMode.modalities?.includes("image")) {
+                this.bus.emit("ui:info", { message: `Current model has no declared image support — ${userImages.length} image(s) dropped.` });
+                userImages = undefined;
+            }
+            this.conversation.addUserMessage(userContent, userImages);
             this.bus.emit("conversation:message-appended", { role: "user", content: query });
             responseText = await this.executeLoop(signal);
         }
@@ -1262,7 +1267,7 @@ export class AgentLoop {
         // wrapTrailingWithDynamicContext for the cache-stability rationale.
         const rawMessages = [
             { role: "system", content: systemPrompt },
-            ...wrapTrailingWithDynamicContext(this.conversation.getMessages(), dynamicContext, toolPrompt),
+            ...wrapTrailingWithDynamicContext(this.conversation.forLLM(), dynamicContext, toolPrompt),
         ];
         // Let extensions transform the message array (compact, summarize, filter, etc.)
         const messages = this.handlers.call("conversation:prepare", rawMessages);

package/dist/agent/events.d.ts CHANGED Viewed

@@ -1,5 +1,5 @@
 import type { ProviderRegistration } from "./host-types.js";
-import type { ToolDefinition, ToolResultDisplay } from "./types.js";
+import type { ImageContent, ToolDefinition, ToolResultDisplay } from "./types.js";
 export interface AgentIdentity {
     name: string;
     version: string;
@@ -44,6 +44,7 @@ declare module "../core/event-bus.js" {
         };
         "agent:submit": {
             query: string;
+            images?: ImageContent[];
         };
         "agent:cancel-request": {
             silent?: boolean;

package/dist/agent/index.js CHANGED Viewed

@@ -14,6 +14,9 @@ import activateOpenrouter from "./providers/openrouter.js";
 import activateOpenai from "./providers/openai.js";
 import activateOpenaiCompatible from "./providers/openai-compatible.js";
 import activateDeepseek from "./providers/deepseek.js";
+import activateOllama from "./providers/ollama.js";
+import activateZaiCodingPlan from "./providers/zai-coding-plan.js";
+import activateOpencode from "./providers/opencode.js";
 import { findBash } from "../utils/executor.js";
 import { createBashTool } from "./tools/bash.js";
 import { createPwshTool } from "./tools/pwsh.js";
@@ -29,6 +32,12 @@ function persistedModelFor(providerName) {
         return undefined;
     return getSettings().providers?.[providerName]?.defaultModel;
 }
+/** The OpenAI SDK silently defaults an empty baseURL to api.openai.com, so a
+ *  provider with a key but no endpoint would misroute its key there. `openai`
+ *  is exempt: that default is its endpoint. */
+function usableProvider(p) {
+    return !!p?.apiKey && (!!p.baseURL || p.id === "openai");
+}
 function defaultReasoningBuilder(level) {
     if (level === "off")
         return {};
@@ -276,6 +285,8 @@ export default function agentBackend(ctx) {
         for (const [id, p] of resolvedProviders) {
             if (!p.apiKey)
                 continue;
+            if (!usableProvider(p))
+                continue;
             const shapeId = p.reasoningShape ?? id;
             for (const model of p.models) {
                 const mc = p.modelCapabilities?.get(model);
@@ -344,13 +355,32 @@ export default function agentBackend(ctx) {
         loadedExtensionNames = names;
         resolvedProviders = computeResolvedProviders();
         const settings = getSettings();
-        // Built-ins register unconditionally so `auth list` can enumerate them;
-        // the fallback must skip keyless entries or it lands on openrouter and
-        // bails at the `!effectiveApiKey` guard below.
-        const providerName = config.provider
-            ?? settings.defaultProvider
-            ?? [...resolvedProviders].find(([, p]) => p.apiKey)?.[0];
-        const activeProvider = providerName ? resolvedProviders.get(providerName) ?? null : null;
+        let providerName = config.provider ?? settings.defaultProvider;
+        let activeProvider = providerName ? resolvedProviders.get(providerName) ?? null : null;
+        // Inline CLI credentials carry their own endpoint, so they skip the
+        // usable-provider fallback that registry-driven selection needs.
+        if (!config.apiKey) {
+            if (!providerName) {
+                const first = [...resolvedProviders].find(([, p]) => usableProvider(p));
+                providerName = first?.[0];
+                activeProvider = first?.[1] ?? null;
+            }
+            else if (!usableProvider(activeProvider)) {
+                const reason = !activeProvider ? "is not registered"
+                    : !activeProvider.apiKey ? "has no API key configured"
+                        : "has no endpoint configured";
+                const next = [...resolvedProviders].find(([, p]) => usableProvider(p));
+                if (next) {
+                    bus.emit("ui:error", { message: `Provider "${providerName}" ${reason}; falling back to "${next[0]}".` });
+                    providerName = next[0];
+                    activeProvider = next[1];
+                }
+                else {
+                    bus.emit("ui:error", { message: `Provider "${providerName}" ${reason}, and no other configured provider has both an API key and an endpoint. Run \`agent-sh auth\` to configure one.` });
+                    return;
+                }
+            }
+        }
         // Persisted defaultModel wins over openrouter's hardcoded DEFAULT_MODELS[0].
         const effectiveApiKey = config.apiKey ?? activeProvider?.apiKey;
         const effectiveBaseURL = config.baseURL ?? activeProvider?.baseURL;
@@ -465,6 +495,10 @@ export default function agentBackend(ctx) {
             bus.emit("ui:error", { message: `Provider "${name}" has no API key configured` });
             return;
         }
+        if (!p.baseURL && p.id !== "openai") {
+            bus.emit("ui:error", { message: `Provider "${name}" has no endpoint configured` });
+            return;
+        }
         const switchModel = p.defaultModel ?? p.models[0];
         if (!switchModel) {
             bus.emit("ui:error", { message: `Provider "${name}" has no models configured` });
@@ -501,4 +535,7 @@ export function activateAgent(ctx) {
     if (process.env.OPENAI_BASE_URL)
         activateOpenaiCompatible(agentCtx);
     activateDeepseek(agentCtx);
+    activateOllama(agentCtx);
+    activateZaiCodingPlan(agentCtx);
+    activateOpencode(agentCtx);
 }

package/dist/agent/live-view.d.ts CHANGED Viewed

@@ -19,7 +19,7 @@ export declare class LiveView {
     constructor(handlers?: HandlerFunctions, instanceId?: string);
     private getMessagesJson;
     private invalidateMessagesCache;
-    addUserMessage(text: string): void;
+    addUserMessage(text: string, images?: ImageContent[]): void;
     addAssistantMessage(content: string | null, toolCalls?: {
         id: string;
         function: {
@@ -34,9 +34,9 @@ export declare class LiveView {
     appendUserMessage(text: string): void;
     private hasOpenToolCalls;
     private flushPendingMessages;
-    getMessages(): ChatCompletionMessageParam[];
-    get(): AgentShMessage[];
+    /** Send-shaped; may be longer than get() (dangling calls stubbed) — never link()/replace() by these indices. */
     forLLM(): ChatCompletionMessageParam[];
+    get(): AgentShMessage[];
     replace(msgs: AgentShMessage[]): void;
     link(index: number, entryId: string): void;
     /** DeepSeek 400s on tool messages without a matching tool_call;

package/dist/agent/live-view.js CHANGED Viewed

@@ -1,4 +1,3 @@
-import { stripMeta } from "./llm-client.js";
 export class LiveView {
     messages = [];
     messagesDirty = true;
@@ -26,8 +25,19 @@ export class LiveView {
         this.messagesDirty = true;
         this.cachedMessagesJson = null;
     }
-    addUserMessage(text) {
-        this.messages.push({ role: "user", content: text });
+    addUserMessage(text, images) {
+        if (images?.length) {
+            const parts = [];
+            if (text)
+                parts.push({ type: "text", text });
+            for (const img of images) {
+                parts.push({ type: "image_url", image_url: { url: `data:${img.mimeType};base64,${img.data}` } });
+            }
+            this.messages.push({ role: "user", content: parts });
+        }
+        else {
+            this.messages.push({ role: "user", content: text });
+        }
         this.invalidateMessagesCache();
     }
     addAssistantMessage(content, toolCalls, extras) {
@@ -131,15 +141,13 @@ export class LiveView {
         }
         this.invalidateMessagesCache();
     }
-    getMessages() {
+    /** Send-shaped; may be longer than get() (dangling calls stubbed) — never link()/replace() by these indices. */
+    forLLM() {
         return this.normalizeReasoningConsistency(this.stubDanglingToolCalls(this.dropOrphanToolMessages(this.messages)));
     }
     get() {
         return this.messages;
     }
-    forLLM() {
-        return this.getMessages().map(stripMeta);
-    }
     replace(msgs) {
         this.replaceMessages(msgs);
     }

package/dist/agent/providers/ollama.d.ts ADDED Viewed

@@ -0,0 +1,11 @@
+/**
+ * Ollama provider — local daemon or Ollama Cloud.
+ *
+ * Cloud auth:  agent-sh auth login ollama-cloud
+ * Local host:  OLLAMA_HOST (default http://localhost:11434)
+ *
+ * Catalog comes from /api/tags; per-model context length is fetched
+ * from /api/show. Chat goes through the OpenAI-compatible /v1 shim.
+ */
+import type { AgentContext } from "../host-types.js";
+export default function activate(ctx: AgentContext): void;

package/dist/agent/providers/ollama.js ADDED Viewed

@@ -0,0 +1,72 @@
+import { resolveApiKey } from "../../cli/auth/keys.js";
+const ECHO_REASONING_PATTERNS = [/deepseek/i];
+export default function activate(ctx) {
+    const cloudKey = resolveApiKey("ollama-cloud").key ?? process.env.OLLAMA_API_KEY;
+    const host = cloudKey
+        ? "https://ollama.com"
+        : (process.env.OLLAMA_HOST ?? "http://localhost:11434").replace(/\/$/, "");
+    const id = cloudKey ? "ollama-cloud" : "ollama";
+    const sdkKey = cloudKey || "no-key";
+    const noAuth = !cloudKey;
+    const baseURL = `${host}/v1`;
+    const headers = {};
+    if (cloudKey)
+        headers.Authorization = `Bearer ${cloudKey}`;
+    ctx.agent.providers.configure(id, {
+        reasoningParams: (level) => {
+            if (level === "off")
+                return { reasoning_effort: "none" };
+            return { reasoning_effort: level === "xhigh" ? "high" : level };
+        },
+    });
+    ctx.agent.providers.register({ id, apiKey: sdkKey, baseURL, models: [], noAuth });
+    fetchCatalog(host, headers).then((models) => {
+        if (models.length === 0)
+            return;
+        ctx.agent.providers.register({
+            id,
+            apiKey: sdkKey,
+            baseURL,
+            defaultModel: models[0].id,
+            models,
+            noAuth,
+        });
+    }).catch(() => { });
+}
+async function fetchCatalog(host, headers) {
+    const tagsRes = await fetch(`${host}/api/tags`, { headers });
+    if (!tagsRes.ok)
+        return [];
+    const tagsData = await tagsRes.json();
+    const names = (tagsData.models ?? []).map((m) => m.name);
+    if (names.length === 0)
+        return [];
+    const ctxs = await Promise.all(names.map((name) => fetchContextLength(host, headers, name).catch(() => undefined)));
+    return names.map((name, i) => ({
+        id: name,
+        contextWindow: ctxs[i],
+        echoReasoning: ECHO_REASONING_PATTERNS.some((re) => re.test(name)),
+    }));
+}
+async function fetchContextLength(host, headers, name) {
+    const res = await fetch(`${host}/api/show`, {
+        method: "POST",
+        headers: { ...headers, "Content-Type": "application/json" },
+        body: JSON.stringify({ name }),
+    });
+    if (!res.ok)
+        return undefined;
+    const data = await res.json();
+    const info = data.model_info ?? {};
+    const arch = info["general.architecture"];
+    if (arch) {
+        const ctx = info[`${arch}.context_length`];
+        if (typeof ctx === "number")
+            return ctx;
+    }
+    for (const [k, v] of Object.entries(info)) {
+        if (k.endsWith(".context_length") && typeof v === "number")
+            return v;
+    }
+    return undefined;
+}

package/dist/agent/providers/opencode.d.ts ADDED Viewed

@@ -0,0 +1,10 @@
+/**
+ * OpenCode Zen & Go providers — runtime model discovery via /models +
+ * models.dev metadata enrichment.
+ *
+ * Registers two providers:
+ *   - opencode     — Zen tier  (https://opencode.ai/zen/v1)
+ *   - opencode-go  — Go tier   (https://opencode.ai/zen/go/v1)
+ */
+import type { AgentContext } from "../host-types.js";
+export default function activate(ctx: AgentContext): void;

package/dist/agent/providers/opencode.js ADDED Viewed

@@ -0,0 +1,112 @@
+import { resolveApiKey } from "../../cli/auth/keys.js";
+const ZEN_BASE_URL = "https://opencode.ai/zen/v1";
+const GO_BASE_URL = "https://opencode.ai/zen/go/v1";
+const MODELS_DEV_ENDPOINT = "https://models.dev/api.json";
+const DEFAULT_CTX = 128_000;
+const DEFAULT_MAX_TOKENS = 16_384;
+const ZEN_FALLBACK = ["claude-sonnet-4-6"];
+const GO_FALLBACK = ["gpt-5.2"];
+// ── Helpers ──────────────────────────────────────────────────────
+async function fetchJson(url) {
+    const res = await fetch(url, {
+        headers: { Accept: "application/json" },
+        signal: AbortSignal.timeout(15_000),
+    });
+    if (!res.ok)
+        throw new Error(`HTTP ${res.status}`);
+    return res.json();
+}
+function findEntry(provider, id) {
+    const direct = provider?.models?.[id];
+    if (direct)
+        return direct;
+    if (!provider?.models)
+        return undefined;
+    return Object.values(provider.models).find((m) => m.id === id);
+}
+function resolveModel(id, meta) {
+    const raw = meta?.modalities?.input;
+    const modalities = Array.isArray(raw)
+        ? raw.filter((v) => v === "text" || v === "image")
+        : ["text"];
+    return {
+        id,
+        reasoning: meta?.reasoning ?? false,
+        contextWindow: (typeof meta?.limit?.context === "number" && meta.limit.context > 0)
+            ? meta.limit.context : DEFAULT_CTX,
+        maxTokens: (typeof meta?.limit?.output === "number" && meta.limit.output > 0)
+            ? meta.limit.output : DEFAULT_MAX_TOKENS,
+        modalities,
+    };
+}
+function reasoningParams(level) {
+    if (level === "off")
+        return { reasoning_effort: "none" };
+    return { reasoning_effort: level === "xhigh" ? "high" : level };
+}
+// ── Activation ───────────────────────────────────────────────────
+export default function activate(ctx) {
+    const apiKey = process.env.OPENCODE_API_KEY ??
+        resolveApiKey("opencode").key ?? undefined;
+    ctx.agent.providers.configure("opencode", { reasoningParams });
+    ctx.agent.providers.register({
+        id: "opencode", apiKey, baseURL: ZEN_BASE_URL,
+        defaultModel: ZEN_FALLBACK[0], models: ZEN_FALLBACK,
+        supportsReasoningEffort: true,
+    });
+    ctx.agent.providers.configure("opencode-go", { reasoningParams });
+    ctx.agent.providers.register({
+        id: "opencode-go", apiKey, baseURL: GO_BASE_URL,
+        defaultModel: GO_FALLBACK[0], models: GO_FALLBACK,
+        supportsReasoningEffort: true,
+    });
+    if (!apiKey)
+        return;
+    fetchModelsDev()
+        .then(async (md) => {
+        const zenIds = await fetchModelIds(ZEN_BASE_URL);
+        const goIds = await fetchModelIds(GO_BASE_URL);
+        const resolve = (ids, prov, fb) => (ids.length > 0 ? ids : fb).map((id) => resolveModel(id, findEntry(prov, id)));
+        const zen = resolve(zenIds, md?.opencode, ZEN_FALLBACK);
+        const go = resolve(goIds, md?.["opencode-go"], GO_FALLBACK);
+        ctx.agent.providers.register({
+            id: "opencode", apiKey, baseURL: ZEN_BASE_URL,
+            defaultModel: zen[0]?.id ?? ZEN_FALLBACK[0], models: zen,
+            supportsReasoningEffort: true,
+        });
+        ctx.agent.providers.register({
+            id: "opencode-go", apiKey, baseURL: GO_BASE_URL,
+            defaultModel: go[0]?.id ?? GO_FALLBACK[0], models: go,
+            supportsReasoningEffort: true,
+        });
+    })
+        .catch(() => { });
+}
+async function fetchModelsDev() {
+    try {
+        const payload = await fetchJson(MODELS_DEV_ENDPOINT);
+        if (!payload || typeof payload !== "object" || Array.isArray(payload))
+            return undefined;
+        return payload;
+    }
+    catch {
+        return undefined;
+    }
+}
+async function fetchModelIds(baseURL) {
+    try {
+        const res = await fetch(`${baseURL}/models`, {
+            headers: { Accept: "application/json" },
+            signal: AbortSignal.timeout(10_000),
+        });
+        if (!res.ok)
+            return [];
+        const payload = await res.json();
+        if (!Array.isArray(payload.data))
+            return [];
+        return [...new Set(payload.data.map((e) => e.id).filter(Boolean))];
+    }
+    catch {
+        return [];
+    }
+}

package/dist/agent/providers/openrouter.js CHANGED Viewed

@@ -14,6 +14,14 @@ function buildReasoningParams(level, _model) {
         ? { reasoning: { effort: "none" } }
         : { reasoning: { effort: level } };
 }
+/**
+ * Reduces OpenRouter's input_modalities list to its "text" / "image" entries.
+ * Yields undefined for a non-array input or when no entry qualifies, so the
+ * fail-closed image guard treats the model as text-only.
+ */
+function toModalities(input) {
+    if (!Array.isArray(input))
+        return undefined;
+    const kept = [];
+    for (const modality of input) {
+        if (modality === "text" || modality === "image")
+            kept.push(modality);
+    }
+    return kept.length > 0 ? kept : undefined;
+}
 export default function activate(ctx) {
     const apiKey = resolveApiKey("openrouter").key;
     ctx.agent.providers.configure("openrouter", { reasoningParams: buildReasoningParams });
@@ -42,6 +50,7 @@ export default function activate(ctx) {
                 reasoning: m.supported_parameters?.includes("reasoning") ?? false,
                 contextWindow: m.context_length,
                 echoReasoning: userOverrides.get(m.id) ?? patterns.some((re) => re.test(m.id)),
+                modalities: toModalities(m.architecture?.input_modalities),
             })),
         });
     }).catch(() => { });

package/dist/agent/providers/zai-coding-plan.d.ts ADDED Viewed

@@ -0,0 +1,5 @@
+/**
+ * Z.AI Coding Plan — Zhipu AI's subscription GLM models for coding.
+ */
+import type { AgentContext } from "../host-types.js";
+export default function activate(ctx: AgentContext): void;

package/dist/agent/providers/zai-coding-plan.js ADDED Viewed

@@ -0,0 +1,26 @@
+import { resolveApiKey } from "../../cli/auth/keys.js";
+const BASE_URL = "https://api.z.ai/api/coding/paas/v4"; // passed to providers.register() as this provider's baseURL
+const ID = "zai-coding-plan"; // provider id used for resolveApiKey(), providers.configure() and providers.register()
+const DEFAULT_MODELS = [ // built-in model list; entry 0 supplies the registered defaultModel
+    { id: "glm-5.1", reasoning: true, contextWindow: 200_000 }, // NOTE(review): contextWindow presumably counts tokens — confirm
+    { id: "glm-5-turbo", reasoning: true, contextWindow: 200_000 },
+    { id: "glm-4.7", reasoning: true, contextWindow: 204_800 },
+    { id: "glm-4.5-air", reasoning: true, contextWindow: 131_072 },
+];
+/**
+ * Builds the reasoning-related fields for a given reasoning level; this is
+ * the function handed to providers.configure() as `reasoningParams`.
+ *
+ * @param {string} level - "off" disables thinking; "xhigh" is sent as "high";
+ *   any other level is forwarded unchanged as `reasoning_effort`.
+ * @param {*} _model - Unused.
+ * @returns {object} `{ thinking }` when off, otherwise `{ thinking, reasoning_effort }`.
+ */
+function buildReasoningParams(level, _model) {
+    switch (level) {
+        case "off":
+            return { thinking: { type: "disabled" } };
+        case "xhigh":
+            return { thinking: { type: "enabled" }, reasoning_effort: "high" };
+        default:
+            return { thinking: { type: "enabled" }, reasoning_effort: level };
+    }
+}
+/**
+ * Registers the Z.AI Coding Plan provider on the agent.
+ *
+ * The API key comes from resolveApiKey(ID), falling back to the ZAI_API_KEY
+ * and then the ZHIPU_API_KEY environment variable. It may still be undefined,
+ * in which case the provider is registered without a key.
+ *
+ * @param ctx - Agent context exposing `ctx.agent.providers`.
+ */
+export default function activate(ctx) {
+    const resolved = resolveApiKey(ID);
+    ctx.agent.providers.configure(ID, { reasoningParams: buildReasoningParams });
+    const registration = {
+        id: ID,
+        apiKey: resolved.key ?? process.env.ZAI_API_KEY ?? process.env.ZHIPU_API_KEY,
+        baseURL: BASE_URL,
+        defaultModel: DEFAULT_MODELS[0].id,
+        models: DEFAULT_MODELS,
+    };
+    ctx.agent.providers.register(registration);
+}

package/dist/agent/subagent.js CHANGED Viewed

@@ -109,7 +109,7 @@ async function streamOnce(llmClient, systemPrompt, conversation, apiTools, model
     const stream = await llmClient.stream({
         messages: [
             { role: "system", content: systemPrompt },
-            ...wrapTrailingWithDynamicContext(conversation.getMessages(), dynamicContext ?? ""),
+            ...wrapTrailingWithDynamicContext(conversation.forLLM(), dynamicContext ?? ""),
         ],
         tools: apiTools.length > 0 ? apiTools : undefined,
         model,

package/dist/cli/args.js CHANGED Viewed

@@ -53,8 +53,8 @@ export function parseArgs(argv, env = process.env) {
     let provider;
     let backend;
     let shell = env.SHELL || "/bin/bash";
-    let apiKey = env.OPENAI_API_KEY;
-    let baseURL = env.OPENAI_BASE_URL;
+    let apiKey;
+    let baseURL;
     for (let i = 0; i < argv.length; i++) {
         const arg = argv[i];
         if (arg === "--model" && argv[i + 1]) {