npm - agent-sh - Versions diffs - 0.13.3 → 0.13.5 - Mend

agent-sh 0.13.3 → 0.13.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (13)

package/dist/agent/agent-loop.d.ts +2 -0
package/dist/agent/agent-loop.js +115 -87
package/dist/agent/index.js +5 -12
package/dist/agent/providers/openai.d.ts +2 -0
package/dist/agent/providers/openai.js +9 -2
package/examples/extensions/ash-acp-bridge/src/index.ts +5 -2
package/examples/extensions/ashi/package.json +2 -2
package/examples/extensions/ashi/src/frontend.ts +95 -22
package/examples/extensions/ashi/src/multi-session-store.ts +8 -0
package/examples/extensions/ollama.ts +19 -17
package/examples/extensions/zai-coding-plan.ts +2 -1
package/package.json +1 -1
package/examples/extensions/ollama-cloud.ts +0 -78

package/dist/agent/agent-loop.d.ts CHANGED Viewed

@@ -42,6 +42,7 @@ export declare class AgentLoop implements AgentBackend {
     private ctorListeners;
     private ctorPipeListeners;
     private lastProjectSkillNames;
+    private lastAgentInfo;
     private sessionStartTime;
     private toolCallCounts;
     private totalToolCalls;
@@ -99,6 +100,7 @@ export declare class AgentLoop implements AgentBackend {
     private cancel;
     private reasoningParams;
     private get currentMode();
+    private emitAgentInfoIfChanged;
     private get currentModel();
     /**
      * Run compaction via the `conversation:compact` handler. After any

package/dist/agent/agent-loop.js CHANGED Viewed

@@ -60,6 +60,7 @@ export class AgentLoop {
     ctorListeners = [];
     ctorPipeListeners = [];
     lastProjectSkillNames = new Set();
+    lastAgentInfo = null;
     // ── Session telemetry — behavioral self-awareness ──────────────
     // Every ash deserves to know what it's been doing. This tracks the
     // agent's own behavioral patterns across the session: which tools
@@ -87,7 +88,7 @@ export class AgentLoop {
     // doing X." Addresses Q3 in QUESTIONS.md.
     lastErrorByTool = new Map(); // tool → error summary
     lastErrorByFile = new Map(); // file path → error summary
-    static THINKING_LEVELS = ["off", "low", "medium", "high"];
+    static THINKING_LEVELS = ["off", "low", "medium", "high", "xhigh"];
     bus;
     llmClient;
     handlers;
@@ -168,24 +169,20 @@ export class AgentLoop {
             ];
             if (prev) {
                 const newIdx = this.modes.findIndex((m) => m.model === prev.model && m.provider === prev.provider);
-                if (newIdx !== -1)
+                if (newIdx !== -1) {
                     this.currentModeIndex = newIdx;
+                    const next = this.modes[newIdx];
+                    if (next.providerConfig && next.providerConfig !== prev.providerConfig) {
+                        this.llmClient.reconfigure({ ...next.providerConfig, model: next.model });
+                    }
+                }
             }
             if (activePreserved && prev) {
                 this.bus.emit("ui:info", {
                     message: `${prev.provider}:${prev.model} is not in the refreshed catalog — keeping it active until you /model to another.`,
                 });
             }
-            const active = this.modes[this.currentModeIndex];
-            if (active && active.contextWindow !== prev?.contextWindow) {
-                this.bus.emit("agent:info", {
-                    name: "ash",
-                    version: PACKAGE_VERSION,
-                    model: active.model,
-                    provider: active.provider,
-                    contextWindow: active.contextWindow,
-                });
-            }
+            this.emitAgentInfoIfChanged();
             this.bus.emit("config:changed", {});
         });
         // Fires before wire() too — agent-backend emits this from
@@ -203,6 +200,7 @@ export class AgentLoop {
             else {
                 this.llmClient.model = m.model;
             }
+            this.emitAgentInfoIfChanged();
             this.bus.emit("config:changed", {});
         });
         const getToolsPipe = () => ({ tools: this.getTools() });
@@ -251,7 +249,7 @@ export class AgentLoop {
                 this.llmClient.model = m.model;
             }
             const label = m.provider ? `${m.provider}: ${m.model}` : m.model;
-            this.bus.emit("agent:info", { name: "ash", version: PACKAGE_VERSION, model: m.model, provider: m.provider, contextWindow: m.contextWindow });
+            this.emitAgentInfoIfChanged();
             // Persist as the new default — selection survives restart.
             // Safe even for dynamic providers: agent-backend defers mode
             // resolution to `core:extensions-loaded`, so the extension gets
@@ -370,6 +368,8 @@ export class AgentLoop {
                 this.bus.emit("conversation:message-appended", { role: "system", content: note });
             }
         });
+        this.lastAgentInfo = null;
+        this.emitAgentInfoIfChanged();
     }
     /** Unsubscribe from bus events — deactivates this backend. */
     unwire() {
@@ -507,11 +507,29 @@ export class AgentLoop {
             return mode.buildReasoningParams(this.thinkingLevel);
         if (this.thinkingLevel === "off")
             return {};
-        return { reasoning_effort: this.thinkingLevel };
+        const effort = this.thinkingLevel === "xhigh" ? "high" : this.thinkingLevel;
+        return { reasoning_effort: effort };
     }
     get currentMode() {
         return this.modes[this.currentModeIndex];
     }
+    emitAgentInfoIfChanged() {
+        const m = this.modes[this.currentModeIndex];
+        if (!m)
+            return;
+        const prev = this.lastAgentInfo;
+        if (prev && prev.model === m.model && prev.provider === m.provider && prev.contextWindow === m.contextWindow) {
+            return;
+        }
+        this.lastAgentInfo = { model: m.model, provider: m.provider, contextWindow: m.contextWindow };
+        this.bus.emit("agent:info", {
+            name: "ash",
+            version: PACKAGE_VERSION,
+            model: m.model,
+            provider: m.provider,
+            contextWindow: m.contextWindow,
+        });
+    }
     get currentModel() {
         return this.modes[this.currentModeIndex].model;
     }
@@ -1076,12 +1094,15 @@ export class AgentLoop {
                 streamedCalls: streamedToolCalls,
             });
             fullResponseText += text;
-            // Record the assistant message via protocol
-            this.toolProtocol.recordAssistant(this.conversation, text, toolCalls, extras);
-            this.bus.emit("conversation:message-appended", {
-                role: "assistant",
-                content: text,
-            });
+            if (text || toolCalls.length > 0) {
+                this.toolProtocol.recordAssistant(this.conversation, text, toolCalls, extras);
+                this.bus.emit("conversation:message-appended", {
+                    role: "assistant",
+                    content: text,
+                });
+            }
+            if (signal.aborted)
+                break;
             // No tool calls → agent is done
             if (toolCalls.length === 0) {
                 this.conversation.eagerNucleateAgent(fullResponseText);
@@ -1502,83 +1523,90 @@ export class AgentLoop {
         };
         this.bus.emit("llm:request", requestParams);
         const stream = await this.llmClient.stream({ ...requestParams, signal });
-        for await (const chunk of stream) {
-            if (signal.aborted)
-                break;
-            this.bus.emit("llm:chunk", { chunk });
-            // Token usage (may arrive in a chunk with empty choices)
-            if (chunk.usage) {
-                const u = chunk.usage;
-                const promptTokens = u.prompt_tokens ?? 0;
-                this.bus.emit("agent:usage", {
-                    prompt_tokens: promptTokens,
-                    completion_tokens: u.completion_tokens ?? 0,
-                    total_tokens: u.total_tokens ?? 0,
-                });
-                // Feed accurate token count back to conversation state
-                if (promptTokens > 0) {
-                    this.conversation.updateApiTokenCount(promptTokens);
-                }
-            }
-            const choice = chunk.choices[0];
-            if (!choice)
-                continue;
-            const delta = choice.delta;
-            // Text content
-            if (delta?.content) {
-                text += delta.content;
-                // Filter tool tags from display output (inline mode)
-                const displayText = streamFilter
-                    ? streamFilter.feed(delta.content)
-                    : delta.content;
-                if (displayText) {
-                    this.bus.emitTransform("agent:response-chunk", {
-                        blocks: [{ type: "text", text: displayText }],
+        try {
+            for await (const chunk of stream) {
+                if (signal.aborted)
+                    break;
+                this.bus.emit("llm:chunk", { chunk });
+                // Token usage (may arrive in a chunk with empty choices)
+                if (chunk.usage) {
+                    const u = chunk.usage;
+                    const promptTokens = u.prompt_tokens ?? 0;
+                    this.bus.emit("agent:usage", {
+                        prompt_tokens: promptTokens,
+                        completion_tokens: u.completion_tokens ?? 0,
+                        total_tokens: u.total_tokens ?? 0,
                     });
+                    // Feed accurate token count back to conversation state
+                    if (promptTokens > 0) {
+                        this.conversation.updateApiTokenCount(promptTokens);
+                    }
                 }
-            }
-            const d = delta;
-            for (const name of ["reasoning", "reasoning_content"]) {
-                if (typeof d?.[name] === "string" && d[name].length > 0) {
-                    reasoning += d[name];
-                    reasoningField ??= name;
-                    this.bus.emit("agent:thinking-chunk", { text: d[name] });
-                }
-            }
-            if (Array.isArray(d?.reasoning_details)) {
-                for (const x of d.reasoning_details) {
-                    const idx = typeof x?.index === "number" ? x.index : reasoningDetailsByIndex.size;
-                    const prev = reasoningDetailsByIndex.get(idx);
-                    if (!prev) {
-                        reasoningDetailsByIndex.set(idx, { ...x });
+                const choice = chunk.choices[0];
+                if (!choice)
+                    continue;
+                const delta = choice.delta;
+                // Text content
+                if (delta?.content) {
+                    text += delta.content;
+                    // Filter tool tags from display output (inline mode)
+                    const displayText = streamFilter
+                        ? streamFilter.feed(delta.content)
+                        : delta.content;
+                    if (displayText) {
+                        this.bus.emitTransform("agent:response-chunk", {
+                            blocks: [{ type: "text", text: displayText }],
+                        });
                     }
-                    else {
-                        if (typeof x.text === "string")
-                            prev.text = (prev.text ?? "") + x.text;
-                        for (const [k, v] of Object.entries(x))
-                            if (k !== "text" && prev[k] === undefined)
-                                prev[k] = v;
+                }
+                const d = delta;
+                for (const name of ["reasoning", "reasoning_content"]) {
+                    if (typeof d?.[name] === "string" && d[name].length > 0) {
+                        reasoning += d[name];
+                        reasoningField ??= name;
+                        this.bus.emit("agent:thinking-chunk", { text: d[name] });
                     }
                 }
-            }
-            // Tool calls (streamed incrementally)
-            if (delta?.tool_calls) {
-                for (const tc of delta.tool_calls) {
-                    const idx = tc.index;
-                    if (!pendingToolCalls[idx]) {
-                        pendingToolCalls[idx] = {
-                            id: tc.id,
-                            name: tc.function.name,
-                            argumentsJson: "",
-                        };
+                if (Array.isArray(d?.reasoning_details)) {
+                    for (const x of d.reasoning_details) {
+                        const idx = typeof x?.index === "number" ? x.index : reasoningDetailsByIndex.size;
+                        const prev = reasoningDetailsByIndex.get(idx);
+                        if (!prev) {
+                            reasoningDetailsByIndex.set(idx, { ...x });
+                        }
+                        else {
+                            if (typeof x.text === "string")
+                                prev.text = (prev.text ?? "") + x.text;
+                            for (const [k, v] of Object.entries(x))
+                                if (k !== "text" && prev[k] === undefined)
+                                    prev[k] = v;
+                        }
                     }
-                    if (tc.function?.arguments) {
-                        pendingToolCalls[idx].argumentsJson +=
-                            tc.function.arguments;
+                }
+                // Tool calls (streamed incrementally)
+                if (delta?.tool_calls) {
+                    for (const tc of delta.tool_calls) {
+                        const idx = tc.index;
+                        if (!pendingToolCalls[idx]) {
+                            pendingToolCalls[idx] = {
+                                id: tc.id,
+                                name: tc.function.name,
+                                argumentsJson: "",
+                            };
+                        }
+                        if (tc.function?.arguments) {
+                            pendingToolCalls[idx].argumentsJson +=
+                                tc.function.arguments;
+                        }
                     }
                 }
             }
         }
+        catch (e) {
+            // On abort, fall through with whatever was accumulated so far.
+            if (!signal.aborted)
+                throw e;
+        }
         // Flush any buffered content from the stream filter
         if (streamFilter) {
             const remaining = streamFilter.flush();

package/dist/agent/index.js CHANGED Viewed

@@ -2,7 +2,6 @@ import { AgentLoop } from "./agent-loop.js";
 import { LlmClient } from "../utils/llm-client.js";
 import { createLlmFacade } from "../utils/llm-facade.js";
 import { resolveProvider, getProviderNames, getSettings } from "../core/settings.js";
-import { PACKAGE_VERSION } from "../utils/package-version.js";
 import { discoverSkills } from "./skills.js";
 import { resolveApiKey } from "../cli/auth/keys.js";
 import activateOpenrouter from "./providers/openrouter.js";
@@ -15,7 +14,9 @@ function persistedModelFor(providerName) {
     return getSettings().providers?.[providerName]?.defaultModel;
 }
 function defaultReasoningBuilder(level) {
-    return level === "off" ? {} : { reasoning_effort: level };
+    if (level === "off")
+        return {};
+    return { reasoning_effort: level === "xhigh" ? "high" : level };
 }
 function mergeCaps(settingsCaps, payloadCaps, modelIds) {
     if (!settingsCaps)
@@ -118,11 +119,12 @@ export default function agentBackend(ctx) {
     ctx.define("llm:get-client", () => llmClient);
     ctx.define("llm:invoke", (messages, opts) => {
         const effort = opts?.reasoningEffort;
+        const clampedEffort = effort === "xhigh" ? "high" : effort;
         return llmClient.complete({
             messages: messages,
             max_tokens: opts?.maxTokens,
             model: opts?.model,
-            ...(effort && effort !== "off" ? { reasoning_effort: effort } : {}),
+            ...(clampedEffort && clampedEffort !== "off" ? { reasoning_effort: clampedEffort } : {}),
         });
     });
     let modes = [];
@@ -224,13 +226,6 @@ export default function agentBackend(ctx) {
                         });
                     },
                 });
-                bus.emit("agent:info", {
-                    name: "ash",
-                    version: PACKAGE_VERSION,
-                    model: llmClient.model,
-                    provider: modes[initialModeIndex]?.provider,
-                    contextWindow: modes[initialModeIndex]?.contextWindow,
-                });
             },
         });
     });
@@ -327,9 +322,7 @@ export default function agentBackend(ctx) {
             };
         });
         bus.emit("config:set-modes", { modes: newModes });
-        bus.emit("agent:info", { name: "ash", version: PACKAGE_VERSION, model: switchModel, provider: name, contextWindow: p.contextWindow });
         bus.emit("ui:info", { message: `Switched to ${name} (${switchModel})` });
-        bus.emit("config:changed", {});
     });
     bus.onPipe("banner:collect", (e) => {
         if (e.activeBackend && e.activeBackend !== "ash")

package/dist/agent/providers/openai.d.ts CHANGED Viewed

@@ -2,6 +2,8 @@
  * Cloud OpenAI (api.openai.com). reasoning_effort vocabulary diverges per
  * family: o-series has no off; gpt-5-codex floors at "low"; plain gpt-5
  * floors at "minimal"; gpt-5.1+ accepts "none" as documented full off.
+ * Top tier: only gpt-5.1-codex-max and gpt-5.[4-9]+ accept "xhigh"; others
+ * clamp to "high".
  */
 import type { AgentContext } from "../host-types.js";
 export default function activate(ctx: AgentContext): void;

package/dist/agent/providers/openai.js CHANGED Viewed

@@ -18,9 +18,16 @@ function offEffortFor(model) {
         return "minimal";
     return null;
 }
+function supportsXhigh(model) {
+    if (model.startsWith("gpt-5.1-codex-max"))
+        return true;
+    return /^gpt-5\.[4-9]/.test(model);
+}
 function buildReasoningParams(level, model) {
-    if (level !== "off")
-        return { reasoning_effort: level };
+    if (level !== "off") {
+        const effort = level === "xhigh" && !(model && supportsXhigh(model)) ? "high" : level;
+        return { reasoning_effort: effort };
+    }
     const off = model ? offEffortFor(model) : null;
     return off ? { reasoning_effort: off } : {};
 }

package/examples/extensions/ash-acp-bridge/src/index.ts CHANGED Viewed

@@ -446,10 +446,13 @@ function getModelsPayload(): Record<string, unknown> | undefined {
   if (!core) return undefined;
   const info = core.bus.emitPipe("config:get-models", { models: [], active: null });
   if (!info.models.length) return undefined;
+  const idFor = (m: { model: string; provider: string }) =>
+    m.provider ? `${m.model}@${m.provider}` : m.model;
+  const current = info.active ?? info.models[0]!;
   return {
-    currentModelId: info.active?.model ?? info.models[0]?.model,
+    currentModelId: idFor(current),
     availableModels: info.models.map((m) => ({
-      modelId: m.model,
+      modelId: idFor(m),
       name: m.provider ? `${m.provider}/${m.model}` : m.model,
       description: m.provider ? `Provider: ${m.provider}` : "",
     })),

package/examples/extensions/ashi/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@guanyilun/ashi",
-  "version": "0.1.1",
+  "version": "0.1.4",
   "description": "Ash in an interactive TUI — agent-sh's built-in agent without the shell underneath",
   "type": "module",
   "main": "dist/cli.js",
@@ -48,7 +48,7 @@
   },
   "dependencies": {
     "@earendil-works/pi-tui": "^0.74.0",
-    "agent-sh": "^0.13.2",
+    "agent-sh": "^0.13.3",
     "chalk": "^5.5.0",
     "cli-highlight": "^2.1.11"
   },

package/examples/extensions/ashi/src/frontend.ts CHANGED Viewed

@@ -175,6 +175,7 @@ export function mountAshi(
   const chat = new Container();
   const footerSlot = new Container();
+  const queueSlot = new Container();
   const editor = new Editor(tui, editorTheme(), { paddingX: 1 });
   editor.setAutocompleteProvider(new BusAutocompleteProvider(bus));
   editor.onSubmit = (text) => {
@@ -188,6 +189,12 @@ export function mountAshi(
       bus.emit("command:execute", { name, args });
       return;
     }
+    if (processing) {
+      queuedQueries.push(query);
+      renderQueueSlot();
+      tui.requestRender();
+      return;
+    }
     bus.emit("agent:submit", { query });
   };
@@ -211,6 +218,7 @@ export function mountAshi(
   tui.addChild(chat);
   tui.addChild(footerSlot);
+  tui.addChild(queueSlot);
   tui.addChild(editor);
   tui.addChild(statusFooter);
   tui.setFocus(editor);
@@ -227,6 +235,16 @@ export function mountAshi(
   let lastToolResult: ToolResultView | null = null;
   let loader: Loader | null = null;
   let processing = false;
+  const queuedQueries: string[] = [];
+  const renderQueueSlot = (): void => {
+    queueSlot.clear();
+    for (const q of queuedQueries) {
+      const oneLine = q.replace(/\s+/g, " ");
+      const preview = oneLine.length > 80 ? oneLine.slice(0, 77) + "…" : oneLine;
+      queueSlot.addChild(new InfoLine(`↳ queued: ${preview}`));
+    }
+  };
   let hideThinking = true;
   const renderState = (): { state: Record<string, unknown>; invalidate: () => void } => ({
@@ -552,6 +570,11 @@ export function mountAshi(
     chat.addChild(new Spacer(1));
     refreshFooterStats();
     refreshBranch();
+    const next = queuedQueries.shift();
+    if (next !== undefined) {
+      renderQueueSlot();
+      bus.emit("agent:submit", { query: next });
+    }
     tui.requestRender();
   });
@@ -612,6 +635,9 @@ export function mountAshi(
   // ── Pickers ────────────────────────────────────────────────────
   let pickerOpen = false;
+  let activeSessionPicker: SelectList | null = null;
+  let activeSessionRepopulate: ((keepIndex?: number) => boolean) | null = null;
+  let activeSessionClose: (() => void) | null = null;
   const openTreePicker = async (): Promise<void> => {
     if (pickerOpen) return;
@@ -657,38 +683,60 @@ export function mountAshi(
   const openSessionPicker = async (): Promise<void> => {
     if (pickerOpen) return;
-    const currentId = getStore().current().id;
-    const list = getStore().listSessions().filter((s) => s.id !== currentId);
-    if (list.length === 0) {
-      bus.emit("ui:info", { message: "no past sessions in this cwd" });
-      return;
-    }
-    const items: SelectItem[] = list.map((s) => ({
-      value: s.id,
-      label: formatSessionRow(s, false),
-    }));
-    const picker = new SelectList(items, 15, selectListTheme());
+    const hint = new InfoLine("↑↓ move · enter: resume · d: delete · esc: cancel");
     const close = (): void => {
+      if (activeSessionPicker) footerSlot.removeChild(activeSessionPicker);
+      footerSlot.removeChild(hint);
+      activeSessionPicker = null;
+      activeSessionRepopulate = null;
+      activeSessionClose = null;
       pickerOpen = false;
-      footerSlot.removeChild(picker);
       tui.setFocus(editor);
       tui.requestRender();
     };
-    picker.onSelect = async (item) => {
-      const id = item.value;
-      close();
-      resumeSession(ctx, getStore, capture, id);
-      bus.emit("ui:info", { message: `resumed session ${id}` });
-      await rebuildChat();
-      refreshFooterStats();
+    const populate = (keepIndex?: number): boolean => {
+      if (activeSessionPicker) footerSlot.removeChild(activeSessionPicker);
+      const currentId = getStore().current().id;
+      const list = getStore().listSessions().filter((s) => s.id !== currentId);
+      if (list.length === 0) {
+        activeSessionPicker = null;
+        return false;
+      }
+      const items: SelectItem[] = list.map((s) => ({
+        value: s.id,
+        label: formatSessionRow(s, false),
+      }));
+      const picker = new SelectList(items, 15, selectListTheme());
+      if (keepIndex !== undefined) {
+        picker.setSelectedIndex(Math.min(keepIndex, items.length - 1));
+      }
+      picker.onSelect = async (item) => {
+        const id = item.value;
+        close();
+        resumeSession(ctx, getStore, capture, id);
+        bus.emit("ui:info", { message: `resumed session ${id}` });
+        await rebuildChat();
+        refreshFooterStats();
+      };
+      picker.onCancel = close;
+      activeSessionPicker = picker;
+      footerSlot.addChild(picker);
+      tui.setFocus(picker);
+      return true;
     };
-    picker.onCancel = close;
+    footerSlot.addChild(hint);
+    if (!populate()) {
+      footerSlot.removeChild(hint);
+      bus.emit("ui:info", { message: "no past sessions in this cwd" });
+      return;
+    }
     pickerOpen = true;
-    footerSlot.addChild(picker);
-    tui.setFocus(picker);
+    activeSessionRepopulate = populate;
+    activeSessionClose = close;
     tui.requestRender();
   };
@@ -711,6 +759,31 @@ export function mountAshi(
       bus.emit("agent:cancel-request", {});
       return { consume: true };
     }
+    if (activeSessionPicker && matchesKey(data, "d")) {
+      const selected = activeSessionPicker.getSelectedItem();
+      if (selected) {
+        const currentId = getStore().current().id;
+        const idx = getStore().listSessions()
+          .filter((s) => s.id !== currentId)
+          .findIndex((s) => s.id === selected.value);
+        try {
+          getStore().deleteSession(selected.value);
+        } catch (e) {
+          bus.emit("ui:error", { message: `delete failed: ${(e as Error).message}` });
+          return { consume: true };
+        }
+        if (!activeSessionRepopulate?.(idx)) activeSessionClose?.();
+        tui.requestRender();
+      }
+      return { consume: true };
+    }
+    if (matchesKey(data, "up") && queuedQueries.length > 0 && editor.getText().length === 0) {
+      const last = queuedQueries.pop()!;
+      renderQueueSlot();
+      editor.setText(last);
+      tui.requestRender();
+      return { consume: true };
+    }
     if (matchesKey(data, "ctrl+c")) {
       editor.setText("");
       return { consume: true };

package/examples/extensions/ashi/src/multi-session-store.ts CHANGED Viewed

@@ -81,6 +81,14 @@ export class MultiSessionStore {
     return this.currentStore;
   }
+  deleteSession(id: string): void {
+    if (id === this.currentStore.id) throw new Error("cannot delete the active session");
+    const filePath = this.sessionFile(id);
+    for (const p of [filePath, filePath + ".leaf", filePath + ".meta"]) {
+      try { fs.unlinkSync(p); } catch { /* missing siblings are fine */ }
+    }
+  }
   listSessions(): SessionInfo[] {
     let names: string[];
     try { names = fs.readdirSync(this.dir); } catch { return []; }

package/examples/extensions/ollama.ts CHANGED Viewed

@@ -1,44 +1,46 @@
 /**
- * Ollama provider extension — local daemon and Ollama Cloud.
+ * Ollama provider extension — local daemon or Ollama Cloud.
  *
- *   OLLAMA_API_KEY  → Ollama Cloud (https://ollama.com)
- *   OLLAMA_HOST     → local host override (default http://localhost:11434)
+ * Cloud auth (any of):
+ *   agent-sh auth login ollama-cloud   # preferred
+ *   OLLAMA_API_KEY=...                 # env fallback
+ *
+ * Local host:
+ *   OLLAMA_HOST (default http://localhost:11434)
  *
  * Catalog comes from /api/tags; per-model context length is fetched
  * from /api/show (model_info["${arch}.context_length"]). Chat goes
  * through the OpenAI-compatible /v1/chat/completions shim.
  *
- * Setup (cloud):
- *   export OLLAMA_API_KEY="your-key"
- *
- * Setup (local):
- *   ollama serve   # default http://localhost:11434
- *
  * Usage:
  *   agent-sh -e ./examples/extensions/ollama.ts
  *
  *   # Or add to settings.json:
  *   { "extensions": ["./examples/extensions/ollama.ts"] }
  */
-import type { ExtensionContext } from "agent-sh/types";
+import { resolveApiKey } from "agent-sh/auth";
+import type { AgentContext } from "agent-sh/types";
 const ECHO_REASONING_PATTERNS: RegExp[] = [/deepseek/i];
-export default function activate(ctx: ExtensionContext): void {
-  const apiKey = process.env.OLLAMA_API_KEY;
-  const host = apiKey
+export default function activate(ctx: AgentContext): void {
+  const cloudKey = resolveApiKey("ollama-cloud").key ?? process.env.OLLAMA_API_KEY;
+  const host = cloudKey
     ? "https://ollama.com"
     : (process.env.OLLAMA_HOST ?? "http://localhost:11434").replace(/\/$/, "");
-  const id = apiKey ? "ollama-cloud" : "ollama";
+  const id = cloudKey ? "ollama-cloud" : "ollama";
   // OpenAI SDK rejects an empty apiKey; the local daemon ignores the value.
-  const sdkKey = apiKey || "no-key";
+  const sdkKey = cloudKey || "no-key";
   const baseURL = `${host}/v1`;
   const headers: Record<string, string> = {};
-  if (apiKey) headers.Authorization = `Bearer ${apiKey}`;
+  if (cloudKey) headers.Authorization = `Bearer ${cloudKey}`;
   ctx.agent.providers.configure(id, {
-    reasoningParams: (level) => ({ reasoning_effort: level === "off" ? "none" : level }),
+    reasoningParams: (level) => {
+      if (level === "off") return { reasoning_effort: "none" };
+      return { reasoning_effort: level === "xhigh" ? "high" : level };
+    },
   });
   ctx.bus.emit("provider:register", { id, apiKey: sdkKey, baseURL, models: [] });

package/examples/extensions/zai-coding-plan.ts CHANGED Viewed

@@ -19,7 +19,8 @@ const DEFAULT_MODELS = [
 function buildReasoningParams(level: string, _model?: string): Record<string, unknown> {
   if (level === "off") return { thinking: { type: "disabled" } };
-  return { thinking: { type: "enabled" }, reasoning_effort: level };
+  const effort = level === "xhigh" ? "high" : level;
+  return { thinking: { type: "enabled" }, reasoning_effort: effort };
 }
 export default function activate(ctx: AgentContext): void {

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "agent-sh",
-  "version": "0.13.3",
+  "version": "0.13.5",
   "description": "A shell-first terminal where AI is one keystroke away",
   "type": "module",
   "main": "dist/core/index.js",

package/examples/extensions/ollama-cloud.ts DELETED Viewed

@@ -1,78 +0,0 @@
-/**
- * Ollama Cloud — hosted Ollama models (https://ollama.com).
- *
- * Auth:  agent-sh auth login ollama-cloud
- * Usage: agent-sh -e ./examples/extensions/ollama-cloud.ts
- */
-import { resolveApiKey } from "agent-sh/auth";
-import type { AgentContext } from "agent-sh/types";
-const HOST = "https://ollama.com";
-const BASE_URL = `${HOST}/v1`;
-const ID = "ollama-cloud";
-function buildReasoningParams(level: string, _model?: string): Record<string, unknown> {
-  return { reasoning_effort: level === "off" ? "none" : level };
-}
-async function fetchModels(apiKey: string) {
-  const headers: Record<string, string> = { Authorization: `Bearer ${apiKey}` };
-  const tagsRes = await fetch(`${HOST}/api/tags`, { headers });
-  if (!tagsRes.ok) return [];
-  const tagsData = await tagsRes.json() as { models?: { name: string }[] };
-  const names = (tagsData.models ?? []).map((m) => m.name);
-  if (!names.length) return [];
-  const ctxs = await Promise.all(
-    names.map((name) =>
-      fetch(`${HOST}/api/show`, {
-        method: "POST",
-        headers: { ...headers, "Content-Type": "application/json" },
-        body: JSON.stringify({ name }),
-      })
-        .then((r) => r.ok ? r.json() as Promise<{ model_info?: Record<string, unknown> }> : null)
-        .then((d) => {
-          if (!d?.model_info) return undefined;
-          const info = d.model_info;
-          const arch = info["general.architecture"] as string | undefined;
-          if (arch) {
-            const ctx = info[`${arch}.context_length`];
-            if (typeof ctx === "number") return ctx;
-          }
-          for (const [k, v] of Object.entries(info)) {
-            if (k.endsWith(".context_length") && typeof v === "number") return v;
-          }
-          return undefined;
-        })
-        .catch(() => undefined),
-    ),
-  );
-  return names.map((name, i) => ({
-    id: name,
-    contextWindow: ctxs[i],
-    echoReasoning: /deepseek/i.test(name),
-  }));
-}
-export default function activate(ctx: AgentContext): void {
-  const { key } = resolveApiKey(ID);
-  const apiKey = key ?? process.env.OLLAMA_API_KEY;
-  if (!apiKey) return;
-  ctx.agent.providers.configure(ID, { reasoningParams: buildReasoningParams });
-  // Register placeholder while catalog loads
-  ctx.bus.emit("provider:register", { id: ID, apiKey, baseURL: BASE_URL, models: [] });
-  fetchModels(apiKey).then((models) => {
-    if (!models.length) return;
-    ctx.bus.emit("provider:register", {
-      id: ID,
-      apiKey,
-      baseURL: BASE_URL,
-      defaultModel: models[0]!.id,
-      models,
-    });
-  }).catch(() => { /* keep placeholder */ });
-}