npm - agent-sh - Versions diffs - 0.9.0 → 0.10.0 - Mend

agent-sh 0.9.0 → 0.10.0

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (78)

package/README.md +14 -21
package/dist/agent/agent-loop.d.ts +43 -3
package/dist/agent/agent-loop.js +811 -128
package/dist/agent/conversation-state.d.ts +72 -21
package/dist/agent/conversation-state.js +357 -150
package/dist/agent/history-file.d.ts +13 -4
package/dist/agent/history-file.js +110 -36
package/dist/agent/nuclear-form.d.ts +28 -3
package/dist/agent/nuclear-form.js +84 -3
package/dist/agent/skills.d.ts +2 -4
package/dist/agent/skills.js +10 -4
package/dist/agent/subagent.d.ts +23 -0
package/dist/agent/subagent.js +53 -11
package/dist/agent/system-prompt.d.ts +34 -1
package/dist/agent/system-prompt.js +96 -47
package/dist/agent/token-budget.d.ts +5 -4
package/dist/agent/token-budget.js +14 -19
package/dist/agent/tool-protocol.d.ts +23 -1
package/dist/agent/tool-protocol.js +169 -4
package/dist/agent/tools/bash.js +3 -3
package/dist/agent/tools/edit-file.js +9 -6
package/dist/agent/tools/glob.js +4 -2
package/dist/agent/tools/grep.js +27 -3
package/dist/agent/tools/ls.js +5 -6
package/dist/agent/types.d.ts +1 -1
package/dist/context-manager.d.ts +17 -0
package/dist/context-manager.js +37 -4
package/dist/core.js +27 -6
package/dist/event-bus.d.ts +59 -2
package/dist/executor.d.ts +4 -3
package/dist/executor.js +18 -15
package/dist/extension-loader.js +50 -13
package/dist/extensions/agent-backend.d.ts +8 -7
package/dist/extensions/agent-backend.js +69 -48
package/dist/extensions/index.js +0 -1
package/dist/extensions/slash-commands.js +14 -9
package/dist/extensions/tui-renderer.js +62 -78
package/dist/index.js +25 -6
package/dist/settings.d.ts +36 -5
package/dist/settings.js +53 -9
package/dist/shell/input-handler.d.ts +2 -1
package/dist/shell/input-handler.js +82 -73
package/dist/shell/shell.js +19 -2
package/dist/types.d.ts +12 -0
package/dist/utils/ansi.d.ts +5 -0
package/dist/utils/ansi.js +1 -1
package/dist/utils/compositor.d.ts +5 -0
package/dist/utils/compositor.js +31 -3
package/dist/utils/diff-renderer.d.ts +9 -0
package/dist/utils/diff-renderer.js +221 -143
package/dist/utils/diff.d.ts +21 -2
package/dist/utils/diff.js +165 -89
package/dist/utils/handler-registry.d.ts +5 -0
package/dist/utils/handler-registry.js +6 -0
package/dist/utils/line-editor.d.ts +11 -1
package/dist/utils/line-editor.js +44 -5
package/dist/utils/tool-display.d.ts +1 -1
package/dist/utils/tool-display.js +4 -4
package/examples/extensions/ash-acp-bridge/src/index.ts +4 -1
package/examples/extensions/ash-mcp-bridge/index.ts +13 -3
package/examples/extensions/claude-code-bridge/index.ts +198 -51
package/examples/extensions/claude-code-bridge/package.json +1 -0
package/examples/extensions/interactive-prompts.ts +39 -25
package/examples/extensions/overlay-agent.ts +3 -3
package/examples/extensions/peer-mesh.ts +115 -0
package/examples/extensions/pi-bridge/index.ts +2 -2
package/examples/extensions/questionnaire.ts +16 -5
package/examples/extensions/subagents.ts +19 -4
package/examples/extensions/terminal-buffer.ts +163 -0
package/examples/extensions/user-shell.ts +136 -0
package/examples/extensions/web-access.ts +8 -0
package/package.json +36 -2
package/dist/agent/tools/display.d.ts +0 -13
package/dist/agent/tools/display.js +0 -70
package/dist/agent/tools/user-shell.d.ts +0 -13
package/dist/agent/tools/user-shell.js +0 -87
package/dist/extensions/terminal-buffer.d.ts +0 -14
package/dist/extensions/terminal-buffer.js +0 -134

package/README.md CHANGED

@@ -5,16 +5,18 @@ An agent that lives in a shell — not a shell that lives in an agent.
 [![npm version](https://img.shields.io/npm/v/agent-sh.svg)](https://www.npmjs.com/package/agent-sh)
 [![license](https://img.shields.io/npm/l/agent-sh.svg)](https://github.com/guanyilun/agent-sh/blob/main/LICENSE)
+![demo](assets/demo.gif)
 Most AI terminal tools get this backwards: the LLM drives the experience and the shell is bolted on as an afterthought. No real PTY, no job control, no vim, fragile `cd` tracking. The agent is the main character and your terminal is a prop.
 agent-sh flips this. It's your shell first — full PTY, your rc config, your aliases, everything just works. But type `>` at the start of a line, and you're talking to an agent that has full context of what you've been doing.
 ```
-~ $ ls -la                          # real shell command
-~ $ cd ../tests && npm test          # real cd, env, aliases — all just work
-~ $ vim file.ts                      # opens vim in the same PTY
-~ $ > explain the last error          # agent investigates using its own tools
-~ $ > deploy to staging              # agent runs it in your live shell
+~ $ ls -la                       # real shell command
+~ $ cd ../tests && npm test      # real cd, env, aliases — all just work
+~ $ vim file.ts                  # opens vim in the same PTY
+~ $ > explain the last error     # agent investigates using its own tools
+~ $ > draft a commit message     # agent reads your diff and shell history
 ```
 ## Quick Start
@@ -24,6 +26,12 @@ npm install -g agent-sh
 agent-sh
 ```
+Tip: add an alias to your shell config for quick access:
+```bash
+alias ash="agent-sh"
+```
 Set `OPENAI_API_KEY` in your environment (or configure providers in `~/.agent-sh/settings.json`). Works with any OpenAI-compatible API — see the [Usage Guide](docs/usage.md) for provider examples (OpenAI, Ollama, OpenRouter, Together, Groq, LM Studio, vLLM).
 Requires Node.js 18+.
@@ -32,7 +40,7 @@ Requires Node.js 18+.
 **Real terminal, zero compromise.** Full PTY with your shell config, aliases, and environment. Shell starts instantly — the agent connects asynchronously in the background.
-**One entry point, three tool categories.** Type `>` and agent-sh figures out how to help. Scratchpad tools (`bash`, `read_file`, `grep`, `glob`) for investigation. `display` to show you output. `user_shell` for commands with lasting effects in your live shell. No modes to pick — the agent reasons about which tools to use based on your intent.
+**One entry point, smart tool selection.** Type `>` and agent-sh figures out how to help. Scratchpad tools (`bash`, `read_file`, `grep`, `glob`) for investigation. Extensions add capabilities like running commands in your live shell. No modes to pick — the agent reasons about which tools to use based on your intent.
 **Context that just works.** Every query includes your cwd, recent commands, and their output. Run a failing test, type `> fix this`, and agent-sh knows exactly what happened. Context management works like shell history — continuous, persistent across restarts, no sessions to manage. See [Context Management](docs/context-management.md).
@@ -42,21 +50,6 @@ Requires Node.js 18+.
 **Embeddable as a library.** The core is a headless kernel — `import { createCore } from "agent-sh"` to build WebSocket servers, REST APIs, Electron apps, or test harnesses. No terminal required.
-## Slash Commands
-| Command | Description |
-|---|---|
-| `/help` | Show available commands |
-| `/model [name]` | Cycle to the next model, or switch to a specific one |
-| `/backend [name]` | List backends, or switch to a named backend |
-| `/compact` | Compact conversation (free up context space) |
-| `/context` | Show context budget usage |
-| `/thinking [level]` | Set reasoning effort (off, low, medium, high) |
-## Configuration
-Configure via `~/.agent-sh/settings.json`. See the [Usage Guide](docs/usage.md#configuration) for the full settings reference.
 ## Documentation
 - [Usage Guide](docs/usage.md) — providers, models, configuration

package/dist/agent/agent-loop.d.ts CHANGED

@@ -27,6 +27,8 @@ export interface AgentLoopConfig {
     modes?: AgentMode[];
     initialModeIndex?: number;
     compositor?: Compositor;
+    /** Instance ID from core — ensures history entries match the ID in prompts. */
+    instanceId?: string;
 }
 export declare class AgentLoop implements AgentBackend {
     private abortController;
@@ -41,6 +43,18 @@ export declare class AgentLoop implements AgentBackend {
     private ctorListeners;
     private ctorPipeListeners;
     private lastProjectSkillNames;
+    private sessionStartTime;
+    private toolCallCounts;
+    private totalToolCalls;
+    private totalToolErrors;
+    private totalResolutions;
+    private compactionCount;
+    private cumulativeCompactedTokens;
+    private peakConversationTokens;
+    private queryCount;
+    private totalLoopIterations;
+    private lastErrorByTool;
+    private lastErrorByFile;
     private static readonly THINKING_LEVELS;
     private bus;
     private contextManager;
@@ -49,6 +63,8 @@ export declare class AgentLoop implements AgentBackend {
     private thinkingLevel;
     private compositor;
     private toolProtocol;
+    private instanceId;
+    private lastShellSeq;
     constructor(config: AgentLoopConfig);
     /** Subscribe to bus events — activates this backend. */
     wire(): void;
@@ -60,13 +76,30 @@ export declare class AgentLoop implements AgentBackend {
     unregisterTool(name: string): void;
     /** Get all registered tools. */
     getTools(): ToolDefinition[];
+    /** Instructions keyed by name, with extension attribution. */
     private instructions;
+    /** Skills keyed by name, with extension attribution. */
+    private skills;
+    /** Tool → extension name attribution. */
+    private toolExtensions;
     /** Register a named instruction block for the system prompt. */
-    registerInstruction(name: string, text: string): void;
+    registerInstruction(name: string, text: string, extensionName: string): void;
     /** Remove a named instruction block. */
     removeInstruction(name: string): void;
-    /** Get instruction blocks registered by extensions. */
-    getInstructionSections(): string[];
+    /** Register a named skill (on-demand reference material). */
+    registerSkill(name: string, description: string, filePath: string, extensionName: string): void;
+    /** Remove a registered skill. */
+    removeSkill(name: string): void;
+    /**
+     * Build the system prompt grouped by extension.
+     *
+     * Each extension gets a unified block:
+     *   ## extension-name
+     *   ### Tools
+     *   ### Skills
+     *   ### Instructions
+     */
+    buildExtensionSections(): string[];
     kill(): void;
     private cancel;
     /** Check if reasoning_effort should be sent for the current model/provider. */
@@ -74,6 +107,12 @@ export declare class AgentLoop implements AgentBackend {
     private cycleMode;
     private get currentMode();
     private get currentModel();
+    /**
+     * Run compaction via the `conversation:compact` handler. After any
+     * compaction, emit `conversation:after-compact` so listeners
+     * (metrics, UI, agent-awareness notes) can react.
+     */
+    private compactWithHooks;
     private isContextOverflow;
     /** Check if an error is retryable (transient). */
     private isRetryable;
@@ -94,6 +133,7 @@ export declare class AgentLoop implements AgentBackend {
      */
     private executeLoop;
     private readonly maxRetries;
+    private filePathFromArgs;
     /**
      * Stream with retry logic. Handles:
      *   - Context overflow → compact and retry