npm - agent-sh - Versions diffs - 0.7.0 → 0.9.0 - Mend

agent-sh 0.7.0 → 0.9.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (86)

package/README.md +28 -33
package/dist/agent/agent-loop.d.ts +31 -8
package/dist/agent/agent-loop.js +277 -66
package/dist/agent/conversation-state.d.ts +41 -9
package/dist/agent/conversation-state.js +340 -17
package/dist/agent/history-file.d.ts +36 -0
package/dist/agent/history-file.js +167 -0
package/dist/agent/nuclear-form.d.ts +41 -0
package/dist/agent/nuclear-form.js +176 -0
package/dist/agent/system-prompt.d.ts +4 -5
package/dist/agent/system-prompt.js +16 -11
package/dist/agent/token-budget.d.ts +13 -0
package/dist/agent/token-budget.js +50 -0
package/dist/agent/tool-protocol.d.ts +83 -0
package/dist/agent/tool-protocol.js +386 -0
package/dist/agent/tools/user-shell.js +4 -1
package/dist/agent/types.d.ts +21 -1
package/dist/context-manager.d.ts +0 -1
package/dist/context-manager.js +5 -110
package/dist/core.d.ts +7 -7
package/dist/core.js +76 -180
package/dist/event-bus.d.ts +40 -0
package/dist/event-bus.js +20 -1
package/dist/extension-loader.d.ts +5 -0
package/dist/extension-loader.js +104 -17
package/dist/extensions/agent-backend.d.ts +13 -0
package/dist/extensions/agent-backend.js +167 -0
package/dist/extensions/command-suggest.d.ts +3 -3
package/dist/extensions/command-suggest.js +4 -3
package/dist/extensions/index.d.ts +19 -0
package/dist/extensions/index.js +25 -0
package/dist/extensions/slash-commands.d.ts +1 -1
package/dist/extensions/slash-commands.js +44 -1
package/dist/extensions/terminal-buffer.d.ts +1 -1
package/dist/extensions/terminal-buffer.js +22 -8
package/dist/extensions/tui-renderer.js +177 -122
package/dist/index.js +14 -20
package/dist/settings.d.ts +25 -2
package/dist/settings.js +25 -4
package/dist/{input-handler.d.ts → shell/input-handler.d.ts} +1 -1
package/dist/{input-handler.js → shell/input-handler.js} +60 -43
package/dist/{output-parser.d.ts → shell/output-parser.d.ts} +1 -1
package/dist/{output-parser.js → shell/output-parser.js} +1 -1
package/dist/{shell.d.ts → shell/shell.d.ts} +8 -2
package/dist/{shell.js → shell/shell.js} +24 -6
package/dist/types.d.ts +49 -32
package/dist/utils/ansi.d.ts +10 -0
package/dist/utils/ansi.js +27 -0
package/dist/utils/compositor.d.ts +62 -0
package/dist/utils/compositor.js +88 -0
package/dist/utils/diff-renderer.js +92 -4
package/dist/utils/floating-panel.d.ts +34 -3
package/dist/utils/floating-panel.js +315 -82
package/dist/utils/handler-registry.d.ts +26 -10
package/dist/utils/handler-registry.js +52 -16
package/dist/utils/line-editor.d.ts +32 -3
package/dist/utils/line-editor.js +218 -36
package/dist/utils/markdown.d.ts +1 -0
package/dist/utils/markdown.js +4 -4
package/dist/utils/message-utils.d.ts +35 -0
package/dist/utils/message-utils.js +75 -0
package/dist/utils/terminal-buffer.d.ts +9 -1
package/dist/utils/terminal-buffer.js +31 -2
package/dist/utils/tool-display.d.ts +1 -0
package/dist/utils/tool-display.js +1 -1
package/dist/utils/tool-interactive.d.ts +12 -0
package/dist/utils/tool-interactive.js +53 -0
package/examples/extensions/ash-acp-bridge/README.md +39 -0
package/examples/extensions/ash-acp-bridge/package.json +23 -0
package/examples/extensions/ash-acp-bridge/src/index.ts +571 -0
package/examples/extensions/ash-acp-bridge/tsconfig.json +14 -0
package/examples/extensions/ash-mcp-bridge/README.md +72 -0
package/examples/extensions/ash-mcp-bridge/index.ts +154 -0
package/examples/extensions/ash-mcp-bridge/package.json +9 -0
package/examples/extensions/claude-code-bridge/index.ts +77 -1
package/examples/extensions/interactive-prompts.ts +82 -110
package/examples/extensions/overlay-agent.ts +84 -38
package/examples/extensions/peer-mesh.ts +450 -0
package/examples/extensions/pi-bridge/index.ts +87 -2
package/examples/extensions/questionnaire.ts +249 -0
package/examples/extensions/tmux-pane.ts +307 -0
package/examples/extensions/web-access.ts +327 -0
package/package.json +9 -1
package/dist/extensions/overlay-agent.d.ts +0 -11
package/dist/extensions/overlay-agent.js +0 -43
package/examples/extensions/terminal-buffer.ts +0 -184

package/README.md CHANGED

@@ -1,36 +1,22 @@
 # agent-sh
+An agent that lives in a shell — not a shell that lives in an agent.
 [![npm version](https://img.shields.io/npm/v/agent-sh.svg)](https://www.npmjs.com/package/agent-sh)
 [![license](https://img.shields.io/npm/l/agent-sh.svg)](https://github.com/guanyilun/agent-sh/blob/main/LICENSE)
-Not a shell that lives in an agent — an agent that lives in a shell.
-I live in a terminal. I don't want an agent that can run shell commands when it needs to — I want my shell, with an agent I can reach for when *I* need to. Most AI tools get this backwards: the LLM drives the experience and the shell is bolted on as an afterthought. No real PTY, no job control, no vim, fragile `cd` tracking. The agent is the main character and your terminal is a prop.
+Most AI terminal tools get this backwards: the LLM drives the experience and the shell is bolted on as an afterthought. No real PTY, no job control, no vim, fragile `cd` tracking. The agent is the main character and your terminal is a prop.
 agent-sh flips this. It's your shell first — full PTY, your rc config, your aliases, everything just works. But type `>` at the start of a line, and you're talking to an agent that has full context of what you've been doing.
 ```
-⚡ src $ ls -la                          # real shell command
-⚡ src $ cd ../tests && npm test          # real cd, env, aliases — all just work
-⚡ src $ vim file.ts                      # opens vim in the same PTY
-⚡ src $ > explain the last error          # agent investigates using its own tools
-⚡ src $ > deploy to staging              # agent runs it in your live shell
+~ $ ls -la                          # real shell command
+~ $ cd ../tests && npm test          # real cd, env, aliases — all just work
+~ $ vim file.ts                      # opens vim in the same PTY
+~ $ > explain the last error          # agent investigates using its own tools
+~ $ > deploy to staging              # agent runs it in your live shell
 ```
-## Key Features
-**Real terminal, zero compromise.** Full PTY with your shell config, aliases, and environment. Shell starts instantly — the agent connects asynchronously in the background.
-**Context-aware agent.** Every query includes your cwd, recent commands, and their output. Run a failing test, type `> fix this`, and the agent knows exactly what happened. It has built-in tools for file read/write/edit, bash, grep, glob — no external setup needed.
-**Agent decides how to help.** One entry point (`>`), three tool categories. The agent uses scratchpad tools to investigate, `display` to show you output, and `user_shell` for commands with lasting effects. No need to pick a mode — the agent reasons about which tools to use based on your intent.
-**Any LLM, any backend.** Works with any OpenAI-compatible API out of the box. Define multiple providers in settings and cycle between models at runtime with Shift+Tab. Or swap in a completely different agent — [Claude Code](examples/extensions/claude-code-bridge/) and [pi](examples/extensions/pi-bridge/) run as drop-in backend extensions.
-**Extensible by design.** The entire system is built on a typed event bus. Extensions can add custom input modes, content transforms (render LaTeX as images, Mermaid as diagrams), themes, slash commands, or replace the agent backend entirely. The built-in TUI renderer is itself just an extension — nothing is special.
-**Embeddable as a library.** The core is a headless kernel — `import { createCore } from "agent-sh"` to build WebSocket servers, REST APIs, Electron apps, or test harnesses. No terminal required.
 ## Quick Start
 ```bash
@@ -42,34 +28,43 @@ Set `OPENAI_API_KEY` in your environment (or configure providers in `~/.agent-sh
 Requires Node.js 18+.
-## Agent Mode
+## Key Features
-Type `>` at the start of a line to talk to the agent. The agent decides how to help:
+**Real terminal, zero compromise.** Full PTY with your shell config, aliases, and environment. Shell starts instantly — the agent connects asynchronously in the background.
-- **Scratchpad tools** (`bash`, `read_file`, `grep`, `glob`, etc.) — for investigation. Output goes to the agent, not your terminal.
-- **`display`** — shows output in your terminal (e.g. `cat`, `git log`). You see it; the agent doesn't process it.
-- **`user_shell`** — runs commands with lasting effects (`cd`, `npm install`, etc.) in your live shell.
+**One entry point, three tool categories.** Type `>` and agent-sh figures out how to help. Scratchpad tools (`bash`, `read_file`, `grep`, `glob`) for investigation. `display` to show you output. `user_shell` for commands with lasting effects in your live shell. No modes to pick — the agent reasons about which tools to use based on your intent.
-Everything else works as a normal shell — commands go straight to the PTY. Input modes are extensible — see [Extensions: Custom Input Modes](docs/extensions.md#custom-input-modes).
+**Context that just works.** Every query includes your cwd, recent commands, and their output. Run a failing test, type `> fix this`, and agent-sh knows exactly what happened. Context management works like shell history — continuous, persistent across restarts, no sessions to manage. See [Context Management](docs/context-management.md).
+**Any LLM, any backend.** agent-sh works with any OpenAI-compatible API out of the box. Define multiple providers in settings and cycle between models at runtime with Shift+Tab. Or swap in a completely different agent — [Claude Code](examples/extensions/claude-code-bridge/) and [pi](examples/extensions/pi-bridge/) run as drop-in backend extensions.
+**Extensible by design.** The entire system is built on a typed event bus. Extensions can add custom input modes, content transforms (render LaTeX as images, Mermaid as diagrams), themes, slash commands, or replace the agent backend entirely. The built-in TUI renderer is itself just an extension.
+**Embeddable as a library.** The core is a headless kernel — `import { createCore } from "agent-sh"` to build WebSocket servers, REST APIs, Electron apps, or test harnesses. No terminal required.
-### Slash Commands
+## Slash Commands
 | Command | Description |
 |---|---|
 | `/help` | Show available commands |
 | `/model [name]` | Cycle to the next model, or switch to a specific one |
 | `/backend [name]` | List backends, or switch to a named backend |
+| `/compact` | Compact conversation (free up context space) |
+| `/context` | Show context budget usage |
+| `/thinking [level]` | Set reasoning effort (off, low, medium, high) |
 ## Configuration
-Configure via `~/.agent-sh/settings.json`. See the [Usage Guide](docs/usage.md#configuration) for the full settings reference (providers, models, extensions, skills, and more).
+Configure via `~/.agent-sh/settings.json`. See the [Usage Guide](docs/usage.md#configuration) for the full settings reference.
 ## Documentation
-- [Usage Guide](docs/usage.md) — providers, models, configuration, provider profiles
-- [Internal Agent](docs/agent.md) — how the agent loop works: tools, context, streaming
-- [Architecture](docs/architecture.md) — design philosophy, component overview, project structure
+- [Usage Guide](docs/usage.md) — providers, models, configuration
+- [Internal Agent](docs/agent.md) — tools, context, streaming
+- [Context Management](docs/context-management.md) — three-tier history, token budget
+- [Architecture](docs/architecture.md) — design philosophy, component overview
 - [Extensions](docs/extensions.md) — event bus, content transforms, custom backends, theming
+- [TUI Composition](docs/tui-composition.md) — compositor, render surfaces, stream routing
 - [Library Usage](docs/library.md) — embedding agent-sh in your own apps
 - [Troubleshooting](docs/troubleshooting.md) — common errors and debug mode

package/dist/agent/agent-loop.d.ts CHANGED

@@ -16,32 +16,57 @@ import type { EventBus } from "../event-bus.js";
 import type { AgentMode } from "../types.js";
 import type { ContextManager } from "../context-manager.js";
 import type { LlmClient } from "../utils/llm-client.js";
-import type { HandlerRegistry } from "../utils/handler-registry.js";
+import type { HandlerFunctions } from "../utils/handler-registry.js";
 import type { AgentBackend, ToolDefinition } from "./types.js";
+import type { Compositor } from "../utils/compositor.js";
+export interface AgentLoopConfig {
+    bus: EventBus;
+    contextManager: ContextManager;
+    llmClient: LlmClient;
+    handlers: HandlerFunctions;
+    modes?: AgentMode[];
+    initialModeIndex?: number;
+    compositor?: Compositor;
+}
 export declare class AgentLoop implements AgentBackend {
-    private bus;
-    private contextManager;
-    private llmClient;
-    private handlers;
     private abortController;
     private toolRegistry;
+    private historyFile;
     private conversation;
     private fileReadCache;
+    private tokenBudget;
     private modes;
     private currentModeIndex;
     private boundListeners;
+    private ctorListeners;
+    private ctorPipeListeners;
     private lastProjectSkillNames;
     private static readonly THINKING_LEVELS;
+    private bus;
+    private contextManager;
+    private llmClient;
+    private handlers;
     private thinkingLevel;
-    constructor(bus: EventBus, contextManager: ContextManager, llmClient: LlmClient, handlers: HandlerRegistry, modeConfig?: AgentMode[], initialModeIndex?: number);
+    private compositor;
+    private toolProtocol;
+    constructor(config: AgentLoopConfig);
     /** Subscribe to bus events — activates this backend. */
     wire(): void;
     /** Unsubscribe from bus events — deactivates this backend. */
     unwire(): void;
     /** Register a tool (used by extensions via ctx.registerTool). */
     registerTool(tool: ToolDefinition): void;
+    /** Unregister a tool by name. */
+    unregisterTool(name: string): void;
     /** Get all registered tools. */
     getTools(): ToolDefinition[];
+    private instructions;
+    /** Register a named instruction block for the system prompt. */
+    registerInstruction(name: string, text: string): void;
+    /** Remove a named instruction block. */
+    removeInstruction(name: string): void;
+    /** Get instruction blocks registered by extensions. */
+    getInstructionSections(): string[];
     kill(): void;
     private cancel;
     /** Check if reasoning_effort should be sent for the current model/provider. */
@@ -63,8 +88,6 @@ export declare class AgentLoop implements AgentBackend {
      */
     private registerHandlers;
     private handleQuery;
-    /** Max tokens before auto-compaction (conservative default). */
-    private maxContextTokens;
     /**
      * Core agent loop: stream LLM response → execute tools → repeat.
      * Returns the final accumulated response text.