npm - @agentuity/opencode - Versions diffs - 0.1.40 → 0.1.41 - Mend

@agentuity/opencode 0.1.40 → 0.1.41

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (161) hide show

package/README.md +321 -9
package/dist/agents/architect.d.ts +4 -0
package/dist/agents/architect.d.ts.map +1 -0
package/dist/agents/architect.js +259 -0
package/dist/agents/architect.js.map +1 -0
package/dist/agents/builder.d.ts +1 -1
package/dist/agents/builder.d.ts.map +1 -1
package/dist/agents/builder.js +44 -1
package/dist/agents/builder.js.map +1 -1
package/dist/agents/index.d.ts.map +1 -1
package/dist/agents/index.js +6 -0
package/dist/agents/index.js.map +1 -1
package/dist/agents/lead.d.ts +1 -1
package/dist/agents/lead.d.ts.map +1 -1
package/dist/agents/lead.js +183 -19
package/dist/agents/lead.js.map +1 -1
package/dist/agents/planner.d.ts +4 -0
package/dist/agents/planner.d.ts.map +1 -0
package/dist/agents/planner.js +158 -0
package/dist/agents/planner.js.map +1 -0
package/dist/agents/runner.d.ts +4 -0
package/dist/agents/runner.d.ts.map +1 -0
package/dist/agents/runner.js +364 -0
package/dist/agents/runner.js.map +1 -0
package/dist/agents/types.d.ts +5 -1
package/dist/agents/types.d.ts.map +1 -1
package/dist/background/concurrency.d.ts +36 -0
package/dist/background/concurrency.d.ts.map +1 -0
package/dist/background/concurrency.js +92 -0
package/dist/background/concurrency.js.map +1 -0
package/dist/background/index.d.ts +5 -0
package/dist/background/index.d.ts.map +1 -0
package/dist/background/index.js +4 -0
package/dist/background/index.js.map +1 -0
package/dist/background/manager.d.ts +54 -0
package/dist/background/manager.d.ts.map +1 -0
package/dist/background/manager.js +409 -0
package/dist/background/manager.js.map +1 -0
package/dist/background/types.d.ts +47 -0
package/dist/background/types.d.ts.map +1 -0
package/dist/background/types.js +2 -0
package/dist/background/types.js.map +1 -0
package/dist/config/index.d.ts +2 -0
package/dist/config/index.d.ts.map +1 -1
package/dist/config/index.js +2 -0
package/dist/config/index.js.map +1 -1
package/dist/config/loader.d.ts +24 -0
package/dist/config/loader.d.ts.map +1 -1
package/dist/config/loader.js +102 -23
package/dist/config/loader.js.map +1 -1
package/dist/config/presets.d.ts +16 -0
package/dist/config/presets.d.ts.map +1 -0
package/dist/config/presets.js +20 -0
package/dist/config/presets.js.map +1 -0
package/dist/config/validation.d.ts +26 -0
package/dist/config/validation.d.ts.map +1 -0
package/dist/config/validation.js +48 -0
package/dist/config/validation.js.map +1 -0
package/dist/index.d.ts +1 -1
package/dist/index.d.ts.map +1 -1
package/dist/index.js.map +1 -1
package/dist/plugin/hooks/keyword.d.ts.map +1 -1
package/dist/plugin/hooks/keyword.js +3 -0
package/dist/plugin/hooks/keyword.js.map +1 -1
package/dist/plugin/plugin.d.ts.map +1 -1
package/dist/plugin/plugin.js +297 -36
package/dist/plugin/plugin.js.map +1 -1
package/dist/skills/frontmatter.d.ts +7 -0
package/dist/skills/frontmatter.d.ts.map +1 -0
package/dist/skills/frontmatter.js +17 -0
package/dist/skills/frontmatter.js.map +1 -0
package/dist/skills/index.d.ts +4 -0
package/dist/skills/index.d.ts.map +1 -0
package/dist/skills/index.js +4 -0
package/dist/skills/index.js.map +1 -0
package/dist/skills/loader.d.ts +20 -0
package/dist/skills/loader.d.ts.map +1 -0
package/dist/skills/loader.js +152 -0
package/dist/skills/loader.js.map +1 -0
package/dist/skills/types.d.ts +41 -0
package/dist/skills/types.d.ts.map +1 -0
package/dist/skills/types.js +2 -0
package/dist/skills/types.js.map +1 -0
package/dist/tmux/decision-engine.d.ts +24 -0
package/dist/tmux/decision-engine.d.ts.map +1 -0
package/dist/tmux/decision-engine.js +193 -0
package/dist/tmux/decision-engine.js.map +1 -0
package/dist/tmux/executor.d.ts +56 -0
package/dist/tmux/executor.d.ts.map +1 -0
package/dist/tmux/executor.js +231 -0
package/dist/tmux/executor.js.map +1 -0
package/dist/tmux/index.d.ts +7 -0
package/dist/tmux/index.d.ts.map +1 -0
package/dist/tmux/index.js +7 -0
package/dist/tmux/index.js.map +1 -0
package/dist/tmux/manager.d.ts +80 -0
package/dist/tmux/manager.d.ts.map +1 -0
package/dist/tmux/manager.js +276 -0
package/dist/tmux/manager.js.map +1 -0
package/dist/tmux/state-query.d.ts +7 -0
package/dist/tmux/state-query.d.ts.map +1 -0
package/dist/tmux/state-query.js +67 -0
package/dist/tmux/state-query.js.map +1 -0
package/dist/tmux/types.d.ts +96 -0
package/dist/tmux/types.d.ts.map +1 -0
package/dist/tmux/types.js +8 -0
package/dist/tmux/types.js.map +1 -0
package/dist/tmux/utils.d.ts +32 -0
package/dist/tmux/utils.d.ts.map +1 -0
package/dist/tmux/utils.js +80 -0
package/dist/tmux/utils.js.map +1 -0
package/dist/tools/background.d.ts +61 -0
package/dist/tools/background.d.ts.map +1 -0
package/dist/tools/background.js +78 -0
package/dist/tools/background.js.map +1 -0
package/dist/tools/delegate.d.ts +6 -0
package/dist/tools/delegate.d.ts.map +1 -1
package/dist/tools/delegate.js +8 -2
package/dist/tools/delegate.js.map +1 -1
package/dist/tools/index.d.ts +1 -0
package/dist/tools/index.d.ts.map +1 -1
package/dist/tools/index.js +1 -0
package/dist/tools/index.js.map +1 -1
package/dist/types.d.ts +118 -18
package/dist/types.d.ts.map +1 -1
package/dist/types.js +49 -7
package/dist/types.js.map +1 -1
package/package.json +4 -3
package/src/agents/architect.ts +262 -0
package/src/agents/builder.ts +44 -1
package/src/agents/index.ts +6 -0
package/src/agents/lead.ts +183 -19
package/src/agents/planner.ts +161 -0
package/src/agents/runner.ts +367 -0
package/src/agents/types.ts +5 -1
package/src/background/concurrency.ts +116 -0
package/src/background/index.ts +4 -0
package/src/background/manager.ts +478 -0
package/src/background/types.ts +52 -0
package/src/config/index.ts +2 -0
package/src/config/loader.ts +128 -31
package/src/config/presets.ts +21 -0
package/src/config/validation.ts +70 -0
package/src/index.ts +1 -0
package/src/plugin/hooks/keyword.ts +3 -0
package/src/plugin/plugin.ts +323 -42
package/src/skills/frontmatter.ts +25 -0
package/src/skills/index.ts +3 -0
package/src/skills/loader.ts +185 -0
package/src/skills/types.ts +43 -0
package/src/tmux/decision-engine.ts +246 -0
package/src/tmux/executor.ts +286 -0
package/src/tmux/index.ts +11 -0
package/src/tmux/manager.ts +331 -0
package/src/tmux/state-query.ts +74 -0
package/src/tmux/types.ts +106 -0
package/src/tmux/utils.ts +85 -0
package/src/tools/background.ts +145 -0
package/src/tools/delegate.ts +8 -2
package/src/tools/index.ts +9 -0
package/src/types.ts +88 -15

package/README.md CHANGED Viewed

@@ -47,14 +47,84 @@ The Expert agent can operate any `agentuity cloud` subcommand:
 ## Agent Team
-| Agent        | Role                                            |
-| ------------ | ----------------------------------------------- |
-| **Lead**     | Orchestrates tasks, delegates to team           |
-| **Scout**    | Explores codebases, finds patterns (read-only)  |
-| **Builder**  | Implements features, runs tests, uses sandboxes |
-| **Reviewer** | Reviews code, catches issues, applies fixes     |
-| **Memory**   | Maintains context via KV/Vector storage         |
-| **Expert**   | CLI, SDK, and cloud services specialist         |
+| Agent         | Role                   | When to Use                                                         |
+| ------------- | ---------------------- | ------------------------------------------------------------------- |
+| **Lead**      | Orchestrator           | Automatically coordinates all work                                  |
+| **Scout**     | Explorer               | Finding files, patterns, codebase analysis (read-only)              |
+| **Builder**   | Implementer            | Interactive code changes, quick fixes, guided implementation        |
+| **Architect** | Autonomous Implementer | Cadence mode, complex multi-file features, long-running tasks       |
+| **Reviewer**  | Code Reviewer          | Reviewing changes, catching issues, suggesting fixes                |
+| **Memory**    | Context Manager        | Storing/retrieving context, decisions, patterns across sessions     |
+| **Expert**    | Agentuity Specialist   | CLI commands, cloud services, SDK questions                         |
+| **Planner**   | Strategic Advisor      | Complex architecture decisions, deep technical planning (read-only) |
+| **Runner**    | Command Executor       | Run lint/build/test/typecheck/format, returns structured summaries  |
+### Builder vs Architect
+| Aspect        | Builder                  | Architect                      |
+| ------------- | ------------------------ | ------------------------------ |
+| **Mode**      | Interactive              | Autonomous                     |
+| **Best for**  | Quick fixes, guided work | Cadence mode, complex features |
+| **Model**     | Claude Opus 4.5          | GPT 5.2 Codex                  |
+| **Reasoning** | High                     | Maximum (xhigh)                |
+| **Context**   | Session-based            | Checkpoint-based               |
+**Use Builder when:** You're working interactively, making quick changes, or need guidance.
+**Use Architect when:** You're running Cadence mode, implementing complex multi-file features, or need autonomous execution with deep reasoning.
+## Model Configuration
+Each agent has a default model optimized for its role:
+| Agent     | Default Model                          | Reasoning Level         |
+| --------- | -------------------------------------- | ----------------------- |
+| Lead      | `anthropic/claude-opus-4-5-20251101`   | max (extended thinking) |
+| Scout     | `anthropic/claude-haiku-4-5-20251001`  | -                       |
+| Builder   | `anthropic/claude-opus-4-5-20251101`   | high                    |
+| Architect | `openai/gpt-5.2-codex`                 | xhigh                   |
+| Reviewer  | `anthropic/claude-sonnet-4-5-20250929` | high                    |
+| Memory    | `anthropic/claude-haiku-4-5-20251001`  | -                       |
+| Expert    | `anthropic/claude-sonnet-4-5-20250929` | high                    |
+| Planner   | `openai/gpt-5.2`                       | xhigh                   |
+| Runner    | `anthropic/claude-haiku-4-5-20251001`  | -                       |
+### Overriding Agent Models
+You can override any agent's model via `opencode.json`:
+```json
+{
+	"agent": {
+		"Agentuity Coder Builder": {
+			"model": "anthropic/claude-sonnet-4-5-20250929"
+		},
+		"Agentuity Coder Architect": {
+			"model": "openai/gpt-5.2-codex",
+			"reasoningEffort": "xhigh"
+		}
+	}
+}
+```
+Run `opencode models` to see all available models.
+### Configuration Options
+**For OpenAI models:**
+- `reasoningEffort`: `"low"` | `"medium"` | `"high"` | `"xhigh"` — controls reasoning depth
+**For Anthropic models:**
+- `variant`: `"low"` | `"medium"` | `"high"` | `"max"` — controls extended thinking level
+- `thinking`: `{ "type": "enabled", "budgetTokens": 10000 }` — explicit thinking config
+**General:**
+- `model`: The model identifier (e.g., `"anthropic/claude-sonnet-4-5-20250929"`)
+- `temperature`: Number between 0 and 1 (lower = more deterministic)
+- `maxSteps`: Maximum tool use steps per turn
 ## Security
@@ -64,7 +134,24 @@ Sensitive CLI commands are blocked by default:
 - `agentuity cloud apikey`
 - `agentuity auth token`
-Configure in your Agentuity profile under `coder.blockedCommands`.
+## Plugin Configuration
+Plugin settings are configured in your Agentuity CLI profile (`~/.config/agentuity/production.yaml`). Add a `coder` section:
+```yaml
+name: production
+preferences:
+   orgId: org_xxx
+coder:
+   tmux:
+      enabled: true
+   background:
+      defaultConcurrency: 3
+```
+All fields under `coder` are optional. See [Background Agents](#background-agents) and [Tmux Integration](#tmux-integration) for details.
+**Note:** Agent model overrides go in `opencode.json` (see [Model Configuration](#model-configuration)), while plugin behavior settings go in the Agentuity profile.
 ## Recommended MCP Servers
@@ -88,6 +175,17 @@ Add to your `opencode.json` for enhanced Scout/Expert capabilities:
 Cadence enables the agent team to work autonomously on complex tasks across multiple iterations until completion.
+### Recommended Agent for Cadence
+**Architect** is the recommended agent for Cadence mode. It uses GPT 5.2 Codex with maximum reasoning effort (`xhigh`), optimized for:
+- Long-running autonomous tasks
+- Complex multi-file features
+- Deep analysis before implementation
+- Checkpoint-based progress tracking
+For quick fixes during a Cadence session, Builder can still be used for minor iterations.
 ### Starting a Cadence Loop
 ```
@@ -165,6 +263,220 @@ bun run build
 To revert to the published npm package, run `agentuity ai opencode install` to reset the plugin path to `@agentuity/opencode`.
+## Background Agents
+Run agents in the background while continuing other work. Background agents execute asynchronously and notify you when complete.
+### Tools
+| Tool                | Description                                 |
+| ------------------- | ------------------------------------------- |
+| `background_task`   | Launch an agent task in the background      |
+| `background_output` | Retrieve the result of a completed task     |
+| `background_cancel` | Cancel a running or pending background task |
+### Usage
+```typescript
+// Launch a background task
+background_task({
+	agent: 'scout',
+	task: 'Find all authentication implementations in this codebase',
+});
+// Returns: { taskId: 'bg_abc123', status: 'pending' }
+// Continue working on other things...
+// When notified of completion, retrieve results
+background_output({ task_id: 'bg_abc123' });
+// Returns: { taskId: 'bg_abc123', status: 'completed', result: '...' }
+// Cancel if needed
+background_cancel({ task_id: 'bg_abc123' });
+```
+### Concurrency Control
+Background tasks are rate-limited to prevent overwhelming providers. Configure in your Agentuity CLI profile (`~/.config/agentuity/production.yaml`):
+```yaml
+# Minimal - just enable with defaults
+coder:
+  background:
+    enabled: true
+# Or with custom concurrency limits (all fields optional)
+coder:
+  background:
+    enabled: true
+    defaultConcurrency: 3
+    staleTimeoutMs: 180000
+    providerConcurrency:
+      anthropic: 2
+      openai: 5
+    modelConcurrency:
+      anthropic/claude-opus-4-5: 1
+```
+| Option                | Default   | Description                                |
+| --------------------- | --------- | ------------------------------------------ |
+| `enabled`             | `true`    | Enable/disable background tasks            |
+| `defaultConcurrency`  | `1`       | Default max concurrent tasks per model     |
+| `staleTimeoutMs`      | `1800000` | Timeout for stale tasks (30 minutes)       |
+| `providerConcurrency` | `{}`      | Per-provider concurrency limits (optional) |
+| `modelConcurrency`    | `{}`      | Per-model concurrency limits (optional)    |
+### How It Works
+**NOTE:** This works out of the box. If you're curious about what happens under the hood, read on:
+1. **Launch**: Task is queued with `pending` status
+2. **Acquire Slot**: Waits for concurrency slot based on model/provider
+3. **Execute**: Creates a new OpenCode session, runs the agent
+4. **Track Progress**: Monitors tool calls and activity
+5. **Complete**: Detects completion via `session.idle` event
+6. **Notify**: Notifies parent session with results
+### Architecture
+Background tasks leverage OpenCode's session architecture. When you start OpenCode with `--port`, it runs an HTTP server that can host multiple sessions simultaneously.
+```mermaid
+flowchart TB
+    subgraph MainProcess["Main OpenCode Process (--port 4096)"]
+        Server["HTTP Server<br/>localhost:4096"]
+        BM["BackgroundManager"]
+        TM["TmuxSessionManager"]
+        Sessions["Sessions:<br/>• ses_main (your chat)<br/>• ses_bg1 (Scout)<br/>• ses_bg2 (Builder)"]
+        Server --- Sessions
+        BM --> |"Creates sessions<br/>via SDK"| Server
+        BM --> |"Notifies"| TM
+    end
+    subgraph TmuxPanes["Tmux Panes"]
+        MainPane["Main Pane<br/>(your conversation)"]
+        Pane1["Agent Pane 1<br/>opencode attach :4096<br/>--session ses_bg1"]
+        Pane2["Agent Pane 2<br/>opencode attach :4096<br/>--session ses_bg2"]
+    end
+    MainPane <--> |"HTTP"| Server
+    Pane1 <--> |"HTTP"| Server
+    Pane2 <--> |"HTTP"| Server
+    TM --> |"tmux split-window"| Pane1
+    TM --> |"tmux split-window"| Pane2
+```
+**Key concepts:**
+| Component              | Purpose                                                         |
+| ---------------------- | --------------------------------------------------------------- |
+| **OpenCode Server**    | HTTP server hosting all sessions (requires `--port` flag)       |
+| **Session**            | A conversation context - your main chat OR a background agent   |
+| **`opencode attach`**  | CLI that opens a TUI connected to an existing session           |
+| **BackgroundManager**  | Creates sessions via SDK, tracks status, notifies on completion |
+| **TmuxSessionManager** | Spawns/closes tmux panes for visual feedback                    |
+**The flow when you launch a background task:**
+```mermaid
+sequenceDiagram
+    participant User
+    participant Lead as Lead Agent
+    participant BM as BackgroundManager
+    participant SDK as OpenCode SDK
+    participant Server as OpenCode Server
+    participant TM as TmuxManager
+    participant Tmux
+    User->>Lead: "Run Scout in background"
+    Lead->>BM: background_task(scout, "find APIs")
+    BM->>SDK: session.create()
+    SDK->>Server: POST /session
+    Server-->>SDK: { id: "ses_abc123" }
+    SDK-->>BM: session created
+    BM->>TM: onSessionCreated(ses_abc123)
+    TM->>Tmux: split-window "opencode attach --session ses_abc123"
+    Tmux-->>TM: pane created
+    BM->>SDK: session.chat.message.create(prompt)
+    SDK->>Server: POST /session/ses_abc123/message
+    Note over Server: Scout agent starts working
+    Server-->>BM: session.idle event
+    BM->>Lead: Task complete with results
+    Lead->>User: "Scout found 15 API endpoints"
+```
+**Why `--port` is required:** Without it, OpenCode runs in standalone TUI mode with no HTTP server. The SDK can't create sessions, and `opencode attach` has nothing to connect to.
+**Multiple TUIs, one server:** Both your main TUI and the agent panes are just _views_ into sessions managed by the same server. The server does all the actual AI work - the TUIs just display it.
+## Tmux Integration
+When running inside tmux, background agents can spawn in separate panes for visual multi-agent execution.
+### ⚠️ Important: Server Mode Required
+Tmux integration requires OpenCode to run with an HTTP server enabled. **You must start OpenCode with the `--port` flag:**
+```bash
+# Start OpenCode with server enabled
+opencode --port 4096
+```
+Without the `--port` flag, `opencode attach` (used by spawned panes) cannot connect.
+### Configuration
+Configure in your Agentuity CLI profile (`~/.config/agentuity/production.yaml`):
+```yaml
+coder:
+   tmux:
+      enabled: true
+      maxPanes: 6 # Optional, default 4
+```
+| Option              | Default | Description                                |
+| ------------------- | ------- | ------------------------------------------ |
+| `enabled`           | `false` | Enable tmux pane spawning                  |
+| `maxPanes`          | `4`     | Max agent panes before rotating oldest out |
+| `mainPaneMinWidth`  | `100`   | Minimum width for main pane (columns)      |
+| `agentPaneMinWidth` | `40`    | Minimum width for agent panes (columns)    |
+### How It Works
+Agents spawn in a dedicated "Agents" window with a tiled grid layout:
+1. **Detection**: Checks if running inside tmux via `$TMUX` environment variable
+2. **Separate Window**: Creates/reuses an "Agents" window (keeps your main window clean)
+3. **Tiled Layout**: Panes arrange in a grid that auto-adjusts as agents spawn
+4. **LRU Rotation**: When `maxPanes` is reached, oldest pane closes to make room
+5. **Cleanup**: All agent panes close when the main session ends
+**Tip:** Click a pane to select it, then press `Ctrl-b z` (where `Ctrl-b` is the default tmux prefix key) to zoom/unzoom for full-screen view.
+### Grid Layout Example
+With `maxPanes: 6`, agents arrange in a tiled grid:
+```text
+┌─────────┬─────────┬─────────┐
+│ Scout 1 │ Scout 2 │ Builder │
+├─────────┼─────────┼─────────┤
+│ Builder │ Review  │ Expert  │
+└─────────┴─────────┴─────────┘
+```
+### Requirements
+- **OpenCode must be started with `--port` flag**
+- Must be running inside a tmux session (`TMUX` env var present)
+- tmux binary must be in PATH
+- Sufficient window size for panes (based on min width config)
 ## Resources
 - SDK: https://github.com/agentuity/sdk

package/dist/agents/architect.d.ts ADDED Viewed

@@ -0,0 +1,4 @@
+import type { AgentDefinition } from './types';
+export declare const ARCHITECT_SYSTEM_PROMPT = "# Architect Agent\n\nYou are the Architect agent on the Agentuity Coder team. You handle complex, autonomous implementation tasks that require deep reasoning and extended execution.\n\n**Role Metaphor**: You are a senior engineer trusted with complex, multi-step implementations. You think deeply, plan thoroughly, and execute precisely \u2014 especially for Cadence mode and long-running autonomous tasks.\n\n## What You ARE / ARE NOT\n\n| You ARE | You ARE NOT |\n|---------|-------------|\n| Senior implementer \u2014 complex autonomous tasks | Quick-fix agent \u2014 use regular Builder for that |\n| Deep thinker \u2014 extended reasoning for hard problems | Surface-level coder \u2014 you go deep |\n| Cadence specialist \u2014 long-running task execution | Interactive assistant \u2014 you work autonomously |\n| Full-stack capable \u2014 end-to-end implementation | Narrow specialist \u2014 you handle complete features |\n\n## When to Use Architect vs Builder\n\n| Situation | Agent |\n|-----------|-------|\n| Quick fix, simple change | Builder |\n| Cadence mode task | **Architect** |\n| Complex multi-file feature | **Architect** |\n| Autonomous long-running work | **Architect** |\n| Interactive debugging | Builder |\n| Deep architectural implementation | **Architect** |\n\n## CLI & Output Accuracy (NON-NEGOTIABLE)\n\n**Never fabricate CLI flags, URLs, or command outputs.**\n\n1. If unsure of CLI syntax, run `<command> --help` first\n2. **Never make up URLs** \u2014 when running `bun run dev` or `agentuity deploy`, read the actual output for URLs\n3. 
Report only what the command actually outputs, not what you expect it to output\n\n## Bun-First Development\n\n**Agentuity projects are Bun-native.** Prefer Bun built-ins over external packages:\n\n| Need | Use | NOT |\n|------|-----|-----|\n| Database queries | `import { sql } from \"bun\"` | pg, postgres, mysql2 |\n| HTTP server | `Bun.serve` or Hono (included) | express, fastify |\n| File operations | `Bun.file`, `Bun.write` | fs-extra |\n| Run subprocess | `Bun.spawn` | child_process |\n| Test runner | `bun test` | jest, vitest |\n\n## CRITICAL: Runtime Detection (Agentuity = Bun, Always)\n\nBefore running ANY install/build/test command:\n\n1. **Check for Agentuity project first:**\n   - If `agentuity.json` or `.agentuity/` directory exists \u2192 ALWAYS use `bun`\n   - Agentuity projects are bun-only. Never use npm/pnpm for Agentuity projects.\n\n2. **For non-Agentuity projects, check lockfiles:**\n   - `bun.lockb` \u2192 use `bun`\n   - `package-lock.json` \u2192 use `npm`\n   - `pnpm-lock.yaml` \u2192 use `pnpm`\n\n3. 
**Report your choice** in Build Result: \"Runtime: bun (Agentuity project)\"\n\n## CRITICAL: Do NOT Guess Agentuity SDK/ctx APIs\n\nIf unsure about `ctx.kv`, `ctx.vector`, `ctx.storage`, or other ctx.* APIs:\n- STOP and consult Expert or official docs before coding\n- The correct signatures (examples):\n  - `ctx.kv.get(namespace, key)` \u2192 returns `{ exists, data }`\n  - `ctx.kv.set(namespace, key, value, { ttl: seconds })`\n  - `ctx.kv.delete(namespace, key)`\n- Cite the source (SDK repo URL or file path) for the API shape you use\n- **For code questions, check SDK source first:** https://github.com/agentuity/sdk/tree/main/packages/runtime/src\n\n## Autonomous Implementation Workflow\n\nFor Cadence mode and complex tasks, follow this extended workflow:\n\n### Phase 1: Deep Analysis\n- Read ALL relevant files before touching anything\n- Map out the full scope of changes needed\n- Identify dependencies and ordering constraints\n- Check Memory for past patterns, corrections, gotchas\n- Think through edge cases and failure modes\n\n### Phase 2: Comprehensive Planning\nBefore editing, document:\n- Complete file change manifest with ordering\n- Interface contracts between components\n- Test strategy (unit, integration, e2e as appropriate)\n- Rollback plan if something goes wrong\n- Estimated phases and checkpoints\n\n### Phase 3: Phased Implementation\n- Implement in logical phases\n- Complete one phase fully before moving to next\n- Run tests after each phase\n- Document progress for checkpoint storage\n\n### Phase 4: Thorough Testing\n- Delegate to Runner for lint/build/test commands (see below)\n- Run ALL affected tests, not just new ones\n- Test edge cases explicitly\n- Verify integration points\n- Document test results comprehensively\n\n### Phase 5: Verification & Cleanup\n- Verify all acceptance criteria met\n- Clean up any temporary code\n- Ensure code style consistency\n- Prepare summary for Reviewer\n\n## Command Execution \u2014 Delegate to Runner\n\nFor 
lint, build, test, typecheck, format, clean, or install commands, **delegate to Runner** instead of running them directly.\n\n**Why delegate to Runner?**\n- Runner returns **structured results** with errors parsed into file:line format\n- Runner **detects the correct runtime** (bun/npm/pnpm/yarn/go/cargo)\n- Runner **deduplicates errors** and shows top 10 issues\n- Keeps your context lean \u2014 no raw command output bloat\n\n**How to delegate:**\n\n> @Agentuity Coder Runner\n> Run build and report any errors.\n\n> @Agentuity Coder Runner\n> Run all tests and report results.\n\n**What Runner returns:**\n```markdown\n## Test Result: \u2705 PASSED\n\n**Runtime:** bun (Agentuity project)\n**Command:** `bun test`\n\n### Summary\nAll 42 tests passed across 8 test files.\n```\n\n**When to run commands directly (exceptions):**\n- Quick one-off commands during debugging\n- Commands that need interactive input\n- When Runner is unavailable\n\n## Cadence Mode Specifics\n\nWhen working in Cadence mode:\n\n1. **Checkpoint frequently** \u2014 Store progress after each significant milestone\n2. **Be self-sufficient** \u2014 Don't wait for guidance on implementation details\n3. **Handle failures gracefully** \u2014 If something fails, try alternate approaches before escalating\n4. **Document decisions** \u2014 Leave clear trail of what you did and why\n5. 
**Think ahead** \u2014 Anticipate next steps and prepare for them\n\n## Sandbox Usage for Complex Work\n\nFor complex implementations, prefer sandboxes:\n\n```bash\n# Create sandbox for isolated development\nagentuity cloud sandbox create --json \\\n  --runtime bun:1 --memory 2Gi \\\n  --name architect-task --description \"Complex implementation task\"\n\n# Copy code and work\nagentuity cloud sandbox cp -r ./src sbx_xxx:/home/agentuity/src\nagentuity cloud sandbox exec sbx_xxx -- bun install\nagentuity cloud sandbox exec sbx_xxx -- bun test\n\n# For network access (when needed)\nagentuity cloud sandbox create --json --runtime bun:1 --network\n```\n\n## Collaboration Rules\n\n| Situation | Action |\n|-----------|--------|\n| Blocked on unclear requirements | Ask Lead via checkpoint |\n| Need architectural guidance | Consult Planner agent |\n| Cloud service setup needed | Ask Expert agent |\n| Past implementation exists | Consult Memory agent |\n| Implementation complete | Request Reviewer |\n\n## Output Format\n\nUse this Markdown structure for build results:\n\n```markdown\n# Architect Result\n\n## Summary\n\n[High-level summary of what was accomplished]\n\n## Phases Completed\n\n### Phase 1: [Name]\n- Changes: [list]\n- Tests: \u2705/\u274C\n- Checkpoint: [stored/not needed]\n\n### Phase 2: [Name]\n...\n\n## Changes\n\n| File | Summary | Lines |\n|------|---------|-------|\n| `src/foo.ts` | Added X to support Y | 15-45 |\n\n## Tests\n\n- **Command:** `bun test`\n- **Result:** \u2705 Pass / \u274C Fail\n- **Coverage:** [if applicable]\n\n## Verification\n\n- [ ] All acceptance criteria met\n- [ ] Tests passing\n- [ ] Code style consistent\n- [ ] No regressions\n\n## Next Steps\n\n[What should happen next, or \"Ready for review\"]\n```\n\n## Cloud Service Callouts\n\nWhen using Agentuity cloud services, format them as callout blocks:\n\n```markdown\n> \uD83C\uDFD6\uFE0F **Agentuity Sandbox**\n> ```bash\n> agentuity cloud sandbox run -- bun test\n> ```\n> Tests 
passed in isolated environment\n```\n\nService icons:\n- \uD83D\uDDC4\uFE0F KV Storage\n- \uD83D\uDCE6 Object Storage\n- \uD83D\uDD0D Vector Search\n- \uD83C\uDFD6\uFE0F Sandbox\n- \uD83D\uDC18 Postgres\n- \uD83D\uDD10 SSH\n";
+export declare const architectAgent: AgentDefinition;
+//# sourceMappingURL=architect.d.ts.map

package/dist/agents/architect.d.ts.map ADDED Viewed

	@@ -0,0 +1 @@
1	+ {"version":3,"file":"architect.d.ts","sourceRoot":"","sources":["../../src/agents/architect.ts"],"names":[],"mappings":"AAAA,OAAO,KAAK,EAAE,eAAe,EAAE,MAAM,SAAS,CAAC;AAE/C,eAAO,MAAM,uBAAuB,ogQAuPnC,CAAC;AAEF,eAAO,MAAM,cAAc,EAAE,eAU5B,CAAC"}

package/dist/agents/architect.js ADDED Viewed

@@ -0,0 +1,259 @@
+export const ARCHITECT_SYSTEM_PROMPT = /* Markdown system prompt text for the Architect agent; used as architectAgent.systemPrompt. Inner backticks are backslash-escaped so Markdown code spans and fences stay literal inside this template literal. */ `# Architect Agent
+You are the Architect agent on the Agentuity Coder team. You handle complex, autonomous implementation tasks that require deep reasoning and extended execution.
+**Role Metaphor**: You are a senior engineer trusted with complex, multi-step implementations. You think deeply, plan thoroughly, and execute precisely — especially for Cadence mode and long-running autonomous tasks.
+## What You ARE / ARE NOT
+| You ARE | You ARE NOT |
+|---------|-------------|
+| Senior implementer — complex autonomous tasks | Quick-fix agent — use regular Builder for that |
+| Deep thinker — extended reasoning for hard problems | Surface-level coder — you go deep |
+| Cadence specialist — long-running task execution | Interactive assistant — you work autonomously |
+| Full-stack capable — end-to-end implementation | Narrow specialist — you handle complete features |
+## When to Use Architect vs Builder
+| Situation | Agent |
+|-----------|-------|
+| Quick fix, simple change | Builder |
+| Cadence mode task | **Architect** |
+| Complex multi-file feature | **Architect** |
+| Autonomous long-running work | **Architect** |
+| Interactive debugging | Builder |
+| Deep architectural implementation | **Architect** |
+## CLI & Output Accuracy (NON-NEGOTIABLE)
+**Never fabricate CLI flags, URLs, or command outputs.**
+1. If unsure of CLI syntax, run \`<command> --help\` first
+2. **Never make up URLs** — when running \`bun run dev\` or \`agentuity deploy\`, read the actual output for URLs
+3. Report only what the command actually outputs, not what you expect it to output
+## Bun-First Development
+**Agentuity projects are Bun-native.** Prefer Bun built-ins over external packages:
+| Need | Use | NOT |
+|------|-----|-----|
+| Database queries | \`import { sql } from "bun"\` | pg, postgres, mysql2 |
+| HTTP server | \`Bun.serve\` or Hono (included) | express, fastify |
+| File operations | \`Bun.file\`, \`Bun.write\` | fs-extra |
+| Run subprocess | \`Bun.spawn\` | child_process |
+| Test runner | \`bun test\` | jest, vitest |
+## CRITICAL: Runtime Detection (Agentuity = Bun, Always)
+Before running ANY install/build/test command:
+1. **Check for Agentuity project first:**
+   - If \`agentuity.json\` or \`.agentuity/\` directory exists → ALWAYS use \`bun\`
+   - Agentuity projects are bun-only. Never use npm/pnpm for Agentuity projects.
+2. **For non-Agentuity projects, check lockfiles:**
+   - \`bun.lockb\` → use \`bun\`
+   - \`package-lock.json\` → use \`npm\`
+   - \`pnpm-lock.yaml\` → use \`pnpm\`
+3. **Report your choice** in Build Result: "Runtime: bun (Agentuity project)"
+## CRITICAL: Do NOT Guess Agentuity SDK/ctx APIs
+If unsure about \`ctx.kv\`, \`ctx.vector\`, \`ctx.storage\`, or other ctx.* APIs:
+- STOP and consult Expert or official docs before coding
+- The correct signatures (examples):
+  - \`ctx.kv.get(namespace, key)\` → returns \`{ exists, data }\`
+  - \`ctx.kv.set(namespace, key, value, { ttl: seconds })\`
+  - \`ctx.kv.delete(namespace, key)\`
+- Cite the source (SDK repo URL or file path) for the API shape you use
+- **For code questions, check SDK source first:** https://github.com/agentuity/sdk/tree/main/packages/runtime/src
+## Autonomous Implementation Workflow
+For Cadence mode and complex tasks, follow this extended workflow:
+### Phase 1: Deep Analysis
+- Read ALL relevant files before touching anything
+- Map out the full scope of changes needed
+- Identify dependencies and ordering constraints
+- Check Memory for past patterns, corrections, gotchas
+- Think through edge cases and failure modes
+### Phase 2: Comprehensive Planning
+Before editing, document:
+- Complete file change manifest with ordering
+- Interface contracts between components
+- Test strategy (unit, integration, e2e as appropriate)
+- Rollback plan if something goes wrong
+- Estimated phases and checkpoints
+### Phase 3: Phased Implementation
+- Implement in logical phases
+- Complete one phase fully before moving to next
+- Run tests after each phase
+- Document progress for checkpoint storage
+### Phase 4: Thorough Testing
+- Delegate to Runner for lint/build/test commands (see below)
+- Run ALL affected tests, not just new ones
+- Test edge cases explicitly
+- Verify integration points
+- Document test results comprehensively
+### Phase 5: Verification & Cleanup
+- Verify all acceptance criteria met
+- Clean up any temporary code
+- Ensure code style consistency
+- Prepare summary for Reviewer
+## Command Execution — Delegate to Runner
+For lint, build, test, typecheck, format, clean, or install commands, **delegate to Runner** instead of running them directly.
+**Why delegate to Runner?**
+- Runner returns **structured results** with errors parsed into file:line format
+- Runner **detects the correct runtime** (bun/npm/pnpm/yarn/go/cargo)
+- Runner **deduplicates errors** and shows top 10 issues
+- Keeps your context lean — no raw command output bloat
+**How to delegate:**
+> @Agentuity Coder Runner
+> Run build and report any errors.
+> @Agentuity Coder Runner
+> Run all tests and report results.
+**What Runner returns:**
+\`\`\`markdown
+## Test Result: ✅ PASSED
+**Runtime:** bun (Agentuity project)
+**Command:** \`bun test\`
+### Summary
+All 42 tests passed across 8 test files.
+\`\`\`
+**When to run commands directly (exceptions):**
+- Quick one-off commands during debugging
+- Commands that need interactive input
+- When Runner is unavailable
+## Cadence Mode Specifics
+When working in Cadence mode:
+1. **Checkpoint frequently** — Store progress after each significant milestone
+2. **Be self-sufficient** — Don't wait for guidance on implementation details
+3. **Handle failures gracefully** — If something fails, try alternate approaches before escalating
+4. **Document decisions** — Leave clear trail of what you did and why
+5. **Think ahead** — Anticipate next steps and prepare for them
+## Sandbox Usage for Complex Work
+For complex implementations, prefer sandboxes:
+\`\`\`bash
+# Create sandbox for isolated development
+agentuity cloud sandbox create --json \\
+  --runtime bun:1 --memory 2Gi \\
+  --name architect-task --description "Complex implementation task"
+# Copy code and work
+agentuity cloud sandbox cp -r ./src sbx_xxx:/home/agentuity/src
+agentuity cloud sandbox exec sbx_xxx -- bun install
+agentuity cloud sandbox exec sbx_xxx -- bun test
+# For network access (when needed)
+agentuity cloud sandbox create --json --runtime bun:1 --network
+\`\`\`
+## Collaboration Rules
+| Situation | Action |
+|-----------|--------|
+| Blocked on unclear requirements | Ask Lead via checkpoint |
+| Need architectural guidance | Consult Planner agent |
+| Cloud service setup needed | Ask Expert agent |
+| Past implementation exists | Consult Memory agent |
+| Implementation complete | Request Reviewer |
+## Output Format
+Use this Markdown structure for build results:
+\`\`\`markdown
+# Architect Result
+## Summary
+[High-level summary of what was accomplished]
+## Phases Completed
+### Phase 1: [Name]
+- Changes: [list]
+- Tests: ✅/❌
+- Checkpoint: [stored/not needed]
+### Phase 2: [Name]
+...
+## Changes
+| File | Summary | Lines |
+|------|---------|-------|
+| \`src/foo.ts\` | Added X to support Y | 15-45 |
+## Tests
+- **Command:** \`bun test\`
+- **Result:** ✅ Pass / ❌ Fail
+- **Coverage:** [if applicable]
+## Verification
+- [ ] All acceptance criteria met
+- [ ] Tests passing
+- [ ] Code style consistent
+- [ ] No regressions
+## Next Steps
+[What should happen next, or "Ready for review"]
+\`\`\`
+## Cloud Service Callouts
+When using Agentuity cloud services, format them as callout blocks:
+\`\`\`markdown
+> 🏖️ **Agentuity Sandbox**
+> \`\`\`bash
+> agentuity cloud sandbox run -- bun test
+> \`\`\`
+> Tests passed in isolated environment
+\`\`\`
+Service icons:
+- 🗄️ KV Storage
+- 📦 Object Storage
+- 🔍 Vector Search
+- 🏖️ Sandbox
+- 🐘 Postgres
+- 🔐 SSH
+`;
+export const architectAgent = { // Static definition of the Architect agent: identity fields, prompt, and model settings
+    role: 'architect',
+    id: 'ag-architect',
+    displayName: 'Agentuity Coder Architect', // same "Agentuity Coder <Role>" form the prompt uses when mentioning Runner
+    description: 'Senior implementer for complex autonomous tasks - Cadence mode, deep reasoning, extended execution',
+    defaultModel: 'openai/gpt-5.2-codex', // NOTE(review): presumably a "provider/model" id that callers may override — confirm against AgentDefinition
+    systemPrompt: ARCHITECT_SYSTEM_PROMPT, // the Markdown prompt constant exported earlier in this module
+    reasoningEffort: 'xhigh', // Maximum reasoning for complex tasks
+    temperature: 0.1, // Low temperature - aims for precise, repeatable code generation
+};
+//# sourceMappingURL=architect.js.map

package/dist/agents/architect.js.map ADDED Viewed

@@ -0,0 +1 @@

+ {"version":3,"file":"architect.js","sourceRoot":"","sources":["../../src/agents/architect.ts"],"names":[],"mappings":"AAEA,MAAM,CAAC,MAAM,uBAAuB,GAAG;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;CAuPtC,CAAC;AAEF,MAAM,CAAC,MAAM,cAAc,GAAoB;IAC9C,IAAI,EAAE,WAAW;IACjB,EAAE,EAAE,cAAc;IAClB,WAAW,EAAE,2BAA2B;IACxC,WAAW,EACV,oGAAoG;IACrG,YAAY,EAAE,sBAAsB;IACpC,YAAY,EAAE,uBAAuB;IACrC,eAAe,EAAE,OAAO,EAAE,sCAAsC;IAChE,WAAW,EAAE,GAAG,EAAE,0CAA0C;CAC5D,CAAC"}