npm - sisyphi - Versions diffs - 0.1.21 → 0.1.23 - Mend

sisyphi 0.1.21 → 0.1.23

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (60)

package/dist/chunk-KQBSC5KY.js +31 -0
package/dist/chunk-KQBSC5KY.js.map +1 -0
package/dist/{chunk-LTAW6OWS.js → chunk-YGBGKMTF.js} +31 -6
package/dist/chunk-YGBGKMTF.js.map +1 -0
package/dist/chunk-ZE2SKB4B.js +35 -0
package/dist/chunk-ZE2SKB4B.js.map +1 -0
package/dist/cli.js +638 -51
package/dist/cli.js.map +1 -1
package/dist/daemon.js +915 -289
package/dist/daemon.js.map +1 -1
package/dist/paths-FYYSBD27.js +58 -0
package/dist/paths-FYYSBD27.js.map +1 -0
package/dist/templates/CLAUDE.md +21 -20
package/dist/templates/agent-plugin/agents/CLAUDE.md +2 -0
package/dist/templates/agent-plugin/agents/debug.md +1 -0
package/dist/templates/agent-plugin/agents/operator.md +1 -2
package/dist/templates/agent-plugin/agents/plan.md +86 -55
package/dist/templates/agent-plugin/agents/review-plan.md +1 -0
package/dist/templates/agent-plugin/agents/spec-draft.md +1 -0
package/dist/templates/agent-plugin/hooks/hooks.json +19 -1
package/dist/templates/agent-plugin/hooks/intercept-send-message.sh +1 -1
package/dist/templates/agent-plugin/hooks/require-submit.sh +24 -0
package/dist/templates/agent-suffix.md +18 -0
package/dist/templates/dashboard-claude.md +38 -0
package/dist/templates/orchestrator-base.md +270 -0
package/dist/templates/orchestrator-impl.md +116 -0
package/dist/templates/orchestrator-planning.md +131 -0
package/dist/templates/orchestrator-plugin/hooks/hooks.json +1 -15
package/dist/templates/orchestrator-plugin/skills/git-management/SKILL.md +1 -1
package/dist/templates/orchestrator-plugin/skills/orchestration/SKILL.md +4 -16
package/dist/templates/orchestrator-plugin/skills/orchestration/task-patterns.md +22 -23
package/dist/templates/orchestrator-plugin/skills/orchestration/workflow-examples.md +11 -11
package/dist/tui.js +3236 -0
package/dist/tui.js.map +1 -0
package/package.json +5 -1
package/templates/CLAUDE.md +21 -20
package/templates/agent-plugin/agents/CLAUDE.md +2 -0
package/templates/agent-plugin/agents/debug.md +1 -0
package/templates/agent-plugin/agents/operator.md +1 -2
package/templates/agent-plugin/agents/plan.md +86 -55
package/templates/agent-plugin/agents/review-plan.md +1 -0
package/templates/agent-plugin/agents/spec-draft.md +1 -0
package/templates/agent-plugin/hooks/hooks.json +19 -1
package/templates/agent-plugin/hooks/intercept-send-message.sh +1 -1
package/templates/agent-plugin/hooks/require-submit.sh +24 -0
package/templates/agent-suffix.md +18 -0
package/templates/dashboard-claude.md +38 -0
package/templates/orchestrator-base.md +270 -0
package/templates/orchestrator-impl.md +116 -0
package/templates/orchestrator-planning.md +131 -0
package/templates/orchestrator-plugin/hooks/hooks.json +1 -15
package/templates/orchestrator-plugin/skills/git-management/SKILL.md +1 -1
package/templates/orchestrator-plugin/skills/orchestration/SKILL.md +4 -16
package/templates/orchestrator-plugin/skills/orchestration/task-patterns.md +22 -23
package/templates/orchestrator-plugin/skills/orchestration/workflow-examples.md +11 -11
package/dist/chunk-LTAW6OWS.js.map +0 -1
package/dist/templates/orchestrator-plugin/scripts/block-task.sh +0 -11
package/dist/templates/orchestrator.md +0 -173
package/templates/orchestrator-plugin/scripts/block-task.sh +0 -11
package/templates/orchestrator.md +0 -173

package/dist/paths-FYYSBD27.js ADDED Viewed

@@ -0,0 +1,58 @@
+#!/usr/bin/env node
+import {
+  contextDir,
+  cycleLogPath,
+  daemonLogPath,
+  daemonPidPath,
+  daemonUpdatingPath,
+  globalConfigPath,
+  globalDir,
+  goalPath,
+  legacyLogsPath,
+  logsDir,
+  messagesDir,
+  projectConfigPath,
+  projectDir,
+  projectOrchestratorPromptPath,
+  promptsDir,
+  reportFilePath,
+  reportsDir,
+  roadmapPath,
+  sessionDir,
+  sessionsDir,
+  snapshotDir,
+  snapshotsDir,
+  socketPath,
+  statePath,
+  worktreeBaseDir,
+  worktreeConfigPath
+} from "./chunk-YGBGKMTF.js";
+export {
+  contextDir,
+  cycleLogPath,
+  daemonLogPath,
+  daemonPidPath,
+  daemonUpdatingPath,
+  globalConfigPath,
+  globalDir,
+  goalPath,
+  legacyLogsPath,
+  logsDir,
+  messagesDir,
+  projectConfigPath,
+  projectDir,
+  projectOrchestratorPromptPath,
+  promptsDir,
+  reportFilePath,
+  reportsDir,
+  roadmapPath,
+  sessionDir,
+  sessionsDir,
+  snapshotDir,
+  snapshotsDir,
+  socketPath,
+  statePath,
+  worktreeBaseDir,
+  worktreeConfigPath
+};
+//# sourceMappingURL=paths-FYYSBD27.js.map

package/dist/paths-FYYSBD27.js.map ADDED Viewed

@@ -0,0 +1 @@
+{"version":3,"sources":[],"sourcesContent":[],"mappings":"","names":[]}

package/dist/templates/CLAUDE.md CHANGED Viewed

@@ -4,9 +4,11 @@ System prompt templates for orchestrator and agent initialization.
 ## Core Templates
-- **orchestrator.md** — Orchestrator system prompt. Defines orchestrator role (coordinator, not implementer), cycle workflow, phase-based thinking (explore → spec → plan → implement → review → test), context persistence via plan.md/logs.md, work right-sizing (~30 tool calls per item), and validation patterns. Rendered with `<state>` block injected containing agent reports, cycle history, plan/logs references.
-- **agent-suffix.md** — Agent system prompt suffix. Contains `{{SESSION_ID}}` and `{{INSTRUCTION}}` placeholders. Rendered once per agent spawn.
-- **banner.txt** — ASCII banner (cosmetic, displayed on daemon startup or CLI output).
+- **orchestrator-base.md** — Core orchestrator system prompt. Defines orchestrator role (coordinator, not implementer), cycle workflow, context persistence via roadmap.md/logs.md, and validation patterns. Rendered as foundation for all orchestrator prompts.
+- **orchestrator-planning.md** — Planning-phase orchestrator guidance. Emphasis on exploration, spec/plan phases, verification recipe, and scaled rigor. Appended when `--mode planning` (default).
+- **orchestrator-impl.md** — Implementation-phase orchestrator guidance. Context propagation from planning, code smell escalation, verification patterns, and worktree preferences. Appended when `--mode implementation`.
+- **agent-suffix.md** — Agent system prompt suffix. Contains `{{SESSION_ID}}`, `{{INSTRUCTION}}`, and `{{WORKTREE_CONTEXT}}` placeholders. Rendered once per agent spawn.
+- **banner.txt** — ASCII banner (cosmetic).
 ## Configuration Files
@@ -21,30 +23,29 @@ System prompt templates for orchestrator and agent initialization.
 ## Rendering Rules
 **Orchestrator prompt**:
-1. Read `orchestrator.md` (or project override `.sisyphus/orchestrator.md`)
-2. Load settings from `orchestrator-settings.json` (or project override)
-3. Append `<state>` block with: agent reports, cycle count, history, plan.md and logs.md references
-4. Pass to Claude via `--append-system-prompt` flag
-5. User prompt: concise cycle instruction ("review reports, delegate next phase")
+1. Load orchestrator-base.md
+2. Append phase-specific guidance: orchestrator-planning.md (default) or orchestrator-impl.md (when `--mode implementation`)
+3. Inject session state with agent reports, cycle count, roadmap.md/logs.md references
+4. Load settings from `orchestrator-settings.json` (or project override)
+5. Pass via `--append-system-prompt` flag
 **Agent prompt**:
 1. Read `agent-suffix.md`
-2. Load settings from `agent-settings.json` (or project override)
-3. Replace `{{SESSION_ID}}` with session UUID
-4. Replace `{{INSTRUCTION}}` with task instruction (e.g., "implement login feature")
-5. Pass via `--append-system-prompt` flag
-6. User prompt: instruction again (for clarity)
+2. Replace `{{SESSION_ID}}` with session UUID
+3. Replace `{{INSTRUCTION}}` with task instruction
+4. Replace `{{WORKTREE_CONTEXT}}` with branch/worktree info (if `--worktree` used)
+5. Load settings from `agent-settings.json` (or project override)
+6. Pass via `--append-system-prompt` flag
 **Plugin prompts** (`agent-plugin/*.md`):
 - Used only when agent spawned with `--agent-type sisyphus:{type}`
 - Replaces default agent-suffix.md rendering
 - Same placeholder substitution rules apply
-## Important Boundaries
+## Key Patterns
-- Do **not** hardcode session IDs or agent names—use placeholders
-- Do **not** include raw JSON in prompts—use human-readable `<state>` formatting
-- Do **not** reference external files (only relative paths in `.sisyphus/`)
-- Do **keep prompts concise**—Claude reads full state separately
-- Settings files must be valid JSON; use project overrides to customize behavior per-workspace
-- Orchestrator template should emphasize phase-based methodology and context preservation, not encourage autonomous rushing
+- **Phase modes**: `--mode planning` (default) uses orchestrator-base.md + orchestrator-planning.md; `--mode implementation` uses orchestrator-base.md + orchestrator-impl.md
+- **Context files**: agents save findings to `.sisyphus/sessions/$SISYPHUS_SESSION_ID/context/` and pass references to downstream agents
+- **Worktree context**: `{{WORKTREE_CONTEXT}}` is auto-populated with isolated branch/worktree info when agent spawned with `--worktree`
+- **Placeholders**: always use `{{SESSION_ID}}`, `{{INSTRUCTION}}`, `{{WORKTREE_CONTEXT}}`—never hardcode values
+- Settings files are valid JSON; use project overrides to customize per-workspace

package/dist/templates/agent-plugin/agents/CLAUDE.md CHANGED Viewed

@@ -23,6 +23,7 @@ description: >
   Brief description of agent role and capabilities
 model: opus
 color: teal
+effort: high
 skills: [capture]
 permissionMode: bypassPermissions
 ```
@@ -32,6 +33,7 @@ Frontmatter properties:
 - `description` — One-line summary for plugin discovery
 - `model` — Claude model (`opus`, `sonnet`, etc.)
 - `color` — Tmux pane color
+- `effort` — Complexity estimate (`low`, `medium`, `high`, `max`)
 - `skills` — Claude Code skills array (e.g., `[capture]`)
 - `permissionMode` — Permission mode (`bypassPermissions`, `default`, etc.)

package/dist/templates/agent-plugin/agents/debug.md CHANGED Viewed

@@ -3,6 +3,7 @@ name: debug
 description: Use when something is broken and the root cause is unclear. Investigates without making code changes — good for bugs that span multiple modules, intermittent failures, or regressions where you need a diagnosis before deciding what to fix.
 model: opus
 color: red
+effort: high
 ---
 You are a systematic debugger. Follow this 3-phase methodology:

package/dist/templates/agent-plugin/agents/operator.md CHANGED Viewed

@@ -3,7 +3,6 @@ name: operator
 description: Use when you need ground truth from actually using the product — clicking through UI flows, reading logs, interacting with external services. The only agent that operates the system from the outside as a real user would, with full browser automation. Good for validating that implementation actually works end-to-end.
 model: sonnet
 color: teal
-skills: [capture]
 permissionMode: bypassPermissions
 ---
@@ -39,7 +38,7 @@ You're the human — act like a curious, slightly paranoid one who assumes somet
 When the scope is broad — validating an entire frontend, testing multiple flows, or covering a feature with many surfaces — **spawn subagents to parallelize**. You are not limited to doing everything yourself sequentially.
-Use the Task tool to spawn operator-type subagents for concurrent testing:
+Use the Task tool to spawn subagents for concurrent testing:
 - One subagent per page, flow, or feature area
 - Each subagent gets a focused instruction ("test every interactive element on the settings page", "validate the checkout flow end-to-end including error states")
 - Collect their reports, synthesize findings, and surface the full picture

package/dist/templates/agent-plugin/agents/plan.md CHANGED Viewed

@@ -1,101 +1,132 @@
 ---
 name: plan
-description: Use after a spec is finalized to turn it into a concrete implementation plan. Produces file-level detail with phased task breakdowns ready for parallel agent execution — resolves all design decisions so implementers can start coding without ambiguity.
+description: Use after a spec is finalized to turn it into a concrete implementation plan. Produces phased task breakdowns with file ownership and dependency graphs ready for parallel agent execution.
 model: opus
 color: yellow
+effort: max
 ---
-You are an implementation planner. Your job is to read a specification and produce a complete, actionable plan ready for team execution.
+You are an implementation planner. Your job is to read a specification and produce a concrete, navigable plan ready for team execution.
+## Core Principle: Plans Are Maps, Not Code
+A plan tells agents **what to build and where** — not how to write it. Agents read the codebase themselves. Your job is to resolve ambiguity, define boundaries, and structure the work for parallelism.
+**Never write code in the plan.** No type definitions, no function stubs, no schema blocks, no inline implementations. Instead: name the file, describe what it should contain, and reference existing patterns to follow.
+- Bad: 60-line TypeScript stub with full Zod schemas
+- Good: "`src/worker/index.ts` — Worker types and enums. Follow the three-part enum pattern in `src/jobs/index.ts`. Export WorkerState, WakeReason, Worker DTO, request/response schemas."
 ## Process
 1. **Read the spec** from the path provided in the prompt
-2. **Read pipeline state** (if exists) in the session context dir for cross-phase decisions
-3. **Investigate codebase** for:
-   - Existing patterns and conventions
-   - Integration points and dependencies
-   - Technical constraints
-   - Similar features to reference
+2. **Read session context** — check `context/` for existing exploration findings
+3. **Investigate codebase** — patterns, conventions, integration points, constraints
+4. **Resolve design decisions** — no deferred ambiguity; make the best judgment call
+5. **Produce the plan** in the appropriate structure below
+## Plan Structures
-4. **Determine complexity and structure:**
-   - **Simple (1-3 files)**: Single plan with all details
-   - **Medium (4-10 files)**: Master plan with phases, file ownership, task breakdown
-   - **Large (10+ files)**: Master plan + spawn Plan subagents per domain/phase for detailed sub-plans
+Choose based on scope. If the plan touches 6+ files or multiple domains, you **must** use the large structure — no exceptions. A 1500-line single file is not a plan, it's a wall.
-5. **Create the plan:**
+### Small (1-5 files, single domain)
+Single plan file with phases, file ownership, and verification.
-### Simple Plans
 ```markdown
 # {Topic} Implementation Plan
 ## Overview
-[What we're building and why]
+[What and why, 2-3 sentences]
+## Phases
-## Changes
-### File: path/to/file.ts
-[Exact changes needed]
+### Phase 1: {Name}
+**Files owned:**
+- `path/to/new-file.ts` (new) — [what it contains, pattern to follow]
+- `path/to/existing.ts` (modify) — [what changes]
-## Integration Points
-[How this connects to existing code]
+### Phase 2: {Name}
+**Depends on:** Phase 1
+**Files owned:** ...
-## Edge Cases
-[Error handling, null checks, boundary conditions]
+## Verification
+[How to confirm it works]
 ```
-### Medium Plans (Team-Ready)
+### Large (6+ files, multiple domains)
+Master plan + sub-plans. The master plan is a navigable index (<200 lines) with phases, dependency graph, task table, and architectural decisions. All per-stage detail goes in sub-plan files.
 ```markdown
 # {Topic} Implementation Plan
-## Overview
-[What we're building and architectural approach]
+**Spec:** `path/to/spec.md`
+## Sub-Plans
+- **[Core](./plan-{topic}-core.md)** — {scope summary}
+- **[UI](./plan-{topic}-ui.md)** — {scope summary}
 ## Phases
 ### Phase 1: {Name}
-**Owner**: TBD
-**Dependencies**: None
-**Files**: path/to/file.ts, path/to/other.ts
+**Scope:** {one sentence}
+**Depends on:** nothing
+**Files owned:**
+- `path/file.ts` — {what, which pattern to follow}
+- `path/file2.ts` (modify) — {what changes}
-[What this phase accomplishes]
+### Phase 2: {Name}
+**Scope:** ...
+**Depends on:** Phase 1
+**Files owned:** ...
-## Implementation Details
+## Task Table
-### Phase 1: {Name}
-#### File: path/to/file.ts
-[Exact changes, new functions, types, exports]
+| # | Task | Phase | Depends on | Files |
+|---|------|-------|------------|-------|
+| T1 | {task name} | 1 | — | file.ts |
+| T2 | {task name} | 1 | — | file2.ts |
+| T3 | {task name} | 2 | T1 | file3.ts, file4.ts |
-**Integration**: How this phase's outputs feed Phase 2
+### Parallelism
+- T1, T2 can run in parallel
+- T3 blocks on T1
-## Task Breakdown
-1. Phase 1 - {brief} - blocked by: none
-2. Phase 2 - {brief} - blocked by: task 1
+### File Overlap
+[Which files are touched by multiple tasks — orchestrator uses this for sequencing]
-## Integration Points
-[External dependencies, API contracts, shared state]
+## Architectural Decisions
-## Edge Cases
-[Error handling, validation, boundary conditions]
+| Decision | Rationale |
+|----------|-----------|
+| {choice made} | {why} |
+## Verification
+[Per-phase verification criteria]
 ```
-### Large Plans
+### Sub-Plans
+Sub-plans contain the domain-specific detail that would bloat the master plan. Each sub-plan covers one domain (e.g., backend, frontend, agent runtime) and includes:
+- Detailed file descriptions (what each file contains, exports, patterns to follow)
+- Integration points with other domains
+- Domain-specific constraints and gotchas
-For large plans, write the master plan first, then spawn Plan subagents for phases that need detailed breakdown. Each subagent gets the master plan path + its assigned phase.
+Sub-plans still **do not contain code**. They describe structure and behavior.
-6. **Save the plan** to `.sisyphus/sessions/$SISYPHUS_SESSION_ID/context/plan-{topic}.md`
+Save sub-plans alongside the master plan: `context/plan-{topic}-{domain}.md`
 ## Quality Standards
-**All decisions resolved** — no "Investigate whether...", "Consider using X or Y", "Depends on performance testing". Make the best judgment call.
+**Navigable.** The master plan must be under 200 lines. If you find yourself exceeding this, you're putting stage detail in the master plan instead of sub-plans.
+**No code.** Describe what to build, reference patterns to follow. Agents are capable — they read the codebase and write the code.
+**Structured for parallelism.** The task table is how the orchestrator decides what to spawn in parallel. Every task needs clear dependencies and file ownership.
-**Team-ready structure** for medium+ plans:
-- Clear phase boundaries
-- File ownership per task
-- Explicit dependencies
-- Integration contracts between phases
+**No deferred decisions.** No "if X, then Y" branches, no "investigate whether...", no "consider using X or Y". Resolve all ambiguity during planning. Make the best judgment call.
-**File-level specificity:**
-- Not "update the auth module"
-- Instead: "In src/auth/middleware.ts, add validateToken() function that..."
+**File ownership.** Each task owns specific files. Avoid multiple tasks editing the same file. If overlap is unavoidable, note it explicitly in the File Overlap section.
-**Reference existing patterns:**
-- "Follow the validation pattern in src/utils/validators.ts"
+**Reference, don't duplicate.** Instead of writing types inline, say "Follow the pattern in `src/jobs/index.ts`". Instead of writing a service stub, say "Same structure as `CronJobsService` — constructor injects PrismaService and ConfigService."

package/dist/templates/agent-plugin/agents/review-plan.md CHANGED Viewed

@@ -3,6 +3,7 @@ name: review-plan
 description: Use after a plan has been written to verify it fully covers the spec. Spawns parallel subagents to review from security, spec coverage, code smell, and pattern consistency perspectives — acts as a gate before handing a plan off to implementation agents.
 model: opus
 color: orange
+effort: high
 ---
 You are a plan review coordinator. Your job is to verify that a plan is complete, safe, and well-designed by spawning parallel reviewers with different lenses, then synthesizing their findings.

package/dist/templates/agent-plugin/agents/spec-draft.md CHANGED Viewed

@@ -3,6 +3,7 @@ name: spec-draft
 description: Explores codebase constraints and patterns, proposes a lightweight spec, then asks clarifying questions before writing anything. Spec is only saved after user sign-off.
 model: opus
 color: cyan
+effort: high
 ---
 You are defining a feature through investigation and proposal. Nothing gets written to disk until the user signs off.

package/dist/templates/agent-plugin/hooks/hooks.json CHANGED Viewed

@@ -1,3 +1,21 @@
 {
-  "hooks": {}
+  "hooks": {
+    "PreToolUse": [
+      {
+        "matcher": "SendMessage",
+        "hook": {
+          "type": "command",
+          "command": "bash hooks/intercept-send-message.sh"
+        }
+      }
+    ],
+    "Stop": [
+      {
+        "hook": {
+          "type": "command",
+          "command": "bash hooks/require-submit.sh"
+        }
+      }
+    ]
+  }
 }

package/dist/templates/agent-plugin/hooks/intercept-send-message.sh CHANGED Viewed

@@ -7,5 +7,5 @@ if [ -z "$SISYPHUS_SESSION_ID" ]; then
 fi
 cat <<'EOF'
-{"decision":"block","reason":"Do not use SendMessage. Use the sisyphus CLI instead:\n- Progress report: echo \"message\" | sisyphus report\n- Final submission: echo \"report\" | sisyphus submit"}
+{"decision":"block","reason":"Do not use SendMessage. Use the sisyphus CLI instead:\n- Progress report: echo \"message\" | sisyphus report\n- Urgent/blocking issue: sisyphus message \"description\"\n- Final submission: echo \"report\" | sisyphus submit"}
 EOF

package/dist/templates/agent-plugin/hooks/require-submit.sh ADDED Viewed

@@ -0,0 +1,24 @@
+#!/bin/bash
+# Stop hook: block agent from stopping if it hasn't submitted a final report.
+# Passthrough (exit 0) if not in a sisyphus session.
+if [ -z "$SISYPHUS_SESSION_ID" ] || [ -z "$SISYPHUS_AGENT_ID" ]; then
+  exit 0
+fi
+# Guard against infinite loops — if we already blocked once and Claude is
+# retrying, stop_hook_active will be true in the input JSON.
+STOP_ACTIVE=$(python3 -c "import json,sys; print(json.load(sys.stdin).get('stop_hook_active',False))" 2>/dev/null)
+if [ "$STOP_ACTIVE" = "True" ]; then
+  exit 0
+fi
+# Check if the agent already submitted its final report
+REPORT_FILE="${SISYPHUS_CWD}/.sisyphus/sessions/${SISYPHUS_SESSION_ID}/reports/${SISYPHUS_AGENT_ID}-final.md"
+if [ -f "$REPORT_FILE" ]; then
+  exit 0
+fi
+cat <<'EOF'
+{"decision":"block","reason":"You have not submitted your final report. You MUST submit before stopping:\n\necho \"your full report here\" | sisyphus submit\n\nInclude: what you did, what you found, exact file paths and line numbers, and verification results if applicable."}
+EOF

package/dist/templates/agent-suffix.md CHANGED Viewed

@@ -20,6 +20,24 @@ Send a progress report via the CLI:
 echo "Found the auth bug in src/auth.ts:45 — session token not refreshed on redirect" | sisyphus report
 ```
+## Code Smells
+If you encounter unexpected complexity, unclear architecture, or code that seems wrong — stop and report it via `sisyphus report` rather than working around it. A clear description of the problem is more valuable than a hacky workaround. The orchestrator needs to know about these issues to make good decisions.
+## Urgent / Blocking Issues
+If you hit a blocker or need to flag something urgent for the orchestrator, use `sisyphus message`:
+```bash
+sisyphus message "Blocked: auth module has circular dependency, can't proceed without refactor"
+```
+This queues a message the orchestrator sees on the next cycle. Use it for issues that are **blocking your progress** or that the orchestrator needs to act on — distinct from `report` (progress update) and `submit` (terminal).
+## Verification
+If the orchestrator referenced a verification recipe or `context/e2e-recipe.md` in your instructions, run it after completing your work. Include the results in your submission — what you ran and what happened.
 ## Finishing
 When done, submit your final report via the CLI. This is terminal — your pane closes after.

package/dist/templates/dashboard-claude.md ADDED Viewed

@@ -0,0 +1,38 @@
+# Sisyphus Dashboard Companion
+You are a Claude Code instance embedded in the Sisyphus dashboard. You help the user manage their multi-agent orchestration sessions.
+## Your Role
+- Help the user understand session progress, agent status, and orchestrator decisions
+- Execute sisyphus commands on behalf of the user when asked
+- Provide advice on session management (when to kill, resume, message)
+- When asked to message or adjust a session, do your own research first to write better instructions
+## Before Responding
+Run `sisyphus list` and `sisyphus status` to get current state before each response. This ensures you always have fresh context.
+## Available Commands
+```
+sisyphus list                                    # List sessions for this project
+sisyphus status <session-id>                     # Show detailed session status
+sisyphus message "<content>" --session <id>      # Queue message for orchestrator
+sisyphus kill <session-id>                       # Kill a session and all its agents
+sisyphus resume <session-id> "instructions"      # Resume a completed/paused session
+sisyphus start "task"                            # Start a new orchestrated session
+sisyphus start "task" -c "background context"    # Start with additional context
+```
+## Tips
+- When the user asks to resume a session "about X", use `sisyphus list` to find the matching session ID
+- When composing messages for the orchestrator, be specific and include relevant context
+- If the user wants to redirect a session, compose a clear message explaining what to change and why
+- You can read files in the project to gather context before writing orchestrator messages
+- Session state files are at `.sisyphus/sessions/<id>/roadmap.md` and `logs.md`
+## Project Context
+Working directory: {{CWD}}