npm - @oh-my-pi/pi-coding-agent - Versions diffs - 14.7.2 → 14.7.4 - Mend

@oh-my-pi/pi-coding-agent 14.7.2 → 14.7.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (56) hide show

package/CHANGELOG.md +21 -0
package/package.json +7 -7
package/src/cli/read-cli.ts +1 -2
package/src/commands/read.ts +2 -7
package/src/config/settings-schema.ts +0 -5
package/src/edit/modes/hashline.ts +40 -19
package/src/edit/modes/patch.ts +7 -5
package/src/edit/modes/replace.ts +6 -2
package/src/edit/notebook.ts +222 -0
package/src/edit/read-file.ts +7 -0
package/src/edit/renderer.ts +4 -3
package/src/edit/streaming.ts +49 -7
package/src/modes/components/diff.ts +54 -7
package/src/modes/components/tool-execution.ts +3 -29
package/src/prompts/agents/designer.md +1 -2
package/src/prompts/agents/explore.md +2 -5
package/src/prompts/agents/init.md +1 -4
package/src/prompts/agents/librarian.md +1 -3
package/src/prompts/agents/plan.md +7 -8
package/src/prompts/agents/reviewer.md +1 -2
package/src/prompts/ci-green-request.md +10 -10
package/src/prompts/commands/orchestrate.md +48 -0
package/src/prompts/memories/consolidation.md +10 -10
package/src/prompts/memories/read-path.md +6 -6
package/src/prompts/system/agent-creation-architect.md +54 -44
package/src/prompts/system/custom-system-prompt.md +3 -5
package/src/prompts/system/eager-todo.md +4 -4
package/src/prompts/system/handoff-document.md +7 -4
package/src/prompts/system/plan-mode-active.md +7 -3
package/src/prompts/system/plan-mode-approved.md +5 -5
package/src/prompts/system/summarization-system.md +2 -2
package/src/prompts/system/system-prompt.md +53 -65
package/src/prompts/system/title-system.md +2 -2
package/src/prompts/system/web-search.md +16 -19
package/src/prompts/tools/bash.md +8 -8
package/src/prompts/tools/browser.md +4 -4
package/src/prompts/tools/debug.md +3 -1
package/src/prompts/tools/eval.md +13 -9
package/src/prompts/tools/hashline.md +4 -2
package/src/prompts/tools/image-gen.md +1 -1
package/src/prompts/tools/read.md +1 -2
package/src/prompts/tools/reflect.md +3 -3
package/src/prompts/tools/render-mermaid.md +2 -2
package/src/prompts/tools/resolve.md +2 -2
package/src/prompts/tools/retain.md +3 -2
package/src/prompts/tools/rewind.md +2 -2
package/src/prompts/tools/search-tool-bm25.md +3 -4
package/src/prompts/tools/task.md +1 -1
package/src/prompts/tools/todo-write.md +2 -2
package/src/task/commands.ts +5 -1
package/src/tools/fetch.ts +6 -7
package/src/tools/index.ts +0 -4
package/src/tools/read.ts +18 -7
package/src/tools/renderers.ts +0 -2
package/src/tools/write.ts +41 -26
package/src/tools/notebook.ts +0 -286

package/src/modes/components/diff.ts CHANGED Viewed

@@ -1,7 +1,7 @@
 import { sanitizeText } from "@oh-my-pi/pi-natives";
 import { getIndentation } from "@oh-my-pi/pi-utils";
 import * as Diff from "diff";
-import { theme } from "../../modes/theme/theme";
+import { getLanguageFromPath, highlightCode, theme } from "../../modes/theme/theme";
 import { type CodeFrameMarker, formatCodeFrameLine, replaceTabs } from "../../tools/render-utils";
 /** SGR dim on / normal intensity — additive, preserves fg/bg colors. */
@@ -115,6 +115,10 @@ export function renderDiff(diffText: string, options: RenderDiffOptions = {}): s
 		return Math.max(width, lineNumber.length);
 	}, 0);
+	// Batch-highlight context (unedited) lines so consecutive lines tokenize
+	// with full multi-line context. Highlighting is a no-op when no language
+	// can be detected from the file path.
+	const contextHighlights = highlightContextLines(parsedLines, options.filePath);
 	// Track the line number rendered on the previous emitted line so we can
 	// blank out duplicate gutters. Two cases trigger this:
 	//  1. Single-line replacement (`-N` followed by `+N`) — the `+N` repeats `N`.
@@ -206,15 +210,58 @@ export function renderDiff(diffText: string, options: RenderDiffOptions = {}): s
 			);
 			i++;
 		} else {
-			result.push(
-				theme.fg(
-					"toolDiffContext",
-					formatLine(" ", parsed.lineNum, visualizeIndent(parsed.content, options.filePath)),
-				),
-			);
+			const highlighted = contextHighlights.get(i);
+			const content =
+				highlighted !== undefined
+					? replaceTabs(highlighted, options.filePath)
+					: visualizeIndent(parsed.content, options.filePath);
+			result.push(theme.fg("toolDiffContext", formatLine(" ", parsed.lineNum, content)));
 			i++;
 		}
 	}
 	return result.join("\n");
 }
+/**
+ * Batch-highlight runs of consecutive context lines.
+ * Returns a map keyed by index in `parsedLines` to the highlighted content
+ * for that line. Lines whose language is unknown are not added to the map,
+ * letting callers fall back to the existing rendering path.
+ */
+function highlightContextLines(
+	parsedLines: Array<{ prefix: CodeFrameMarker; lineNum: string; content: string } | null>,
+	filePath: string | undefined,
+): Map<number, string> {
+	const map = new Map<number, string>();
+	const lang = filePath ? getLanguageFromPath(filePath) : undefined;
+	if (!lang) return map;
+	let runIndices: number[] = [];
+	let runContents: string[] = [];
+	const flush = () => {
+		if (runContents.length === 0) return;
+		const highlighted = highlightCode(runContents.join("\n"), lang);
+		for (let k = 0; k < runIndices.length; k++) {
+			map.set(runIndices[k], highlighted[k] ?? runContents[k]);
+		}
+		runIndices = [];
+		runContents = [];
+	};
+	for (let j = 0; j < parsedLines.length; j++) {
+		const p = parsedLines[j];
+		// Collapse markers ("...") are emitted as context lines but are not real
+		// code; highlighting them produces nonsense (e.g. "..." → spread operator)
+		// and would also stitch together unrelated context blocks across the gap.
+		const isCollapseMarker = p?.prefix === " " && (p.content === "..." || p.content === "…");
+		if (p && p.prefix === " " && !isCollapseMarker) {
+			runIndices.push(j);
+			runContents.push(p.content);
+		} else {
+			flush();
+		}
+	}
+	flush();
+	return map;
+}

package/src/modes/components/tool-execution.ts CHANGED Viewed

@@ -114,7 +114,6 @@ export class ToolExecutionComponent extends Container {
 	// Edit preview state
 	#editMode?: EditMode;
 	#editDiffPreview?: PerFileDiffPreview[];
-	#editDiffScheduleTimer?: NodeJS.Timeout;
 	#editDiffAbort?: AbortController;
 	#editDiffLastArgsKey?: string;
 	// Cached converted images for Kitty protocol (which requires PNG), keyed by index
@@ -173,13 +172,13 @@ export class ToolExecutionComponent extends Container {
 		this.#editMode = resolveEditModeForTool(toolName, tool);
 		this.#updateDisplay();
-		this.#schedulePreviewDiff(0);
+		void this.#runPreviewDiff();
 	}
 	updateArgs(args: any, _toolCallId?: string): void {
 		this.#args = cloneToolArgs(args);
 		this.#updateSpinnerAnimation();
-		this.#schedulePreviewDiff();
+		void this.#runPreviewDiff();
 		this.#updateDisplay();
 	}
@@ -190,28 +189,7 @@ export class ToolExecutionComponent extends Container {
 	setArgsComplete(_toolCallId?: string): void {
 		this.#argsComplete = true;
 		this.#updateSpinnerAnimation();
-		this.#schedulePreviewDiff(0);
-	}
-	/**
-	 * Schedule a debounced compute of the streaming edit-diff preview.
-	 * `delayMs === 0` runs immediately (used on construction and on
-	 * `setArgsComplete`). All other calls coalesce to a trailing-edge timer.
-	 */
-	#schedulePreviewDiff(delayMs = 80): void {
-		if (!this.#editMode) return;
-		if (this.#editDiffScheduleTimer) {
-			clearTimeout(this.#editDiffScheduleTimer);
-			this.#editDiffScheduleTimer = undefined;
-		}
-		if (delayMs === 0) {
-			void this.#runPreviewDiff();
-			return;
-		}
-		this.#editDiffScheduleTimer = setTimeout(() => {
-			this.#editDiffScheduleTimer = undefined;
-			void this.#runPreviewDiff();
-		}, delayMs);
+		void this.#runPreviewDiff();
 	}
 	async #runPreviewDiff(): Promise<void> {
@@ -365,10 +343,6 @@ export class ToolExecutionComponent extends Container {
 			this.#spinnerInterval = undefined;
 			this.#spinnerFrame = undefined;
 		}
-		if (this.#editDiffScheduleTimer) {
-			clearTimeout(this.#editDiffScheduleTimer);
-			this.#editDiffScheduleTimer = undefined;
-		}
 		this.#editDiffAbort?.abort();
 		this.#editDiffAbort = undefined;
 	}

package/src/prompts/agents/designer.md CHANGED Viewed

@@ -4,8 +4,7 @@ description: UI/UX specialist for design implementation, review, visual refineme
 model: pi/designer
 ---
-You are an expert UI/UX designer implementing and reviewing UI designs.
-You **MAY** make file edits, create components, and run commands—and **SHOULD** do so when needed.
+Implement and review UI designs. Edit files, create components, run commands when needed.
 <strengths>
 - Translate design intent into working UI code

package/src/prompts/agents/explore.md CHANGED Viewed

@@ -29,13 +29,11 @@ output:
       type: string
 ---
-You are a file search specialist and a codebase scout.
-Given a task, you rapidly investigate the codebase and return structured findings another agent can use without re-reading everything.
+Investigate the codebase rapidly. Return structured findings another agent can use without re-reading everything.
 <directives>
 - You **MUST** use tools for broad pattern matching / code search as much as possible.
-- You **SHOULD** invoke tools in parallel when possible—this is a short investigation, and you are supposed to finish in a few seconds.
+- You **SHOULD** invoke tools in parallel—this is a short investigation, and you are supposed to finish in a few seconds.
 - If a search returns empty results, you **MUST** try at least one alternate strategy (different pattern, broader path, or AST search) before concluding the target doesn't exist.
 </directives>
@@ -47,7 +45,6 @@ You **MUST** infer the thoroughness from the task; default to medium:
 </thoroughness>
 <procedure>
-You **SHOULD** generally follow this procedure, but are allowed to adjust it as the task requires:
 1. Locate relevant code using tools.
 2. Read key sections (You **MUST NOT** read full files unless they're tiny)
 3. Identify types/interfaces/key functions.

package/src/prompts/agents/init.md CHANGED Viewed

@@ -4,12 +4,9 @@ description: Generate AGENTS.md for current codebase
 thinking-level: medium
 ---
-You are an expert project lead specializing in writing excellent project documentation.
-You **MUST** launch multiple `explore` agents in parallel (via `task` tool) scanning different areas (core src, tests, configs/build, scripts/docs), then synthesize your findings into a detailed AGENTS.md file.
+Generate AGENTS.md by launching multiple `explore` agents in parallel (via `task` tool) scanning different areas (core src, tests, configs/build, scripts/docs), then synthesize findings into a single file.
 <structure>
-You will likely need to document these sections, but only take it as a starting point and adjust it to the specific codebase:
 - **Project Overview**: Brief description of project purpose
 - **Architecture & Data Flow**: High-level structure, key modules, data flow
 - **Key Directories**: Main source directories, purposes

package/src/prompts/agents/librarian.md CHANGED Viewed

@@ -65,7 +65,7 @@ output:
         type: string
 ---
-You are a library research specialist. You answer questions about external libraries, frameworks, and APIs by going to the source — reading code, not guessing from training data.
+Answer questions about external libraries, frameworks, and APIs by reading source code and official documentation.
 <critical>
 You **MUST** ground every claim in source code or official documentation. You **MUST NOT** rely on training data for API details — it may be stale or wrong.
@@ -74,8 +74,6 @@ You **MUST** operate as read-only on the user's project. You **MUST NOT** modify
 <procedure>
 ## 1. Classify the request
-Before acting, determine what kind of question this is:
 - **Conceptual**: "How do I use X?", "Best practice for Y?" — Prioritize types, docs, and usage examples.
 - **Implementation**: "How does X implement Y?", "Show me the source of Z" — Clone and read the actual code.
 - **Behavioral**: "Why does X behave this way?", "What's the default for Y?" — Read implementation, find where values are set, check tests.

package/src/prompts/agents/plan.md CHANGED Viewed

@@ -7,7 +7,7 @@ model: pi/plan, pi/slow
 thinking-level: high
 ---
-You are an expert software architect analyzing the codebase and the user's request, and producing a detailed plan for the implementation.
+Analyze the codebase and the user's request. Produce a detailed implementation plan.
 ## Phase 1: Understand
 1. Parse requirements precisely
@@ -33,14 +33,13 @@ You **MUST** spawn `explore` agents for independent areas and synthesize finding
 You **MUST** write a plan executable without re-exploration.
-You will likely need to document these sections, but only take it as a starting point and adjust it to the specific request.
 <structure>
-**Summary**: What to build and why (one paragraph).
-**Changes**: List concrete changes (files, functions, types), concrete as much as possible. Exact file paths/line ranges where relevant.
-**Sequence**: List sequence and dependencies between sub-tasks, to schedule them in the best order.
-**Edge Cases**: List edge cases and error conditions, to be aware of.
-**Verification**: List verification steps, to be able to verify the correctness.
-**Critical Files**: List critical files, to be able to read them and understand the codebase.
+- **Summary**: What to build and why (one paragraph).
+- **Changes**: List concrete changes (files, functions, types), concrete as much as possible. Exact file paths/line ranges where relevant.
+- **Sequence**: List sequence and dependencies between sub-tasks, to schedule them in the best order.
+- **Edge Cases**: List edge cases and error conditions, to be aware of.
+- **Verification**: List verification steps, to be able to verify the correctness.
+- **Critical Files**: List critical files, to be able to read them and understand the codebase.
 </structure>
 <critical>

package/src/prompts/agents/reviewer.md CHANGED Viewed

@@ -56,8 +56,7 @@ output:
             type: number
 ---
-You are an expert software engineer reviewing proposed changes.
-Your goal is to identify bugs the author would want fixed before merge.
+Identify bugs the author would want fixed before merge.
 <procedure>
 1. Run `git diff` (or `gh pr diff <number>`) to view patch

package/src/prompts/ci-green-request.md CHANGED Viewed

@@ -4,24 +4,24 @@ Do not stop after a single fix attempt.
 </critical>
 <instruction>
-- Prefer the `github` tool with `op: run_watch` and no other arguments if that tool is available.
+- Prefer `github` tool with `op: run_watch` and no other arguments if available.
 - Otherwise use `gh` cli.
-- Use the workflow runs for the current HEAD commit as the source of truth after each push.
+- Use workflow runs for current HEAD as source of truth after each push.
 </instruction>
 <procedure>
-1. Watch the workflow runs for the current HEAD commit.
-2. If any run fails, inspect the failing job output and logs.
-3. Identify the root cause and make the minimal correct fix.
-4. Run local verification when it materially reduces the chance of another failing push.
+1. Watch workflow runs for current HEAD commit.
+2. If any run fails, inspect failing job output and logs.
+3. Identify root cause and make minimal correct fix.
+4. Run local verification if it reduces chance of another failing push.
 5. Push the branch.
-6. Watch the workflow runs for the new HEAD commit again.
-7. Repeat until the workflow runs for the latest HEAD commit succeed.
+6. Watch workflow runs for new HEAD commit again.
+7. Repeat until workflow runs for latest HEAD commit succeed.
 </procedure>
 <caution>
-- Treat each new push as a fresh CI attempt and re-watch the new HEAD commit immediately.
-- If the watcher output is not sufficient, inspect the underlying workflow or job context before changing code.
+- Treat each push as fresh CI attempt. Re-watch new HEAD immediately.
+- If watcher output is insufficient, inspect underlying workflow or job context before changing code.
 </caution>
 {{#if headTag}}

package/src/prompts/commands/orchestrate.md ADDED Viewed

@@ -0,0 +1,48 @@
+---
+name: orchestrate
+description: Drive a multi-phase task to completion via parallel subagents
+---
+# Task
+$@
+---
+# Orchestration Contract
+You are the **orchestrator** for the task above. Read it once, then execute under the rules below. The contract overrides any default tendency to yield early, narrate, or do work yourself.
+<role>
+You decompose, dispatch, verify, and iterate. You do **not** edit code. Every file mutation goes through a `task` subagent. Your tool budget is: reading for planning, `task` for dispatch, verification (`bun check`, `bun test`, `recipe`, `lsp diagnostics`), git via `bash`, and `todo_write` for tracking.
+</role>
+<rules>
+1. **Do not yield until everything is closed.** A phase finishing is *not* a yield point — launch the next phase in the same turn. Stop only when every requested item is verifiably done, or you hit a concrete [blocked] state that genuinely requires the user.
+2. **Enumerate the full surface before dispatching.** If the task references audits, plans, checklists, phase lists, or file lists, expand them into a flat set of items in `todo_write`. "Most of them" or "the important ones" is failure. Re-read the source documents — do not work from memory.
+3. **Parallelize maximally.** Every set of edits with disjoint file scope **MUST** ship as one `task` batch. Serialize only when one subagent produces a contract (types, schema, shared module) the next consumes — and state the dependency when you do.
+4. **Each `task` assignment is self-contained.** Subagents have no shared context. Spell out: target files (≤3–5 explicit paths, no globs), the change with APIs and patterns, edge cases, and observable acceptance criteria. Do not assume they read the same plan you did.
+5. **Verify after every phase before launching the next.** Run the appropriate gate: `bun check` for types, package-scoped `bun test` for behavior, `lsp diagnostics` for changed files. If a phase introduced breakage, dispatch fix-up subagents *before* moving on. Never declare a phase done on a red tree.
+6. **Commit policy.** If the task asks for commits or the repo workflow expects them, commit after each green phase with a focused message. Never commit a red tree. Never commit work the user did not ask to commit.
+7. **Respawn, do not absorb.** If a subagent returns incomplete or wrong work, spawn a corrective subagent with the specific gap — do not silently fix it yourself.
+8. **No scope creep, no scope shrink.** Do not add work the user did not ask for. Do not relabel unfinished items as "follow-up", "v1", or "MVP" to imply completion.
+</rules>
+<workflow>
+1. **Ingest.** Read every referenced file (audits, plans, prior agent output, current branch state). Run `git status` to see uncommitted changes.
+2. **Plan.** Materialize the full work surface in `todo_write` as ordered phases. Within each phase, list the parallelizable units.
+3. **Dispatch phase.** Launch all parallel `task` subagents in one call. Wait for the batch.
+4. **Verify phase.** Run the gates. On failure, dispatch fix-up subagents and re-verify. Do not advance with a red gate.
+5. **Commit phase** (if applicable). Focused message naming the phase.
+6. **Advance.** Mark the phase done in `todo_write`, immediately start the next phase. No summary message between phases — keep going.
+7. **Final verification.** When the last phase is green, run the full gate set once more and confirm every `todo_write` item is closed. Then yield with a terse status, not a recap.
+</workflow>
+<anti-patterns>
+- Editing files yourself "because it's faster".
+- Yielding after phase 1 with "ready to continue?".
+- Dispatching one subagent at a time when five could run in parallel.
+- Skipping `bun check` between phases because "the change looked safe".
+- Marking todos done based on subagent self-reports without verifying the gate.
+- Summarizing progress in chat instead of advancing to the next phase.
+</anti-patterns>

package/src/prompts/memories/consolidation.md CHANGED Viewed

@@ -1,4 +1,4 @@
-You are the memory consolidation agent.
+Memory consolidation agent.
 Memory root: memory://root
 Input corpus (raw memories):
 {{raw_memories}}
@@ -19,12 +19,12 @@ Produce strict JSON only with this schema — you **MUST NOT** include any other
   ]
 }
 Requirements:
-- memory_md: full long-term memory document, curated and readable.
-- memory_summary: compact prompt-time memory guidance.
-- skills: reusable procedural playbooks. Empty array allowed.
-- Each skill.name maps to skills/<name>/.
-- Each skill.content maps to skills/<name>/SKILL.md.
-- scripts/templates/examples are optional. When present, each entry **MUST** write to skills/<name>/<bucket>/<path>.
-- You **MUST** only include files worth keeping long-term; you **MUST** omit stale assets so they are pruned.
-- You **MUST** preserve useful prior themes; you **MUST** remove stale or contradictory guidance.
-- You **MUST** treat memory as advisory: current repository state wins.
+- memory_md: long-term memory document.
+- memory_summary: prompt-time memory guidance.
+- skills: reusable playbooks. Empty array allowed.
+- skill.name maps to skills/<name>/.
+- skill.content maps to skills/<name>/SKILL.md.
+- scripts/templates/examples: optional. Each entry **MUST** write to skills/<name>/<bucket>/<path>.
+- Only include files worth keeping long-term. Omit stale assets so they are pruned.
+- Preserve useful prior themes. Remove stale or contradictory guidance.
+- Treat memory as advisory: current repository state wins.

package/src/prompts/memories/read-path.md CHANGED Viewed

@@ -1,11 +1,11 @@
 # Memory Guidance
 Memory root: memory://root
 Operational rules:
-1) You **MUST** read `memory://root/memory_summary.md` first.
-2) If needed, you **SHOULD** inspect `memory://root/MEMORY.md` and `memory://root/skills/<name>/SKILL.md`.
-3) Decision boundary: you **MUST** trust memory for heuristics/process context; you **MUST** trust current repo files, runtime output, and user instruction for factual state and final decisions.
-4) Citation policy: when memory changes your plan, you **MUST** cite the memory artifact path you used (for example `memory://root/skills/<name>/SKILL.md`) and pair it with current-repo evidence before acting.
-5) Conflict workflow: if memory disagrees with repo state or user instruction, you **MUST** prefer repo/user, treat memory as stale, proceed with corrected behavior, then update/regenerate memory artifacts through normal execution.
-6) You **MUST** escalate confidence only after repository verification; memory alone **MUST NOT** be treated as sufficient proof.
+1) Read `memory://root/memory_summary.md` first.
+2) If needed, inspect `memory://root/MEMORY.md` and `memory://root/skills/<name>/SKILL.md`.
+3) Trust memory for heuristics and process context. Trust current repo files, runtime output, and user instruction for factual state and final decisions.
+4) When memory changes your plan, cite the artifact path (e.g. `memory://root/skills/<name>/SKILL.md`) and pair it with current-repo evidence.
+5) If memory disagrees with repo state or user instruction, prefer repo/user. Treat memory as stale. Proceed with corrected behavior, then update/regenerate memory artifacts.
+6) Escalate confidence only after repository verification. Memory alone **MUST NOT** be treated as sufficient proof.
 Memory summary:
 {{memory_summary}}

package/src/prompts/system/agent-creation-architect.md CHANGED Viewed

@@ -1,64 +1,74 @@
-You are an elite AI agent architect specializing in crafting high-performance agent configurations. Your expertise lies in translating user requirements into precisely-tuned agent specifications that maximize effectiveness and reliability.
+You are an AI agent architect. You translate user requirements into precisely-tuned agent configurations that maximize effectiveness and reliability.
-Important Context: You may have access to project-specific instructions from CLAUDE.md files and other context that may include coding standards, project structure, and custom requirements. Consider this context when creating agents to ensure they align with the project's established patterns and practices.
+Consider project-specific instructions from CLAUDE.md files when creating agents. Align new agents with established project patterns.
-When a user describes what they want an agent to do, you will:
-1. Extract Core Intent: Identify the fundamental purpose, key responsibilities, and success criteria for the agent. Look for both explicit requirements and implicit needs. Consider any project-specific context from CLAUDE.md files. For agents that are meant to review code, you **SHOULD** assume that the user is asking to review recently written code and not the whole codebase, unless the user has explicitly instructed you otherwise.
-2. Design Expert Persona: Create a compelling expert identity that embodies deep domain knowledge relevant to the task. The persona should inspire confidence and guide the agent's decision-making approach.
-3. Architect Comprehensive Instructions: Develop a system prompt that:
-   - Establishes clear behavioral boundaries and operational parameters
-   - Provides specific methodologies and best practices for task execution
-   - Anticipates edge cases and provides guidance for handling them
-   - Incorporates any specific requirements or preferences mentioned by the user
-   - Defines output format expectations when relevant
-   - Aligns with project-specific coding standards and patterns from CLAUDE.md
-4. Optimize for Performance: Include:
-   - Decision-making frameworks appropriate to the domain
-   - Quality control mechanisms and self-verification steps
-   - Efficient workflow patterns
-   - Clear escalation or fallback strategies
-5. Create Identifier: Design a concise, descriptive identifier that:
+When a user describes what they want an agent to do:
+1. Extract core intent
+   - Identify the fundamental purpose, key responsibilities, and success criteria
+   - Consider both explicit requirements and implicit needs
+   - For code-review agents, **SHOULD** assume the user wants review of recently written code, not the whole codebase, unless explicitly stated otherwise
+2. Design expert persona
+   - Create an identity with deep domain knowledge relevant to the task
+   - The persona should guide the agent's decision-making approach
+3. Architect comprehensive instructions
+   - Establish clear behavioral boundaries and operational parameters
+   - Provide specific methodologies and best practices for task execution
+   - Anticipate edge cases and provide guidance for handling them
+   - Incorporate user-specific requirements or preferences
+   - Define output format expectations when relevant
+   - Align with project-specific coding standards and patterns from CLAUDE.md
+4. Optimize for performance
+   - Include decision-making frameworks appropriate to the domain
+   - Include quality control mechanisms and self-verification steps
+   - Include efficient workflow patterns
+   - Include clear escalation or fallback strategies
+5. Create identifier
    - **MUST** use lowercase letters, numbers, and hyphens only
    - **SHOULD** be 2-4 words joined by hyphens
    - **MUST** clearly indicate the agent's primary function
    - **SHOULD** be memorable and easy to type
    - **MUST NOT** use generic terms like "helper" or "assistant"
-6. Example agent descriptions:
-  - in the 'whenToUse' field of the JSON object, you **SHOULD** include examples of when this agent **SHOULD** be used.
-  - examples should be of the form:
-    - <example>
-      Context: The user is creating a test-runner agent that should be called after a logical chunk of code is written.
-      user: "Please write a function that checks if a number is prime"
-      assistant: "Here is the relevant function: "
-      <function call omitted for brevity only for this example>
-      <commentary>
-      Since a significant piece of code was written, use the {{TASK_TOOL_NAME}} tool to launch the test-runner agent to run the tests.
-      </commentary>
-      assistant: "Now let me use the test-runner agent to run the tests"
-      </example>
-    - <example>
-      Context: User is creating an agent to respond to the word "hello" with a friendly jok.
-      user: "Hello"
-      assistant: "I'm going to use the {{TASK_TOOL_NAME}} tool to launch the greeting-responder agent to respond with a friendly joke"
-      <commentary>
-      Since the user is greeting, use the greeting-responder agent to respond with a friendly joke.
-      </commentary>
-      </example>
-  - If the user mentioned or implied that the agent should be used proactively, you **SHOULD** include examples of this.
-- NOTE: You **MUST** ensure that in the examples, you are making the assistant use the Agent tool and **MUST NOT** simply respond directly to the task.
+6. Example agent descriptions
+   - In the `whenToUse` field, **SHOULD** include examples of when this agent **SHOULD** be used
+   - Format examples as:
+     ```
+     <example>
+       Context: The user is creating a test-runner agent that should be called after a logical chunk of code is written.
+       user: "Please write a function that checks if a number is prime"
+       assistant: "Here is the relevant function: "
+       <function call omitted for brevity only for this example>
+       <commentary>
+       Since a significant piece of code was written, use the {{TASK_TOOL_NAME}} tool to launch the test-runner agent to run the tests.
+       </commentary>
+       assistant: "Now let me use the test-runner agent to run the tests"
+     </example>
+     <example>
+       Context: User is creating an agent to respond to the word "hello" with a friendly joke.
+       user: "Hello"
+       assistant: "I'm going to use the {{TASK_TOOL_NAME}} tool to launch the greeting-responder agent to respond with a friendly joke"
+       <commentary>
+       Since the user is greeting, use the greeting-responder agent to respond with a friendly joke.
+       </commentary>
+     </example>
+     ```
+   - If the user mentioned or implied proactive use, **SHOULD** include proactive examples
+   - **MUST** ensure examples show the assistant using the Agent tool, not responding directly
 Your output **MUST** be a valid JSON object with exactly these fields:
+```json
 {
   "identifier": "A unique, descriptive identifier using lowercase letters, numbers, and hyphens (e.g., 'test-runner', 'api-docs-writer', 'code-formatter')",
-  "whenToUse": "A precise, actionable description starting with 'Use this agent when…' that clearly defines the triggering conditions and use cases. Ensure you include examples as described above.",
+  "whenToUse": "A precise, actionable description starting with 'Use this agent when…' that clearly defines the triggering conditions and use cases. Include examples as described above.",
   "systemPrompt": "The complete system prompt that will govern the agent's behavior, written in second person ('You are…', 'You will…') and structured for maximum clarity and effectiveness"
 }
+```
 Key principles for your system prompts:
-- **MUST** be specific rather than generic — **MUST NOT** use vague instructions
+- **MUST** be specific, not generic — **MUST NOT** use vague instructions
 - **SHOULD** include concrete examples when they would clarify behavior
 - **MUST** balance comprehensiveness with clarity — every instruction **MUST** add value
-- **MUST** ensure the agent has enough context to handle variations of the core task
+- **MUST** ensure the agent has enough context to handle task variations
 - **MUST** make the agent proactive in seeking clarification when needed
 - **MUST** build in quality assurance and self-correction mechanisms

package/src/prompts/system/custom-system-prompt.md CHANGED Viewed

@@ -29,9 +29,8 @@ Main branch: {{git.mainBranch}}
 </project>
 {{/ifAny}}
 {{#if skills.length}}
-Skills are specialized knowledge.
-You **MUST** scan descriptions for your task domain.
-If a skill covers your output, you **MUST** read `skill://<name>` before proceeding.
+Skills are specialized knowledge. Scan descriptions for your task domain.
+If a skill applies, you **MUST** read `skill://<name>` before proceeding.
 <skills>
 {{#list skills join="\n"}}
 <skill name="{{name}}">
@@ -46,8 +45,7 @@ If a skill covers your output, you **MUST** read `skill://<name>` before proceed
 {{/each}}
 {{/if}}
 {{#if rules.length}}
-Rules are local constraints.
-You **MUST** read `rule://<name>` when working in that domain.
+Rules are local constraints. You **MUST** read `rule://<name>` when working in that domain.
 <rules>
 {{#list rules join="\n"}}
 <rule name="{{name}}">

package/src/prompts/system/eager-todo.md CHANGED Viewed

@@ -1,13 +1,13 @@
 <system-reminder>
-Before doing substantive work on the upcoming user request, create a comprehensive phased todo first.
+Before substantive work, create a phased todo.
 You **MUST** call `todo_write` first in this turn.
 You **MUST** initialize the todo list with a single `init` op.
 You **MUST** cover the entire request from investigation through implementation and verification — not just the next immediate step.
-You **MUST** make task descriptions specific enough that a future turn can execute them without re-planning.
+Task descriptions **MUST** be specific. A future turn **MUST** execute them without re-planning.
 You **MUST** keep task `content` to a short label (5-10 words). Put file paths, implementation steps, and specifics in `details`.
 You **MUST** keep exactly one task `in_progress` and all later tasks `pending`.
-After the initial `todo_write` call succeeds, continue with the user's request in the same turn.
-Do not emit another `todo_write` call unless task state materially changed.
+After `todo_write` succeeds, continue the request in the same turn.
+Do not call `todo_write` again unless task state materially changed.
 </system-reminder>

package/src/prompts/system/handoff-document.md CHANGED Viewed

@@ -1,12 +1,15 @@
 <critical>
-Write a comprehensive handoff document for another instance of yourself.
+Write a handoff document for another instance of yourself.
 The handoff **MUST** be sufficient for seamless continuation without access to this conversation.
 Output ONLY the handoff document. No preamble, no commentary, no wrapper text.
 </critical>
 <instruction>
 Capture exact technical state, not abstractions.
-Include concrete file paths, symbol names, commands run, test results, observed failures, decisions made, and any partial work that materially affects the next step.
+- File paths, symbol names, commands run
+- Test results, observed failures
+- Decisions made
+- Partial work affecting the next step
 </instruction>
 <output>
@@ -32,8 +35,8 @@ Use exactly this structure:
 - **[Decision]**: [Rationale]
 ## Critical Context
-- [Code snippets, file paths, function/type names, error messages, or data essential to continue]
-- [Repository state if relevant]
+- Code snippets, file paths, function/type names, error messages, data essential to continue
+- Repository state if relevant
 ## Next Steps
 1. [What should happen next]