npm - ultimate-pi - Versions diffs - 0.8.0 → 0.9.1 - Mend

ultimate-pi 0.8.0 → 0.9.1

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Files changed (21)

package/.agents/skills/harness-plan/SKILL.md +6 -6
package/.pi/agents/harness/planner.md +9 -10
package/.pi/extensions/budget-guard.ts +46 -17
package/.pi/extensions/harness-run-context.ts +150 -28
package/.pi/extensions/lib/harness-subagents/harness-subagent-policy.ts +1 -1
package/.pi/extensions/lib/harness-subagents/parent-ask-user-bridge.ts +89 -0
package/.pi/extensions/lib/harness-subagents/spawn-policy.ts +20 -2
package/.pi/extensions/lib/harness-subagents/vendored/agent-manager.ts +1 -0
package/.pi/extensions/lib/harness-subagents/vendored/agent-runner.ts +40 -24
package/.pi/extensions/lib/harness-subagents/vendored/index.ts +21 -0
package/.pi/extensions/policy-gate.ts +4 -4
package/.pi/harness/agents.manifest.json +82 -82
package/.pi/harness/docs/adrs/0031-harness-run-context.md +1 -1
package/.pi/harness/docs/adrs/0032-harness-command-orchestration.md +6 -6
package/.pi/harness/specs/budget-exhausted-event.schema.json +3 -1
package/.pi/harness/specs/harness-turn.schema.json +18 -0
package/.pi/lib/harness-run-context.ts +166 -32
package/.pi/prompts/harness-plan.md +12 -14
package/.pi/scripts/harness-verify.mjs +29 -1
package/CHANGELOG.md +12 -0
package/package.json +2 -2

package/.pi/lib/harness-run-context.ts CHANGED Viewed

@@ -129,6 +129,36 @@ export interface PlanUserApproval {
 	source: "ask_user" | "harness-plan-approval" | "noninteractive";
 }
+/** Persisted on `input` when user invokes a raw `/harness-*` prompt template. */
+export interface HarnessTurnEntry {
+	schema_version: "1.0.0";
+	command: string;
+	args: string;
+	source: "slash";
+	invoked_at: string;
+}
+export const HARNESS_COMMAND_PHASE: Record<string, HarnessPhase> = {
+	"harness-plan": "plan",
+	"harness-auto": "plan",
+	"harness-run": "execute",
+	"harness-eval": "evaluate",
+	"harness-review": "evaluate",
+	"harness-critic": "adversary",
+	"harness-trace": "evaluate",
+	"harness-incident": "evaluate",
+	"harness-drift-replan": "plan",
+	"harness-drift-proceed": "execute",
+	"harness-abort": "plan",
+	"harness-new-run": "plan",
+	"harness-run-status": "plan",
+	"harness-use-run": "plan",
+	"harness-policy-status": "merge",
+	"harness-router-tune": "plan",
+	"harness-budget-status": "plan",
+	"harness-setup": "execute",
+};
 export interface PlanPhaseMutationDecision {
 	allowed: boolean;
 	reason?: string;
@@ -193,11 +223,40 @@ export async function isPlanPhaseScopedWrite(
 	return isCanonicalPlanPacketPath(resolved, projectRoot, runCtx.run_id);
 }
+export function getLatestHarnessTurn(
+	entries: unknown[],
+): HarnessTurnEntry | null {
+	for (let i = entries.length - 1; i >= 0; i--) {
+		const entry = entries[i] as SessionEntryLike;
+		if (entry.type !== "custom" || entry.customType !== "harness-turn") {
+			continue;
+		}
+		const data = entry.data as Partial<HarnessTurnEntry> | undefined;
+		if (data?.command && typeof data.command === "string") {
+			return {
+				schema_version: "1.0.0",
+				command: data.command,
+				args: typeof data.args === "string" ? data.args : "",
+				source: "slash",
+				invoked_at:
+					typeof data.invoked_at === "string" ? data.invoked_at : nowIso(),
+			};
+		}
+	}
+	return null;
+}
 export function indexOfLastPlanCommand(entries: unknown[]): number {
 	for (let i = entries.length - 1; i >= 0; i--) {
 		const entry = entries[i] as SessionEntryLike & {
 			message?: { role?: string; content?: string | unknown[] };
 		};
+		if (entry.type === "custom" && entry.customType === "harness-turn") {
+			const cmd = (entry.data as { command?: string })?.command;
+			if (cmd === "harness-plan" || cmd === "harness-auto") {
+				return i;
+			}
+		}
 		if (
 			entry.type === "custom" &&
 			entry.customType === "harness-plan-attempt"
@@ -221,7 +280,7 @@ export function indexOfLastPlanCommand(entries: unknown[]): number {
 							.join("\n")
 					: "";
 		const visible = userVisiblePromptSlice(text);
-		const parsed = parseHarnessSlashCommand(visible);
+		const parsed = parseHarnessSlashInput(visible);
 		if (
 			parsed?.command === "harness-plan" ||
 			parsed?.command === "harness-auto"
@@ -342,7 +401,7 @@ export function isHarnessAutoSession(entries: unknown[]): boolean {
 			typeof entry.message.content === "string"
 				? userVisiblePromptSlice(entry.message.content)
 				: "";
-		const parsed = parseHarnessSlashCommand(text);
+		const parsed = parseHarnessSlashInput(text);
 		if (parsed?.command === "harness-auto") return true;
 	}
 	return false;
@@ -469,18 +528,16 @@ export function nowIso(): string {
 	return new Date().toISOString();
 }
+/** @deprecated Use parseHarnessSlashInput on raw `input` event text only. */
 export function isHarnessSlashCommand(prompt: string): boolean {
-	const trimmed = prompt.trim();
-	if (!trimmed.startsWith("/harness-")) return false;
-	const match = trimmed.match(/^\/(harness-[a-z0-9-]+)/);
-	if (!match) return false;
-	return HARNESS_COMMANDS.has(match[1]);
+	return parseHarnessSlashInput(prompt) !== null;
 }
-export function parseHarnessSlashCommand(
-	prompt: string,
+/** Parse raw user input before prompt-template expansion (`input` hook only). */
+export function parseHarnessSlashInput(
+	text: string,
 ): { command: string; args: string } | null {
-	const trimmed = prompt.trim();
+	const trimmed = text.trim();
 	const match = trimmed.match(/^\/(harness-[a-z0-9-]+)(?:\s+([\s\S]*))?$/);
 	if (!match) return null;
 	const command = match[1];
@@ -488,6 +545,13 @@ export function parseHarnessSlashCommand(
 	return { command, args: (match[2] ?? "").trim() };
 }
+/** @deprecated Prefer parseHarnessSlashInput on raw input; kept for expanded-prompt fallbacks. */
+export function parseHarnessSlashCommand(
+	prompt: string,
+): { command: string; args: string } | null {
+	return parseHarnessSlashInput(userVisiblePromptSlice(prompt));
+}
 /** User-visible prompt slice for policy signals (exclude injected blocks). */
 export function userVisiblePromptSlice(prompt: string): string {
 	const markers = [
@@ -720,7 +784,32 @@ export function planPacketSummary(
 	};
 }
-export function formatPlanContextBlock(ctx: HarnessRunContext): string {
+export function buildHarnessSpawnContextSnippet(
+	ctx: HarnessRunContext,
+	opts?: { mode?: "create" | "revise"; risk_level?: string; quick?: boolean },
+): string {
+	const mode =
+		opts?.mode ??
+		(ctx.plan_ready || ctx.status === "aborted" ? "revise" : "create");
+	return JSON.stringify(
+		{
+			schema_version: "1.0.0",
+			run_id: ctx.run_id,
+			plan_packet_path: ctx.plan_packet_path,
+			task_summary: ctx.task_summary,
+			mode,
+			risk_level: opts?.risk_level ?? "med",
+			quick: opts?.quick ?? false,
+		},
+		null,
+		2,
+	);
+}
+export function formatPlanContextBlock(
+	ctx: HarnessRunContext,
+	opts?: { mode?: "create" | "revise"; risk_level?: string; quick?: boolean },
+): string {
 	const lines = [
 		"[HarnessRunContext]",
 		`run_id=${ctx.run_id}`,
@@ -735,6 +824,12 @@ export function formatPlanContextBlock(ctx: HarnessRunContext): string {
 	if (ctx.plan_packet_path) {
 		lines.push(`plan_packet_path=${ctx.plan_packet_path}`);
 	}
+	if (ctx.task_summary) {
+		lines.push(`task_summary=${ctx.task_summary}`);
+	}
+	lines.push(
+		`HarnessSpawnContext=${buildHarnessSpawnContextSnippet(ctx, opts)}`,
+	);
 	return lines.join("\n");
 }
@@ -850,7 +945,7 @@ export function shouldReuseHarnessRunId(
 	ctx: HarnessRunContext | null,
 	command: string | null,
 ): boolean {
-	if (!command || !isHarnessSlashCommand(prompt)) return false;
+	if (!command) return false;
 	if (command === "harness-new-run") return false;
 	if (!ctx) return false;
 	if (command === "harness-plan" || command === "harness-auto") {
@@ -875,27 +970,43 @@ export interface HarnessPolicyState {
 	aborted: boolean;
 }
+export function inferHarnessPhaseFromTurn(entries: unknown[]): HarnessPhase | null {
+	const turn = getLatestHarnessTurn(entries);
+	if (!turn) return null;
+	return HARNESS_COMMAND_PHASE[turn.command] ?? null;
+}
+/** Prefer session `harness-turn`; fall back to raw slash in visible prompt only. */
+export function inferHarnessPhase(
+	entries: unknown[],
+	userPrompt?: string,
+): HarnessPhase {
+	const fromTurn = inferHarnessPhaseFromTurn(entries);
+	if (fromTurn) return fromTurn;
+	if (userPrompt) {
+		const parsed = parseHarnessSlashInput(userVisiblePromptSlice(userPrompt));
+		if (parsed && HARNESS_COMMAND_PHASE[parsed.command]) {
+			return HARNESS_COMMAND_PHASE[parsed.command];
+		}
+	}
+	return "execute";
+}
+/** @deprecated Use inferHarnessPhase(entries, prompt) — substring matching causes false plan phase. */
 export function inferHarnessPhaseFromPrompt(prompt: string): HarnessPhase {
-	const p = prompt.toLowerCase();
-	if (
-		p.includes("/harness-plan") ||
-		p.includes("harness-plan") ||
-		p.includes("/harness-auto") ||
-		p.includes("harness-auto")
-	) {
-		return "plan";
+	const p = userVisiblePromptSlice(prompt).toLowerCase();
+	const parsed = parseHarnessSlashInput(userVisiblePromptSlice(prompt));
+	if (parsed && HARNESS_COMMAND_PHASE[parsed.command]) {
+		return HARNESS_COMMAND_PHASE[parsed.command];
 	}
-	if (p.includes("/harness-run") || p.includes("harness-run")) return "execute";
-	if (p.includes("/harness-eval") || p.includes("harness-eval")) {
-		return "evaluate";
+	if (p.startsWith("/harness-plan") || p.startsWith("/harness-auto")) {
+		return "plan";
 	}
-	if (p.includes("/harness-review") || p.includes("harness-review")) {
+	if (p.startsWith("/harness-run")) return "execute";
+	if (p.startsWith("/harness-eval") || p.startsWith("/harness-review")) {
 		return "evaluate";
 	}
-	if (p.includes("/harness-critic") || p.includes("harness-critic")) {
-		return "adversary";
-	}
-	if (p.includes("adversary")) return "adversary";
+	if (p.startsWith("/harness-critic")) return "adversary";
 	if (p.includes("merge gate") || p.includes("policy decision")) return "merge";
 	return "execute";
 }
@@ -914,8 +1025,8 @@ export function isValidHarnessPhaseTransition(
 export function getLatestPolicyState(entries: unknown[]): HarnessPolicyState {
 	const fallback: HarnessPolicyState = {
-		phase: "execute",
-		approvedPlan: true,
+		phase: "plan",
+		approvedPlan: false,
 		planId: null,
 		aborted: false,
 	};
@@ -970,7 +1081,7 @@ export function getPolicyTransitionBlock(
 		return { blocked: false };
 	}
 	const state = getLatestPolicyState(entries);
-	const nextPhase = inferHarnessPhaseFromPrompt(userPrompt);
+	const nextPhase = inferHarnessPhase(entries, userPrompt);
 	if (!isValidHarnessPhaseTransition(state.phase, nextPhase)) {
 		return {
 			blocked: true,
@@ -1014,7 +1125,7 @@ export function isNewTaskPlanBlocked(
 ): boolean {
 	if (ctx.status !== "active") return false;
 	if (isAmendPlanAllowed(ctx, prompt, false)) return false;
-	const cmd = parseHarnessSlashCommand(prompt);
+	const cmd = parseHarnessSlashInput(userVisiblePromptSlice(prompt));
 	if (cmd?.command !== "harness-plan") return false;
 	const taskMatch = prompt.match(/"([^"]+)"/);
 	if (!taskMatch || !ctx.task_summary) return true;
@@ -1137,3 +1248,26 @@ export function driftGateActive(entries: unknown[]): boolean {
 export function phaseTraceFileName(phase: HarnessPhase): string {
 	return `trace-${phase}.json`;
 }
+/** Collect plan approvals from a session entry list (e.g. subagent in-memory session). */
+export function extractPlanApprovalsFromEntries(
+	entries: unknown[],
+): PlanUserApproval[] {
+	const out: PlanUserApproval[] = [];
+	for (let i = 0; i < entries.length; i++) {
+		const entry = entries[i] as SessionEntryLike & {
+			message?: {
+				role?: string;
+				toolName?: string;
+				details?: unknown;
+				content?: { type?: string; text?: string }[];
+			};
+		};
+		if (entry.type !== "message" || entry.message?.role !== "toolResult") {
+			continue;
+		}
+		const fromAsk = parseAskUserApprovalFromMessage(entry.message);
+		if (fromAsk) out.push(fromAsk);
+	}
+	return out;
+}

package/.pi/prompts/harness-plan.md CHANGED Viewed

@@ -5,7 +5,7 @@ argument-hint: "\"<task>\" [--risk low|med|high] [--budget <amount>] [--quick]"
 # harness-plan
-Orchestrator only — spawn `harness/planner`, present draft, run `ask_user`, write plan after Approve. Do **not** plan inline in this session.
+Orchestrator only — spawn `harness/planner` once; planner runs clarification and approval via `ask_user` (parent UI). Write `plan-packet.json` only after approval. Do **not** plan inline in this session.
 ## Step 0 — Parse arguments
@@ -22,39 +22,37 @@ If task is missing:
 ## Active plan context
+Use injected context only — **do not** read `.pi/harness/specs/*.schema.json` or explore specs with bash.
 If `[HarnessActivePlan]` is present:
-- Read current packet from `plan_packet_path` first.
 - Treat task as **revise/amend** unless `/harness-new-run` was used.
-- Pass `mode: revise` in spawn context.
+- Pass `mode: revise` using the `HarnessSpawnContext` JSON in `[HarnessRunContext]`.
-Otherwise use canonical path from `[HarnessRunContext]` for greenfield `mode: create`.
+Otherwise use `HarnessSpawnContext` from `[HarnessRunContext]` for greenfield `mode: create`.
 ## Orchestration (required)
-1. Build `HarnessSpawnContext` JSON (`.pi/harness/specs/harness-spawn-context.schema.json`) from injected run/plan context: `run_id`, `plan_packet_path`, `task_summary`, `risk_level`, `quick`, `mode`.
-2. Spawn with **`inherit_context: false`**:
+1. Copy the `HarnessSpawnContext=…` JSON from `[HarnessRunContext]` into the spawn prompt (adjust `risk_level`, `quick`, `mode` from `$ARGUMENTS` if needed).
+2. Spawn **once** with **`inherit_context: false`**:
 ```
 Agent({ subagent_type: "harness/planner", prompt: "<task + HarnessSpawnContext JSON + output schema>" })
 ```
 3. `get_subagent_result` — parse final JSON (`status`, `plan_packet`, `human_summary`, `clarification`) via fenced `json` block.
-4. If `needs_clarification`, call `ask_user` (harness-decisions) with planner `clarification.options`, then re-spawn with answers.
-5. Present **full** human-readable plan in chat (scope, assumptions, acceptance_checks, rollback_plan, risk_level).
-6. Call `ask_user`: **Approve** / **Request changes** / **Cancel** (harness-decisions). **Do not write** until Approve.
-7. On **Request changes**, re-spawn planner with `mode: revise` and user feedback — do not write file.
-8. **Only after Approve** — write `PlanPacket` JSON to canonical `plan_packet_path`.
+4. If `status === "ready"` and user approved in the subagent (`ask_user` Approve), validate `plan_packet` fields, then **write** `PlanPacket` JSON to canonical `plan_packet_path` from `[HarnessRunContext]`.
+5. If `needs_clarification`, tell the user the planner is waiting — do **not** re-spawn; user should answer in the subagent or re-run `/harness-plan`.
+6. Do **not** call `ask_user` in this parent session for planner clarification or approval.
 ## Parent rules
-- Do not mutate project source files — only `plan-packet.json` after approval.
-- Validate draft against `.pi/harness/specs/plan-packet.schema.json` before `ask_user` Approve.
+- Do not mutate project source files — only `plan-packet.json` after subagent approval is recorded.
 - Do not embed `plan_id=` in prompts for policy sync.
+- Optional: `/harness-plan-commit` if write was blocked but approval exists.
 ## Completion
 - `plan_status`: `ready` or `needs_clarification`
 - `risk_level` used
 - `next_command`: `/harness-run` when `ready` (never `/harness-run --plan …`)
-- If `needs_clarification`, user may reply in chat or re-run `/harness-plan`

package/.pi/scripts/harness-verify.mjs CHANGED Viewed

@@ -5,7 +5,7 @@
 import { readFile, access } from "node:fs/promises";
 import { constants } from "node:fs";
-import { join, dirname } from "node:path";
+import { join, dirname, resolve } from "node:path";
 import { fileURLToPath } from "node:url";
 import { spawn } from "node:child_process";
@@ -22,6 +22,7 @@ const REQUIRED_SCHEMAS = [
 	"run-trace.schema.json",
 	"eval-verdict.schema.json",
 	"harness-spawn-context.schema.json",
+	"harness-turn.schema.json",
 ];
 const REQUIRED_ADRS = [
@@ -201,6 +202,33 @@ async function main() {
 	if (!(await fileExists(runCtxLib))) fail("missing lib/harness-run-context.ts");
 	ok("lib/harness-run-context.ts");
+	const vendoredIndex = join(
+		ROOT,
+		".pi",
+		"extensions",
+		"lib",
+		"harness-subagents",
+		"vendored",
+		"index.ts",
+	);
+	const vendoredSrc = await readFile(vendoredIndex, "utf-8");
+	const runCtxImport = vendoredSrc.match(
+		/from ["']([^"']*harness-run-context\.js)["']/,
+	);
+	if (!runCtxImport) {
+		fail("vendored/index.ts must import harness-run-context.js");
+	}
+	const runCtxImportPath = resolve(
+		dirname(vendoredIndex),
+		runCtxImport[1].replace(/\.js$/, ".ts"),
+	);
+	if (runCtxImportPath !== runCtxLib) {
+		fail(
+			`vendored/index.ts harness-run-context import resolves to ${runCtxImportPath}, expected ${runCtxLib}`,
+		);
+	}
+	ok("vendored/index.ts harness-run-context import path");
 	const policyGateSrc = await readFile(
 		join(ROOT, ".pi", "extensions", "policy-gate.ts"),
 		"utf-8",

package/CHANGELOG.md CHANGED Viewed

@@ -4,6 +4,18 @@ All notable changes to this project are documented in this file.
 ## [Unreleased]
+## [v0.9.1] — 2026-05-17
+### 🐛 Fixes
+- **npm package:** fix `harness-subagents` vendored import of `harness-run-context` (`../../../../lib`); broken installs failed with `Cannot find module '../../../lib/harness-run-context.js'`.
+## [v0.9.0] — 2026-05-17
+### ✨ Features
+- **Harness plan UX:** Pi-native `harness-turn` routing on `input` (no expanded-prompt matching); subagent `ask_user` bridged to parent UI; plan-phase budget cap 80k with debounced exhaustion events; thin `harness-plan` orchestrator with `harness-plan-commit`; `harness-turn.schema.json` and tests.
 ## [v0.8.0] — 2026-05-17
 ### ✨ Features

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
 	"name": "ultimate-pi",
-	"version": "0.8.0",
+	"version": "0.9.1",
 	"description": "Ultimate AI coding harness for pi.dev — extensible skills, Obsidian wiki knowledge layer, compressed context, deterministic output",
 	"keywords": [
 		"pi-package",
@@ -82,7 +82,7 @@
 		"format": "biome format --write",
 		"format:check": "biome format",
 		"prepare": "lefthook install",
-		"test": "node --test test/harness-verify.test.mjs test/harness-ask-user.test.mjs test/harness-subagents-loader.test.mjs test/sentrux-rules-sync.test.mjs && npx -y tsx --test test/harness-vcc-settings.test.ts test/harness-plan-phase-policy.test.mjs test/harness-subagent-policy.test.mjs",
+		"test": "node --test test/harness-verify.test.mjs test/harness-ask-user.test.mjs test/harness-subagents-loader.test.mjs test/harness-subagents-import-path.test.mjs test/sentrux-rules-sync.test.mjs test/harness-budget-guard.test.mjs && npx -y tsx --test test/harness-vcc-settings.test.ts test/harness-plan-phase-policy.test.mjs test/harness-subagent-policy.test.mjs test/harness-turn-routing.test.mjs",
 		"test:vcc": "npx -y tsx --test vendor/pi-vcc/tests/*.test.ts",
 		"harness:sentrux-bootstrap": "node .pi/scripts/harness-sentrux-bootstrap.mjs",
 		"harness:sentrux-sync": "node .pi/scripts/sentrux-rules-sync.mjs --force",