npm - pi-crew - Versions diffs - 0.1.45 → 0.1.46 - Mend

pi-crew 0.1.45 → 0.1.46

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (198)

package/README.md +5 -5
package/agents/analyst.md +1 -1
package/agents/critic.md +1 -1
package/agents/executor.md +1 -1
package/agents/explorer.md +1 -1
package/agents/planner.md +1 -1
package/agents/reviewer.md +1 -1
package/agents/security-reviewer.md +1 -1
package/agents/test-engineer.md +1 -1
package/agents/verifier.md +1 -1
package/agents/writer.md +1 -1
package/docs/next-upgrade-roadmap.md +733 -0
package/docs/refactor-tasks-phase3.md +394 -394
package/docs/refactor-tasks-phase4.md +564 -564
package/docs/refactor-tasks-phase5.md +402 -402
package/docs/refactor-tasks-phase6.md +662 -662
package/docs/research-awesome-agent-skills-distillation.md +100 -0
package/docs/research-extension-examples.md +297 -297
package/docs/research-extension-system.md +324 -324
package/docs/research-oh-my-pi-distillation.md +322 -0
package/docs/research-optimization-plan.md +548 -548
package/docs/research-phase10-distillation.md +198 -198
package/docs/research-phase11-distillation.md +201 -201
package/docs/research-pi-coding-agent.md +357 -357
package/docs/research-source-pi-crew-reference.md +174 -174
package/docs/runtime-flow.md +148 -148
package/docs/source-runtime-refactor-map.md +107 -83
package/docs/usage.md +3 -3
package/index.ts +6 -6
package/install.mjs +52 -8
package/package.json +1 -1
package/schema.json +2 -1
package/skills/async-worker-recovery/SKILL.md +42 -0
package/skills/context-artifact-hygiene/SKILL.md +52 -0
package/skills/delegation-patterns/SKILL.md +54 -0
package/skills/mailbox-interactive/SKILL.md +40 -0
package/skills/model-routing-context/SKILL.md +39 -0
package/skills/multi-perspective-review/SKILL.md +58 -0
package/skills/observability-reliability/SKILL.md +41 -0
package/skills/ownership-session-security/SKILL.md +41 -0
package/skills/pi-extension-lifecycle/SKILL.md +39 -0
package/skills/requirements-to-task-packet/SKILL.md +63 -0
package/skills/resource-discovery-config/SKILL.md +41 -0
package/skills/runtime-state-reader/SKILL.md +44 -0
package/skills/secure-agent-orchestration-review/SKILL.md +45 -0
package/skills/state-mutation-locking/SKILL.md +42 -0
package/skills/systematic-debugging/SKILL.md +67 -0
package/skills/ui-render-performance/SKILL.md +39 -0
package/skills/verification-before-done/SKILL.md +57 -0
package/skills/worktree-isolation/SKILL.md +39 -0
package/src/agents/agent-serializer.ts +34 -34
package/src/agents/discover-agents.ts +12 -11
package/src/config/config.ts +48 -24
package/src/config/defaults.ts +14 -0
package/src/extension/cross-extension-rpc.ts +82 -82
package/src/extension/project-init.ts +62 -2
package/src/extension/register.ts +11 -9
package/src/extension/registration/commands.ts +32 -25
package/src/extension/registration/compaction-guard.ts +125 -125
package/src/extension/registration/subagent-helpers.ts +8 -0
package/src/extension/registration/subagent-tools.ts +149 -148
package/src/extension/registration/team-tool.ts +8 -6
package/src/extension/run-bundle-schema.ts +89 -89
package/src/extension/run-index.ts +13 -5
package/src/extension/run-maintenance.ts +62 -43
package/src/extension/team-tool/api.ts +25 -8
package/src/extension/team-tool/cancel.ts +33 -4
package/src/extension/team-tool/context.ts +5 -0
package/src/extension/team-tool/handle-settings.ts +188 -188
package/src/extension/team-tool/inspect.ts +41 -41
package/src/extension/team-tool/lifecycle-actions.ts +91 -79
package/src/extension/team-tool/plan.ts +19 -19
package/src/extension/team-tool/respond.ts +37 -17
package/src/extension/team-tool/run.ts +52 -10
package/src/extension/team-tool/status.ts +12 -1
package/src/extension/team-tool-types.ts +2 -0
package/src/extension/team-tool.ts +32 -11
package/src/i18n.ts +184 -184
package/src/observability/event-to-metric.ts +8 -1
package/src/observability/exporters/otlp-exporter.ts +77 -77
package/src/prompt/prompt-runtime.ts +72 -72
package/src/runtime/agent-control.ts +63 -63
package/src/runtime/agent-memory.ts +72 -72
package/src/runtime/agent-observability.ts +114 -114
package/src/runtime/async-marker.ts +26 -26
package/src/runtime/attention-events.ts +28 -28
package/src/runtime/background-runner.ts +59 -53
package/src/runtime/cancellation.ts +51 -0
package/src/runtime/child-pi.ts +457 -444
package/src/runtime/completion-guard.ts +190 -190
package/src/runtime/crash-recovery.ts +1 -0
package/src/runtime/crew-agent-records.ts +38 -6
package/src/runtime/deadletter.ts +1 -0
package/src/runtime/delivery-coordinator.ts +46 -25
package/src/runtime/direct-run.ts +35 -35
package/src/runtime/effectiveness.ts +76 -0
package/src/runtime/foreground-control.ts +82 -82
package/src/runtime/green-contract.ts +46 -46
package/src/runtime/group-join.ts +106 -106
package/src/runtime/heartbeat-gradient.ts +28 -28
package/src/runtime/heartbeat-watcher.ts +124 -124
package/src/runtime/live-agent-control.ts +88 -87
package/src/runtime/live-agent-manager.ts +103 -85
package/src/runtime/live-control-realtime.ts +36 -36
package/src/runtime/live-session-runtime.ts +309 -305
package/src/runtime/manifest-cache.ts +17 -2
package/src/runtime/model-fallback.ts +6 -4
package/src/runtime/parallel-research.ts +44 -44
package/src/runtime/pi-args.ts +18 -3
package/src/runtime/pi-json-output.ts +111 -111
package/src/runtime/policy-engine.ts +79 -79
package/src/runtime/process-status.ts +5 -1
package/src/runtime/progress-event-coalescer.ts +43 -43
package/src/runtime/recovery-recipes.ts +74 -74
package/src/runtime/retry-executor.ts +81 -64
package/src/runtime/role-permission.ts +39 -39
package/src/runtime/runtime-resolver.ts +22 -6
package/src/runtime/session-resources.ts +25 -25
package/src/runtime/session-snapshot.ts +59 -59
package/src/runtime/session-usage.ts +79 -79
package/src/runtime/sidechain-output.ts +29 -29
package/src/runtime/skill-instructions.ts +222 -0
package/src/runtime/stale-reconciler.ts +4 -14
package/src/runtime/subagent-manager.ts +3 -0
package/src/runtime/supervisor-contact.ts +59 -59
package/src/runtime/task-display.ts +38 -38
package/src/runtime/task-output-context.ts +127 -127
package/src/runtime/task-runner/capabilities.ts +78 -0
package/src/runtime/task-runner/live-executor.ts +105 -101
package/src/runtime/task-runner/progress.ts +119 -119
package/src/runtime/task-runner/prompt-builder.ts +3 -1
package/src/runtime/task-runner/prompt-pipeline.ts +64 -0
package/src/runtime/task-runner/result-utils.ts +14 -14
package/src/runtime/task-runner/state-helpers.ts +22 -22
package/src/runtime/task-runner.ts +44 -5
package/src/runtime/team-runner.ts +78 -15
package/src/runtime/worker-heartbeat.ts +21 -21
package/src/runtime/worker-startup.ts +57 -57
package/src/schema/config-schema.ts +1 -0
package/src/schema/team-tool-schema.ts +3 -3
package/src/state/active-run-registry.ts +165 -0
package/src/state/contracts.ts +1 -1
package/src/state/mailbox.ts +44 -4
package/src/state/state-store.ts +8 -1
package/src/state/task-claims.ts +44 -44
package/src/state/types.ts +44 -2
package/src/state/usage.ts +29 -29
package/src/subagents/async-entry.ts +1 -1
package/src/subagents/index.ts +3 -3
package/src/subagents/live/control.ts +1 -1
package/src/subagents/live/manager.ts +1 -1
package/src/subagents/live/realtime.ts +1 -1
package/src/subagents/live/session-runtime.ts +1 -1
package/src/subagents/manager.ts +1 -1
package/src/subagents/spawn.ts +1 -1
package/src/teams/team-config.ts +1 -0
package/src/teams/team-serializer.ts +38 -38
package/src/types/diff.d.ts +18 -18
package/src/ui/crew-footer.ts +101 -101
package/src/ui/crew-select-list.ts +111 -111
package/src/ui/crew-widget.ts +4 -3
package/src/ui/dashboard-panes/metrics-pane.ts +34 -34
package/src/ui/dashboard-panes/progress-pane.ts +2 -0
package/src/ui/dynamic-border.ts +25 -25
package/src/ui/layout-primitives.ts +106 -106
package/src/ui/loaders.ts +158 -158
package/src/ui/render-diff.ts +119 -119
package/src/ui/render-scheduler.ts +143 -143
package/src/ui/run-snapshot-cache.ts +10 -2
package/src/ui/snapshot-types.ts +2 -0
package/src/ui/spinner.ts +17 -17
package/src/ui/status-colors.ts +58 -58
package/src/ui/syntax-highlight.ts +116 -116
package/src/utils/atomic-write.ts +33 -33
package/src/utils/completion-dedupe.ts +63 -63
package/src/utils/frontmatter.ts +68 -68
package/src/utils/git.ts +262 -262
package/src/utils/ids.ts +12 -12
package/src/utils/names.ts +27 -27
package/src/utils/paths.ts +4 -2
package/src/utils/redaction.ts +44 -44
package/src/utils/safe-paths.ts +47 -47
package/src/utils/sleep.ts +32 -32
package/src/workflows/validate-workflow.ts +40 -40
package/src/workflows/workflow-config.ts +1 -0
package/src/worktree/branch-freshness.ts +45 -45
package/teams/default.team.md +12 -12
package/teams/fast-fix.team.md +11 -11
package/teams/implementation.team.md +18 -18
package/teams/parallel-research.team.md +14 -14
package/teams/research.team.md +11 -11
package/teams/review.team.md +12 -12
package/workflows/default.workflow.md +29 -29
package/workflows/fast-fix.workflow.md +22 -22
package/workflows/implementation.workflow.md +38 -38
package/workflows/parallel-research.workflow.md +46 -46
package/workflows/research.workflow.md +22 -22
package/workflows/review.workflow.md +30 -30

package/src/runtime/completion-guard.ts CHANGED Viewed

@@ -1,190 +1,190 @@
-import * as fs from "node:fs";
-import type { TeamTaskState, TeamRunManifest } from "../state/types.ts";
-// ============================================================================
-// Phase 1.2: Completion Mutation Guard — detects tasks that claim success but
-// made no observable mutations. Used by task-runner.ts.
-// ============================================================================
-export interface CompletionMutationGuardInput {
-	role: string;
-	taskText?: string;
-	transcriptPath?: string;
-	stdout?: string;
-}
-export interface CompletionMutationGuardResult {
-	expectedMutation: boolean;
-	observedMutation: boolean;
-	reason?: "no_mutation_observed";
-	observedTools: string[];
-}
-const MUTATING_ROLES = new Set(["executor", "test-engineer"]);
-const MUTATING_TOOLS = new Set(["edit", "write", "multi_edit", "apply_patch", "replace_in_file", "insert", "delete_files", "create_file", "overwrite", "patch"]);
-const READ_ONLY_COMMANDS = /^(pwd|ls|dir|cat|type|sed|grep|rg|find|git\s+(status|diff|log|show|branch|remote|rev-parse|ls-files)|npm\s+(test|run\s+(typecheck|check|lint|test|ci))|node\s+--test)\b/i;
-const MUTATING_COMMANDS = /\b(rm\s+-|del\s+|erase\s+|mv\s+|move\s+|cp\s+|copy\s+|mkdir\b|touch\b|git\s+(add|commit|push|reset|clean|checkout|switch|merge|rebase|stash)|npm\s+(install|i|uninstall|publish|version)|pnpm\s+(add|install|remove)|yarn\s+(add|install|remove)|python\b.*>|node\b.*>|echo\b.*>|Set-Content|Out-File|sed\s+-i|tee\b|dd\b.*of=|wget\b.*-O|curl\b.*-o)\b/i;
-const READ_ONLY_HINTS = /\b(read-only|no edits?|do not edit|không sửa|khong sua|chỉ đọc|chi doc|plan only|chỉ lập plan|review only|audit only)\b/i;
-function asRecord(value: unknown): Record<string, unknown> | undefined {
-	return value && typeof value === "object" && !Array.isArray(value) ? value as Record<string, unknown> : undefined;
-}
-function commandText(value: unknown): string {
-	const record = asRecord(value);
-	if (!record) return typeof value === "string" ? value : "";
-	for (const key of ["command", "cmd", "script", "input"]) {
-		const raw = record[key];
-		if (typeof raw === "string") return raw;
-	}
-	return JSON.stringify(record);
-}
-function isMutatingTool(tool: string, args: unknown): boolean {
-	const normalized = tool.toLowerCase();
-	if (MUTATING_TOOLS.has(normalized)) return true;
-	if (normalized === "bash" || normalized === "shell" || normalized === "powershell") {
-		const command = commandText(args).trim();
-		if (!command) return false;
-		// Check mutating patterns first: sed -i is mutating even though plain sed is read-only.
-		if (MUTATING_COMMANDS.test(command)) return true;
-		if (READ_ONLY_COMMANDS.test(command)) return false;
-		// If the command doesn't match either list, treat unknown bash calls as potentially mutating.
-		return true;
-	}
-	return false;
-}
-function collectToolCallsFromEvent(event: unknown): Array<{ tool: string; args?: unknown }> {
-	const record = asRecord(event);
-	if (!record) return [];
-	const calls: Array<{ tool: string; args?: unknown }> = [];
-	const directTool = record.toolName ?? record.name ?? record.tool;
-	if (typeof directTool === "string" && (record.type === "tool_execution_start" || record.type === "toolCall" || record.type === "tool_call")) {
-		calls.push({ tool: directTool, args: record.args ?? record.input });
-	}
-	const content = Array.isArray(record.content) ? record.content : asRecord(record.message)?.content;
-	if (Array.isArray(content)) {
-		for (const part of content) {
-			const item = asRecord(part);
-			if (!item) continue;
-			const tool = item.name ?? item.toolName ?? item.tool;
-			if (typeof tool === "string" && (item.type === "toolCall" || item.type === "tool_call" || item.type === "tool_execution_start")) calls.push({ tool, args: item.input ?? item.args });
-		}
-	}
-	return calls;
-}
-function transcriptText(input: CompletionMutationGuardInput): string {
-	if (input.transcriptPath && fs.existsSync(input.transcriptPath)) return fs.readFileSync(input.transcriptPath, "utf-8");
-	return input.stdout ?? "";
-}
-export function expectsImplementationMutation(input: Pick<CompletionMutationGuardInput, "role" | "taskText">): boolean {
-	if (!MUTATING_ROLES.has(input.role)) return false;
-	return !READ_ONLY_HINTS.test(input.taskText ?? "");
-}
-export function evaluateCompletionMutationGuard(input: CompletionMutationGuardInput): CompletionMutationGuardResult {
-	const expectedMutation = expectsImplementationMutation(input);
-	const observedTools: string[] = [];
-	let observedMutation = false;
-	const text = transcriptText(input);
-	for (const line of text.split("\n")) {
-		const trimmed = line.trim();
-		if (!trimmed) continue;
-		let event: unknown;
-		try { event = JSON.parse(trimmed); } catch { continue; }
-		for (const call of collectToolCallsFromEvent(event)) {
-			observedTools.push(call.tool);
-			if (isMutatingTool(call.tool, call.args)) observedMutation = true;
-		}
-	}
-	return {
-		expectedMutation,
-		observedMutation,
-		observedTools,
-		...(expectedMutation && !observedMutation ? { reason: "no_mutation_observed" as const } : {}),
-	};
-}
-// ============================================================================
-// Phase 11a: Artifact-based Completion Verification — a second layer that
-// checks whether a completed task actually produced meaningful artifacts.
-// ============================================================================
-/**
- * Guard against false-positive task completions.
- *
- * Checks whether a task that claims success actually produced meaningful output.
- * Returns a verification result with the green level (0-3) and any warnings.
- */
-export interface CompletionVerifyResult {
-	/** 0 = no output, 1 = minimal, 2 = moderate, 3 = strong */
-	greenLevel: number;
-	/** Warnings about potentially incomplete work */
-	warnings: string[];
-}
-const MAX_OUTPUT_PREVIEW = 200;
-function isTrivialError(error: string | undefined): boolean {
-	if (!error) return false;
-	return error.trim().length === 0;
-}
-export function verifyTaskCompletion(
-	task: TeamTaskState,
-	manifest: TeamRunManifest,
-): CompletionVerifyResult {
-	const warnings: string[] = [];
-	let greenLevel = 0;
-	// Check 1: Has an error?
-	if (task.error && !isTrivialError(task.error)) {
-		return { greenLevel: 0, warnings: [`Task has error: ${task.error}`] };
-	}
-	// Check 2: Has result artifact?
-	if (task.resultArtifact) {
-		greenLevel += 1;
-	}
-	// Check 3: Has transcript?
-	if (task.transcriptArtifact) {
-		greenLevel += 1;
-	}
-	// Check 4: For implementation tasks, verify artifacts were actually produced
-	const runArtifacts = manifest.artifacts.filter(
-		(a) => a.producer === task.id || a.producer === task.agent,
-	);
-	if (runArtifacts.length > 0) {
-		greenLevel += 1;
-	} else if (greenLevel < 3) {
-		warnings.push("No run-level artifacts produced by this task");
-	}
-	// Check 5: Usage tracking — did the task actually consume tokens?
-	if (task.usage) {
-		const totalTokens = (task.usage.input ?? 0) + (task.usage.output ?? 0);
-		if (totalTokens === 0 && greenLevel < 3) {
-			warnings.push("Task reports zero token usage — may not have executed");
-		}
-	}
-	return {
-		greenLevel: Math.min(greenLevel, 3),
-		warnings,
-	};
-}
-/**
- * Format a preview of task output for diagnostic display.
- */
-export function formatOutputPreview(output: string | undefined): string {
-	if (!output) return "(no output)";
-	const trimmed = output.trim();
-	if (trimmed.length <= MAX_OUTPUT_PREVIEW) return trimmed;
-	return trimmed.slice(0, MAX_OUTPUT_PREVIEW) + "...";
-}
+import * as fs from "node:fs";
+import type { TeamTaskState, TeamRunManifest } from "../state/types.ts";
+// ============================================================================
+// Phase 1.2: Completion Mutation Guard — detects tasks that claim success but
+// made no observable mutations. Used by task-runner.ts.
+// ============================================================================
+export interface CompletionMutationGuardInput {
+	role: string;
+	taskText?: string;
+	transcriptPath?: string;
+	stdout?: string;
+}
+export interface CompletionMutationGuardResult {
+	expectedMutation: boolean;
+	observedMutation: boolean;
+	reason?: "no_mutation_observed";
+	observedTools: string[];
+}
+const MUTATING_ROLES = new Set(["executor", "test-engineer"]);
+const MUTATING_TOOLS = new Set(["edit", "write", "multi_edit", "apply_patch", "replace_in_file", "insert", "delete_files", "create_file", "overwrite", "patch"]);
+const READ_ONLY_COMMANDS = /^(pwd|ls|dir|cat|type|sed|grep|rg|find|git\s+(status|diff|log|show|branch|remote|rev-parse|ls-files)|npm\s+(test|run\s+(typecheck|check|lint|test|ci))|node\s+--test)\b/i;
+const MUTATING_COMMANDS = /\b(rm\s+-|del\s+|erase\s+|mv\s+|move\s+|cp\s+|copy\s+|mkdir\b|touch\b|git\s+(add|commit|push|reset|clean|checkout|switch|merge|rebase|stash)|npm\s+(install|i|uninstall|publish|version)|pnpm\s+(add|install|remove)|yarn\s+(add|install|remove)|python\b.*>|node\b.*>|echo\b.*>|Set-Content|Out-File|sed\s+-i|tee\b|dd\b.*of=|wget\b.*-O|curl\b.*-o)\b/i;
+const READ_ONLY_HINTS = /\b(read-only|no edits?|do not edit|không sửa|khong sua|chỉ đọc|chi doc|plan only|chỉ lập plan|review only|audit only)\b/i;
+function asRecord(value: unknown): Record<string, unknown> | undefined {
+	return value && typeof value === "object" && !Array.isArray(value) ? value as Record<string, unknown> : undefined;
+}
+function commandText(value: unknown): string {
+	const record = asRecord(value);
+	if (!record) return typeof value === "string" ? value : "";
+	for (const key of ["command", "cmd", "script", "input"]) {
+		const raw = record[key];
+		if (typeof raw === "string") return raw;
+	}
+	return JSON.stringify(record);
+}
+function isMutatingTool(tool: string, args: unknown): boolean {
+	const normalized = tool.toLowerCase();
+	if (MUTATING_TOOLS.has(normalized)) return true;
+	if (normalized === "bash" || normalized === "shell" || normalized === "powershell") {
+		const command = commandText(args).trim();
+		if (!command) return false;
+		// Check mutating patterns first: sed -i is mutating even though plain sed is read-only.
+		if (MUTATING_COMMANDS.test(command)) return true;
+		if (READ_ONLY_COMMANDS.test(command)) return false;
+		// If the command doesn't match either list, treat unknown bash calls as potentially mutating.
+		return true;
+	}
+	return false;
+}
+function collectToolCallsFromEvent(event: unknown): Array<{ tool: string; args?: unknown }> {
+	const record = asRecord(event);
+	if (!record) return [];
+	const calls: Array<{ tool: string; args?: unknown }> = [];
+	const directTool = record.toolName ?? record.name ?? record.tool;
+	if (typeof directTool === "string" && (record.type === "tool_execution_start" || record.type === "toolCall" || record.type === "tool_call")) {
+		calls.push({ tool: directTool, args: record.args ?? record.input });
+	}
+	const content = Array.isArray(record.content) ? record.content : asRecord(record.message)?.content;
+	if (Array.isArray(content)) {
+		for (const part of content) {
+			const item = asRecord(part);
+			if (!item) continue;
+			const tool = item.name ?? item.toolName ?? item.tool;
+			if (typeof tool === "string" && (item.type === "toolCall" || item.type === "tool_call" || item.type === "tool_execution_start")) calls.push({ tool, args: item.input ?? item.args });
+		}
+	}
+	return calls;
+}
+function transcriptText(input: CompletionMutationGuardInput): string {
+	if (input.transcriptPath && fs.existsSync(input.transcriptPath)) return fs.readFileSync(input.transcriptPath, "utf-8");
+	return input.stdout ?? "";
+}
+export function expectsImplementationMutation(input: Pick<CompletionMutationGuardInput, "role" | "taskText">): boolean {
+	if (!MUTATING_ROLES.has(input.role)) return false;
+	return !READ_ONLY_HINTS.test(input.taskText ?? "");
+}
+export function evaluateCompletionMutationGuard(input: CompletionMutationGuardInput): CompletionMutationGuardResult {
+	const expectedMutation = expectsImplementationMutation(input);
+	const observedTools: string[] = [];
+	let observedMutation = false;
+	const text = transcriptText(input);
+	for (const line of text.split("\n")) {
+		const trimmed = line.trim();
+		if (!trimmed) continue;
+		let event: unknown;
+		try { event = JSON.parse(trimmed); } catch { continue; }
+		for (const call of collectToolCallsFromEvent(event)) {
+			observedTools.push(call.tool);
+			if (isMutatingTool(call.tool, call.args)) observedMutation = true;
+		}
+	}
+	return {
+		expectedMutation,
+		observedMutation,
+		observedTools,
+		...(expectedMutation && !observedMutation ? { reason: "no_mutation_observed" as const } : {}),
+	};
+}
+// ============================================================================
+// Phase 11a: Artifact-based Completion Verification — a second layer that
+// checks whether a completed task actually produced meaningful artifacts.
+// ============================================================================
+/**
+ * Guard against false-positive task completions.
+ *
+ * Checks whether a task that claims success actually produced meaningful output.
+ * Returns a verification result with the green level (0-3) and any warnings.
+ */
+export interface CompletionVerifyResult {
+	/** 0 = no output, 1 = minimal, 2 = moderate, 3 = strong */
+	greenLevel: number;
+	/** Warnings about potentially incomplete work */
+	warnings: string[];
+}
+const MAX_OUTPUT_PREVIEW = 200;
+function isTrivialError(error: string | undefined): boolean {
+	if (!error) return false;
+	return error.trim().length === 0;
+}
+export function verifyTaskCompletion(
+	task: TeamTaskState,
+	manifest: TeamRunManifest,
+): CompletionVerifyResult {
+	const warnings: string[] = [];
+	let greenLevel = 0;
+	// Check 1: Has an error?
+	if (task.error && !isTrivialError(task.error)) {
+		return { greenLevel: 0, warnings: [`Task has error: ${task.error}`] };
+	}
+	// Check 2: Has result artifact?
+	if (task.resultArtifact) {
+		greenLevel += 1;
+	}
+	// Check 3: Has transcript?
+	if (task.transcriptArtifact) {
+		greenLevel += 1;
+	}
+	// Check 4: For implementation tasks, verify artifacts were actually produced
+	const runArtifacts = manifest.artifacts.filter(
+		(a) => a.producer === task.id || a.producer === task.agent,
+	);
+	if (runArtifacts.length > 0) {
+		greenLevel += 1;
+	} else if (greenLevel < 3) {
+		warnings.push("No run-level artifacts produced by this task");
+	}
+	// Check 5: Usage tracking — did the task actually consume tokens?
+	if (task.usage) {
+		const totalTokens = (task.usage.input ?? 0) + (task.usage.output ?? 0);
+		if (totalTokens === 0 && greenLevel < 3) {
+			warnings.push("Task reports zero token usage — may not have executed");
+		}
+	}
+	return {
+		greenLevel: Math.min(greenLevel, 3),
+		warnings,
+	};
+}
+/**
+ * Format a preview of task output for diagnostic display.
+ */
+export function formatOutputPreview(output: string | undefined): string {
+	if (!output) return "(no output)";
+	const trimmed = output.trim();
+	if (trimmed.length <= MAX_OUTPUT_PREVIEW) return trimmed;
+	return trimmed.slice(0, MAX_OUTPUT_PREVIEW) + "...";
+}

package/src/runtime/crash-recovery.ts CHANGED Viewed

@@ -75,6 +75,7 @@ export function reconcileAllStaleRuns(cwd: string, manifestCache: ManifestCache,
 			if (!fresh || fresh.manifest.status !== "running") return;
 			const result = reconcileStaleRun(fresh.manifest, fresh.tasks, now);
 			if (result.repaired) {
+				if (result.repairedTasks) saveRunTasks(fresh.manifest, result.repairedTasks);
 				updateRunStatus(fresh.manifest, "failed", `Stale run reconciled: ${result.detail}`);
 				appendEvent(fresh.manifest.eventsPath, { type: "crew.run.reconciled_stale", runId: manifest.runId, message: result.detail, data: { verdict: result.verdict } });
 			}

package/src/runtime/crew-agent-records.ts CHANGED Viewed

@@ -61,6 +61,23 @@ export function agentOutputPath(manifest: TeamRunManifest, taskId: string): stri
 }
 const AGENT_READER_TTL_MS = 200;
+const ASYNC_AGENT_READER_CACHE_MAX_ENTRIES = 128;
+const asyncAgentReaderCache = new Map<string, { expiresAt: number; records: CrewAgentRecord[]; inFlight?: Promise<CrewAgentRecord[]> }>();
+function setAsyncAgentReaderCache(filePath: string, entry: { expiresAt: number; records: CrewAgentRecord[]; inFlight?: Promise<CrewAgentRecord[]> }): void {
+	const now = Date.now();
+	for (const [key, cached] of asyncAgentReaderCache) {
+		if (cached.expiresAt <= now && !cached.inFlight) asyncAgentReaderCache.delete(key);
+	}
+	if (asyncAgentReaderCache.has(filePath)) asyncAgentReaderCache.delete(filePath);
+	asyncAgentReaderCache.set(filePath, entry);
+	while (asyncAgentReaderCache.size > ASYNC_AGENT_READER_CACHE_MAX_ENTRIES) {
+		const oldest = asyncAgentReaderCache.keys().next().value;
+		if (!oldest) break;
+		asyncAgentReaderCache.delete(oldest);
+	}
+}
 export function readCrewAgents(manifest: TeamRunManifest): CrewAgentRecord[] {
 	try {
@@ -71,16 +88,31 @@ export function readCrewAgents(manifest: TeamRunManifest): CrewAgentRecord[] {
 }
 export async function readCrewAgentsAsync(manifest: TeamRunManifest): Promise<CrewAgentRecord[]> {
-	try {
-		return JSON.parse(await fs.promises.readFile(agentsPath(manifest), "utf-8")) as CrewAgentRecord[];
-	} catch {
-		return [];
-	}
+	const filePath = agentsPath(manifest);
+	const now = Date.now();
+	const cached = asyncAgentReaderCache.get(filePath);
+	if (cached && cached.expiresAt > now) return cached.records;
+	if (cached?.inFlight) return cached.inFlight;
+	const inFlight = (async (): Promise<CrewAgentRecord[]> => {
+		try {
+			const parsed = JSON.parse(await fs.promises.readFile(filePath, "utf-8")) as unknown;
+			const records = Array.isArray(parsed) ? redactSecrets(parsed) as CrewAgentRecord[] : [];
+			setAsyncAgentReaderCache(filePath, { expiresAt: Date.now() + AGENT_READER_TTL_MS, records });
+			return records;
+		} catch {
+			setAsyncAgentReaderCache(filePath, { expiresAt: Date.now() + AGENT_READER_TTL_MS, records: [] });
+			return [];
+		}
+	})();
+	setAsyncAgentReaderCache(filePath, { expiresAt: now + AGENT_READER_TTL_MS, records: cached?.records ?? [], inFlight });
+	return inFlight;
 }
 export function saveCrewAgents(manifest: TeamRunManifest, records: CrewAgentRecord[]): void {
 	fs.mkdirSync(manifest.stateRoot, { recursive: true });
-	atomicWriteJson(agentsPath(manifest), redactSecrets(records));
+	const filePath = agentsPath(manifest);
+	atomicWriteJson(filePath, redactSecrets(records));
+	asyncAgentReaderCache.delete(filePath);
 	for (const record of records) writeCrewAgentStatus(manifest, record);
 }

package/src/runtime/deadletter.ts CHANGED Viewed

@@ -12,6 +12,7 @@ export interface DeadletterEntry {
 	reason: DeadletterReason;
 	attempts: number;
 	lastError?: string;
+	attemptId?: string;
 	timestamp: string;
 }

package/src/runtime/delivery-coordinator.ts CHANGED Viewed

@@ -25,6 +25,7 @@ export class DeliveryCoordinator {
 	private active = false;
 	private generation = 0;
 	private pending: PendingDelivery[] = [];
+	private flushing = false;
 	private readonly deps: DeliveryCoordinatorDeps;
 	private ttlTimer: ReturnType<typeof setInterval> | undefined;
@@ -63,7 +64,7 @@ export class DeliveryCoordinator {
 				logInternalError("delivery-coordinator.deliverResult", error, `runId=${runId}`);
 			}
 		}
-		this.enqueue({ runId, payload: result, timestamp: Date.now(), type: "result" });
+		if (!this.flushing) this.enqueue({ runId, payload: result, timestamp: Date.now(), type: "result" });
 	}
 	deliverNotification(notification: NotificationDescriptor): void {
@@ -84,7 +85,7 @@ export class DeliveryCoordinator {
 			}
 			return;
 		}
-		this.enqueue({ runId: notification.runId ?? "", payload: notification, timestamp: Date.now(), type: "notification" });
+		if (!this.flushing) this.enqueue({ runId: notification.runId ?? "", payload: notification, timestamp: Date.now(), type: "notification" });
 	}
 	deliverSteer(runId: string, message: string): void {
@@ -96,36 +97,30 @@ export class DeliveryCoordinator {
 				logInternalError("delivery-coordinator.deliverSteer", error, `runId=${runId}`);
 			}
 		}
-		this.enqueue({ runId, payload: message, timestamp: Date.now(), type: "steer" });
+		if (!this.flushing) this.enqueue({ runId, payload: message, timestamp: Date.now(), type: "steer" });
 	}
 	flushQueuedResults(): void {
 		if (!this.active || this.pending.length === 0) return;
 		const batch = this.pending.splice(0);
-		for (const delivery of batch) {
-			if (delivery.generation !== undefined && delivery.generation !== this.generation) {
-				logInternalError("delivery-coordinator.flush.stale", undefined, `runId=${delivery.runId} type=${delivery.type}`);
-				continue;
-			}
-			try {
-				switch (delivery.type) {
-					case "result":
-						this.deliverResult(delivery.runId, delivery.payload);
-						break;
-					case "notification": {
-						const notification = delivery.payload as NotificationDescriptor;
-						this.deliverNotification(notification);
-						break;
-					}
-					case "steer": {
-						const message = typeof delivery.payload === "string" ? delivery.payload : String(delivery.payload);
-						this.deliverSteer(delivery.runId, message);
-						break;
-					}
+		this.flushing = true;
+		try {
+			const retryLater: PendingDelivery[] = [];
+			for (const delivery of batch) {
+				if (delivery.type === "steer" && delivery.generation !== undefined && delivery.generation !== this.generation) {
+					logInternalError("delivery-coordinator.flush.stale", undefined, `runId=${delivery.runId} type=${delivery.type}`);
+					continue;
+				}
+				try {
+					if (!this.deliverQueued(delivery)) retryLater.push({ ...delivery, generation: this.generation });
+				} catch (error) {
+					logInternalError("delivery-coordinator.flush", error, `runId=${delivery.runId} type=${delivery.type}`);
+					retryLater.push({ ...delivery, generation: this.generation });
 				}
-			} catch (error) {
-				logInternalError("delivery-coordinator.flush", error, `runId=${delivery.runId} type=${delivery.type}`);
 			}
+			this.pending.unshift(...retryLater);
+		} finally {
+			this.flushing = false;
 		}
 	}
@@ -138,6 +133,32 @@ export class DeliveryCoordinator {
 		}
 	}
+	private deliverQueued(delivery: PendingDelivery): boolean {
+		switch (delivery.type) {
+			case "result":
+				if (!this.deps.emit) return false;
+				this.deps.emit("pi-crew:run-result", delivery.payload);
+				return true;
+			case "notification": {
+				const notification = delivery.payload as NotificationDescriptor;
+				if (!this.deps.sendFollowUp) return false;
+				this.deps.sendFollowUp(notification.title, notification.body ?? "");
+				try {
+					this.deps.emit?.("pi-crew:notification", notification);
+				} catch {
+					// Secondary event delivery must not consume the user-facing notification.
+				}
+				return true;
+			}
+			case "steer": {
+				if (!this.deps.sendWakeUp) return false;
+				const message = typeof delivery.payload === "string" ? delivery.payload : String(delivery.payload);
+				this.deps.sendWakeUp(message);
+				return true;
+			}
+		}
+	}
 	private enqueue(delivery: PendingDelivery): void {
 		this.pending.push({ ...delivery, generation: this.generation });
 	}

package/src/runtime/direct-run.ts CHANGED Viewed

@@ -1,35 +1,35 @@
-import type { AgentConfig } from "../agents/agent-config.ts";
-import type { TeamRunManifest, TeamTaskState } from "../state/types.ts";
-import type { TeamConfig } from "../teams/team-config.ts";
-import type { WorkflowConfig } from "../workflows/workflow-config.ts";
-export function isDirectRun(manifest: Pick<TeamRunManifest, "team" | "workflow">): boolean {
-	return manifest.workflow === "direct-agent";
-}
-export function directTeamAndWorkflowFromRun(manifest: TeamRunManifest, tasks: TeamTaskState[], agents: AgentConfig[]): { team: TeamConfig; workflow: WorkflowConfig } | undefined {
-	if (!isDirectRun(manifest)) return undefined;
-	const firstTask = tasks[0];
-	const agentName = firstTask?.agent ?? (manifest.team.replace(/^direct-/, "") || "executor");
-	const agent = agents.find((candidate) => candidate.name === agentName);
-	const role = firstTask?.role ?? "agent";
-	const stepId = firstTask?.stepId ?? "01_agent";
-	return {
-		team: {
-			name: manifest.team,
-			description: `Direct subagent run for ${agentName}`,
-			source: "builtin",
-			filePath: "<generated>",
-			roles: [{ name: role, agent: agentName, description: agent?.description }],
-			defaultWorkflow: "direct-agent",
-			workspaceMode: manifest.workspaceMode,
-		},
-		workflow: {
-			name: manifest.workflow ?? "direct-agent",
-			description: `Direct task for ${agentName}`,
-			source: "builtin",
-			filePath: "<generated>",
-			steps: [{ id: stepId, role, task: "{goal}", model: firstTask?.model }],
-		},
-	};
-}
+import type { AgentConfig } from "../agents/agent-config.ts";
+import type { TeamRunManifest, TeamTaskState } from "../state/types.ts";
+import type { TeamConfig } from "../teams/team-config.ts";
+import type { WorkflowConfig } from "../workflows/workflow-config.ts";
+export function isDirectRun(manifest: Pick<TeamRunManifest, "team" | "workflow">): boolean {
+	return manifest.workflow === "direct-agent";
+}
+export function directTeamAndWorkflowFromRun(manifest: TeamRunManifest, tasks: TeamTaskState[], agents: AgentConfig[]): { team: TeamConfig; workflow: WorkflowConfig } | undefined {
+	if (!isDirectRun(manifest)) return undefined;
+	const firstTask = tasks[0];
+	const agentName = firstTask?.agent ?? (manifest.team.replace(/^direct-/, "") || "executor");
+	const agent = agents.find((candidate) => candidate.name === agentName);
+	const role = firstTask?.role ?? "agent";
+	const stepId = firstTask?.stepId ?? "01_agent";
+	return {
+		team: {
+			name: manifest.team,
+			description: `Direct subagent run for ${agentName}`,
+			source: "builtin",
+			filePath: "<generated>",
+			roles: [{ name: role, agent: agentName, description: agent?.description }],
+			defaultWorkflow: "direct-agent",
+			workspaceMode: manifest.workspaceMode,
+		},
+		workflow: {
+			name: manifest.workflow ?? "direct-agent",
+			description: `Direct task for ${agentName}`,
+			source: "builtin",
+			filePath: "<generated>",
+			steps: [{ id: stepId, role, task: "{goal}", model: firstTask?.model }],
+		},
+	};
+}