npm - pi-crew - Versions diffs - 0.5.2 → 0.5.6 - Mend

pi-crew 0.5.2 → 0.5.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (137) hide show

package/CHANGELOG.md +183 -0
package/README.md +17 -1
package/docs/architecture.md +2 -0
package/docs/bugs/cross-session-notification-leakage.md +82 -0
package/docs/coding-agent-optimization.md +268 -0
package/docs/deep-review-report.md +384 -0
package/docs/distillation/cybersecurity-patterns.md +294 -0
package/docs/migration-v0.4-v0.5.md +208 -0
package/docs/optimization-plan.md +642 -0
package/docs/pi-crew-v0.5.5-audit-fix-plan.md +133 -0
package/docs/pi-mono-opportunities.md +969 -0
package/docs/pi-mono-review.md +291 -0
package/docs/skills/REFERENCE.md +144 -0
package/package.json +12 -9
package/skills/artifact-analysis-loop/SKILL.md +302 -0
package/skills/async-worker-recovery/SKILL.md +19 -1
package/skills/child-pi-spawning/SKILL.md +19 -6
package/skills/context-artifact-hygiene/SKILL.md +19 -2
package/skills/delegation-patterns/SKILL.md +68 -3
package/skills/detection-pipeline-design/SKILL.md +285 -0
package/skills/event-log-tracing/SKILL.md +20 -6
package/skills/git-master/SKILL.md +20 -6
package/skills/hunting-investigation-loop/SKILL.md +401 -0
package/skills/incident-playbook-construction/SKILL.md +383 -0
package/skills/live-agent-lifecycle/SKILL.md +20 -6
package/skills/mailbox-interactive/SKILL.md +19 -6
package/skills/model-routing-context/SKILL.md +19 -1
package/skills/multi-perspective-review/SKILL.md +19 -4
package/skills/observability-reliability/SKILL.md +19 -2
package/skills/orchestration/SKILL.md +20 -2
package/skills/ownership-session-security/SKILL.md +20 -2
package/skills/pi-extension-lifecycle/SKILL.md +20 -2
package/skills/post-mortem/SKILL.md +7 -2
package/skills/read-only-explorer/SKILL.md +20 -6
package/skills/requirements-to-task-packet/SKILL.md +23 -3
package/skills/resource-discovery-config/SKILL.md +20 -2
package/skills/runtime-state-reader/SKILL.md +20 -2
package/skills/safe-bash/SKILL.md +21 -6
package/skills/scrutinize/SKILL.md +20 -2
package/skills/secure-agent-orchestration-review/SKILL.md +29 -2
package/skills/security-review/SKILL.md +560 -0
package/skills/state-mutation-locking/SKILL.md +22 -2
package/skills/systematic-debugging/SKILL.md +8 -6
package/skills/threat-hypothesis-framework/SKILL.md +175 -0
package/skills/ui-render-performance/SKILL.md +20 -2
package/skills/verification-before-done/SKILL.md +17 -2
package/skills/widget-rendering/SKILL.md +21 -6
package/skills/workspace-isolation/SKILL.md +20 -6
package/skills/worktree-isolation/SKILL.md +20 -6
package/src/agents/agent-config.ts +40 -1
package/src/benchmark/benchmark-runner.ts +45 -0
package/src/benchmark/feedback-loop.ts +5 -0
package/src/config/config.ts +32 -5
package/src/config/role-tools.ts +82 -0
package/src/config/suggestions.ts +8 -0
package/src/config/types.ts +4 -0
package/src/extension/async-notifier.ts +10 -1
package/src/extension/crew-cleanup.ts +114 -0
package/src/extension/cross-extension-rpc.ts +1 -1
package/src/extension/notification-router.ts +18 -0
package/src/extension/register.ts +27 -19
package/src/extension/registration/subagent-tools.ts +1 -1
package/src/extension/team-tool/anchor.ts +201 -0
package/src/extension/team-tool/api.ts +2 -1
package/src/extension/team-tool/auto-summarize.ts +154 -0
package/src/extension/team-tool/run.ts +42 -7
package/src/extension/team-tool.ts +44 -2
package/src/hooks/registry.ts +1 -3
package/src/observability/event-bus.ts +69 -0
package/src/observability/event-to-metric.ts +0 -2
package/src/runtime/anchor-manager.ts +473 -0
package/src/runtime/async-runner.ts +8 -4
package/src/runtime/auto-summarize.ts +350 -0
package/src/runtime/background-runner.ts +10 -3
package/src/runtime/budget-tracker.ts +354 -0
package/src/runtime/chain-runner.ts +507 -0
package/src/runtime/child-pi.ts +123 -35
package/src/runtime/crash-recovery.ts +5 -4
package/src/runtime/crew-agent-runtime.ts +1 -0
package/src/runtime/custom-tools/irc-tool.ts +13 -0
package/src/runtime/custom-tools/submit-result-tool.ts +3 -2
package/src/runtime/delivery-coordinator.ts +10 -3
package/src/runtime/dynamic-script-runner.ts +482 -0
package/src/runtime/foreground-control.ts +87 -17
package/src/runtime/handoff-manager.ts +589 -0
package/src/runtime/hidden-handoff.ts +424 -0
package/src/runtime/live-agent-manager.ts +20 -4
package/src/runtime/live-session-runtime.ts +39 -4
package/src/runtime/manifest-cache.ts +2 -1
package/src/runtime/model-resolver.ts +16 -4
package/src/runtime/phase-tracker.ts +373 -0
package/src/runtime/pi-args.ts +11 -1
package/src/runtime/pi-json-output.ts +31 -0
package/src/runtime/pipeline-runner.ts +514 -0
package/src/runtime/progress-tracker.ts +124 -0
package/src/runtime/retry-runner.ts +354 -0
package/src/runtime/sandbox.ts +252 -0
package/src/runtime/scheduler.ts +7 -2
package/src/runtime/skill-effectiveness.ts +473 -0
package/src/runtime/skill-instructions.ts +37 -3
package/src/runtime/subagent-manager.ts +1 -1
package/src/runtime/task-graph.ts +11 -1
package/src/runtime/task-runner.ts +92 -18
package/src/runtime/team-runner.ts +13 -12
package/src/runtime/tool-progress.ts +10 -3
package/src/runtime/verification-gates.ts +367 -0
package/src/schema/team-tool-schema.ts +37 -0
package/src/skills/discover-skills.ts +5 -0
package/src/state/active-run-registry.ts +9 -2
package/src/state/contracts.ts +9 -0
package/src/state/crew-init.ts +3 -3
package/src/state/decision-ledger.ts +98 -55
package/src/state/event-log-rotation.ts +2 -2
package/src/state/event-log.ts +144 -10
package/src/state/hook-instinct-bridge.ts +5 -5
package/src/state/mailbox.ts +10 -0
package/src/state/run-cache.ts +18 -8
package/src/state/state-store.ts +3 -1
package/src/state/types.ts +4 -0
package/src/tools/safe-bash-extension.ts +1 -0
package/src/tools/safe-bash.ts +152 -20
package/src/types/new-api-types.ts +34 -0
package/src/ui/agent-management-overlay.ts +5 -1
package/src/ui/crew-widget.ts +29 -15
package/src/ui/overlays/mailbox-detail-overlay.ts +13 -2
package/src/ui/powerbar-publisher.ts +101 -7
package/src/ui/tool-render.ts +15 -15
package/src/ui/transcript-cache.ts +13 -0
package/src/utils/bm25-search.ts +16 -8
package/src/utils/env-filter.ts +8 -5
package/src/utils/redaction.ts +169 -15
package/src/utils/session-utils.ts +52 -0
package/src/utils/sse-parser.ts +10 -1
package/src/worktree/cleanup.ts +6 -1
package/src/worktree/worktree-manager.ts +32 -13
package/workflows/chain.workflow.md +252 -0
package/workflows/pipeline.workflow.md +27 -0

package/src/runtime/auto-summarize.ts ADDED Viewed

@@ -0,0 +1,350 @@
+/**
+ * AutoSummarizeService - Enables auto-summarization with token/tool thresholds.
+ *
+ * Based on pi-boomerang's autoBoomerang pattern:
+ * - toggle() enables/disables auto-summarization
+ * - shouldAutoSummarize() checks if task should auto-summarize
+ * - Token and tool thresholds control when summarization triggers
+ *
+ * @see docs/pi-boomerang-integration-plan.md
+ */
+import type { TaskPacket, TaskResult } from "./handoff-manager.ts";
+/**
+ * Configuration for AutoSummarizeService.
+ *
+ * `enabled` and `threshold` are required by this type; the optional fields fall
+ * back to DEFAULT_AUTO_SUMMARIZE_CONFIG when the service is constructed.
+ */
+export interface AutoSummarizeConfig {
+	/** Whether auto-summarize is enabled; while false the service never recommends summarization */
+	enabled: boolean;
+	/** Token threshold: a task whose total token count is at or above this value triggers summarization */
+	threshold: number;
+	/** Minimum number of tools used that triggers summarization on its own (default: 5) */
+	minToolsUsed?: number;
+	/** Whether to collapse context after summarization (default: true); the service only stores and reports this flag */
+	collapseContext?: boolean;
+}
+/**
+ * Default configuration values.
+ *
+ * Covers every AutoSummarizeConfig field except `enabled`. The service
+ * constructor uses these for any field the caller leaves unset; `enabled`
+ * has its own default (false) inside the constructor.
+ */
+export const DEFAULT_AUTO_SUMMARIZE_CONFIG: Required<Omit<AutoSummarizeConfig, "enabled">> = {
+	threshold: 5000,
+	minToolsUsed: 5,
+	collapseContext: true,
+};
+/**
+ * Options for AutoSummarizeService.
+ *
+ * Both fields are optional; constructing the service with no options yields a
+ * disabled service using the default thresholds and no event emitter.
+ */
+export interface AutoSummarizeServiceOptions {
+	/** Initial configuration; any omitted field uses its default */
+	config?: Partial<AutoSummarizeConfig>;
+	/** Custom event emitter; when omitted, no events are emitted until one is set via setEventEmitter() */
+	eventEmitter?: AutoSummarizeEventEmitter;
+}
+/**
+ * Event emitter for auto-summarize events.
+ *
+ * Minimal sink interface: the service in this module calls `emit` with the
+ * event name "auto-summarize:toggled" and an AutoSummarizeToggledEventData
+ * payload whenever its enabled state changes.
+ */
+export interface AutoSummarizeEventEmitter {
+	emit(event: string, data: unknown): void;
+}
+/**
+ * Event data for auto-summarize toggle event.
+ *
+ * `enabled` is the state after the change and `previousEnabled` is the state
+ * before it, so the two always differ when emitted by AutoSummarizeService.
+ */
+export interface AutoSummarizeToggledEventData {
+	enabled: boolean;
+	previousEnabled: boolean;
+}
+/**
+ * Event data for auto-summarize triggered event.
+ *
+ * Carries the task packet and result that qualified, the rule that fired
+ * (`trigger`), and the token count involved.
+ *
+ * NOTE(review): nothing in this module constructs or emits this payload;
+ * presumably it is produced by the code that acts on a positive decision.
+ * Confirm against the caller.
+ */
+export interface AutoSummarizeTriggeredEventData {
+	packet: TaskPacket;
+	result: TaskResult;
+	trigger: AutoSummarizeTrigger;
+	tokenCount: number;
+}
+/**
+ * What triggered the auto-summarize.
+ *
+ * - "token_threshold": total tokens reached the configured threshold
+ * - "tools_threshold": number of tools used reached the configured minimum
+ * - "high_usage": high tokens-per-tool ratio
+ * - "manual": not produced by AutoSummarizeService.getAutoSummarizeDecision;
+ *   presumably reserved for explicitly requested summaries (verify against callers)
+ */
+export type AutoSummarizeTrigger =
+	| "token_threshold"
+	| "tools_threshold"
+	| "manual"
+	| "high_usage";
+/**
+ * AutoSummarizeService decides whether a finished task should be auto-summarized,
+ * based on configurable token and tool-usage thresholds.
+ *
+ * The service only makes the decision and reports toggle events through the
+ * optional event emitter; it does not perform summarization itself.
+ *
+ * While enabled, a task qualifies if any rule holds (checked in this order):
+ * 1. `result.usage.totalTokens` >= `threshold`            -> "token_threshold"
+ * 2. `result.toolsUsed.length` >= `minToolsUsed`          -> "tools_threshold"
+ * 3. more than 2000 tokens, at least 3 tools used, and
+ *    more than 1000 tokens per tool                       -> "high_usage"
+ *
+ * Missing usage or tool data on the result is treated as 0.
+ */
+export class AutoSummarizeService {
+	/** High-usage rule: token count must be strictly greater than this. */
+	private static readonly HIGH_USAGE_MIN_TOKENS = 2000;
+	/** High-usage rule: at least this many tools must have been used (also keeps the ratio's divisor non-zero). */
+	private static readonly HIGH_USAGE_MIN_TOOLS = 3;
+	/** High-usage rule: tokens-per-tool must be strictly greater than this. */
+	private static readonly HIGH_USAGE_TOKENS_PER_TOOL = 1000;
+	/** Fully populated configuration; every optional field is resolved in the constructor. */
+	private config: AutoSummarizeConfig & Required<Omit<AutoSummarizeConfig, "enabled">>;
+	private eventEmitter: AutoSummarizeEventEmitter | null = null;
+	/**
+	 * @param options - Optional initial configuration and event emitter
+	 * @throws Error if the supplied `threshold` or `minToolsUsed` is negative or NaN
+	 */
+	constructor(options: AutoSummarizeServiceOptions = {}) {
+		const initial = options.config;
+		const threshold = initial?.threshold ?? DEFAULT_AUTO_SUMMARIZE_CONFIG.threshold;
+		const minToolsUsed = initial?.minToolsUsed ?? DEFAULT_AUTO_SUMMARIZE_CONFIG.minToolsUsed;
+		// Same rules as setThreshold()/setMinToolsUsed(), so an invalid value cannot enter through the constructor.
+		AutoSummarizeService.assertNonNegative(threshold, "Threshold must be non-negative");
+		AutoSummarizeService.assertNonNegative(minToolsUsed, "minToolsUsed must be non-negative");
+		this.config = {
+			enabled: initial?.enabled ?? false,
+			threshold,
+			minToolsUsed,
+			collapseContext: initial?.collapseContext ?? DEFAULT_AUTO_SUMMARIZE_CONFIG.collapseContext,
+		};
+		if (options.eventEmitter) {
+			this.eventEmitter = options.eventEmitter;
+		}
+	}
+	/**
+	 * Reject values that would silently break the threshold comparisons.
+	 * NaN is rejected explicitly because `NaN < 0` is false and would otherwise pass.
+	 *
+	 * @throws Error with `message` when `value` is negative or NaN
+	 */
+	private static assertNonNegative(value: number, message: string): void {
+		if (Number.isNaN(value) || value < 0) {
+			throw new Error(message);
+		}
+	}
+	/**
+	 * Emit "auto-summarize:toggled" with the current and previous enabled state.
+	 * Does nothing when no event emitter is set.
+	 */
+	private emitToggled(previousEnabled: boolean): void {
+		const payload: AutoSummarizeToggledEventData = {
+			enabled: this.config.enabled,
+			previousEnabled,
+		};
+		this.eventEmitter?.emit("auto-summarize:toggled", payload);
+	}
+	/**
+	 * Check if auto-summarization is currently enabled.
+	 */
+	isEnabled(): boolean {
+		return this.config.enabled;
+	}
+	/**
+	 * Toggle auto-summarize mode and emit "auto-summarize:toggled".
+	 *
+	 * @returns The new enabled state
+	 */
+	toggle(): boolean {
+		const previousEnabled = this.config.enabled;
+		this.config.enabled = !previousEnabled;
+		this.emitToggled(previousEnabled);
+		return this.config.enabled;
+	}
+	/**
+	 * Enable auto-summarize. No-op (and no event) if already enabled.
+	 */
+	enable(): void {
+		if (!this.config.enabled) {
+			this.toggle();
+		}
+	}
+	/**
+	 * Disable auto-summarize. No-op (and no event) if already disabled.
+	 */
+	disable(): void {
+		if (this.config.enabled) {
+			this.toggle();
+		}
+	}
+	/**
+	 * Check if a task should auto-summarize.
+	 *
+	 * Delegates to getAutoSummarizeDecision() so the boolean answer and the
+	 * explained decision can never disagree.
+	 *
+	 * @param packet - The task packet
+	 * @param result - The task result
+	 * @returns True if the task should auto-summarize
+	 */
+	shouldAutoSummarize(packet: TaskPacket, result: TaskResult): boolean {
+		return this.getAutoSummarizeDecision(packet, result).shouldSummarize;
+	}
+	/**
+	 * Get the reason why a task should (or should not) auto-summarize.
+	 *
+	 * @param packet - The task packet (not consulted by the current rules)
+	 * @param result - The task result; `usage.totalTokens` and `toolsUsed.length` are read, each defaulting to 0
+	 * @returns Decision with the shouldSummarize flag, a human-readable reason, the rule that fired (if any), and the measured counts
+	 */
+	getAutoSummarizeDecision(packet: TaskPacket, result: TaskResult): AutoSummarizeDecision {
+		const tokenCount = result.usage?.totalTokens ?? 0;
+		const toolsUsed = result.toolsUsed?.length ?? 0;
+		const decide = (
+			shouldSummarize: boolean,
+			reason: string,
+			trigger?: AutoSummarizeTrigger,
+		): AutoSummarizeDecision => ({ shouldSummarize, reason, trigger, tokenCount, toolsUsed });
+		if (!this.config.enabled) {
+			return decide(false, "auto-summarize is disabled");
+		}
+		const { threshold, minToolsUsed } = this.config;
+		// Rule 1: token threshold
+		if (tokenCount >= threshold) {
+			return decide(true, `Token count ${tokenCount} exceeds threshold ${threshold}`, "token_threshold");
+		}
+		// Rule 2: tools threshold
+		if (toolsUsed >= minToolsUsed) {
+			return decide(true, `Tool count ${toolsUsed} meets minimum ${minToolsUsed}`, "tools_threshold");
+		}
+		// Rule 3: high token count relative to tools used.
+		// The minimum-tools guard also guarantees the division below never divides by zero.
+		if (
+			tokenCount > AutoSummarizeService.HIGH_USAGE_MIN_TOKENS &&
+			toolsUsed >= AutoSummarizeService.HIGH_USAGE_MIN_TOOLS
+		) {
+			const tokensPerTool = tokenCount / toolsUsed;
+			if (tokensPerTool > AutoSummarizeService.HIGH_USAGE_TOKENS_PER_TOOL) {
+				return decide(true, `High token-to-tool ratio: ${Math.round(tokensPerTool)} tokens/tool`, "high_usage");
+			}
+		}
+		return decide(false, `Below thresholds (tokens: ${tokenCount}/${threshold}, tools: ${toolsUsed}/${minToolsUsed})`);
+	}
+	/**
+	 * Get a shallow copy of the current configuration; mutating it does not affect the service.
+	 */
+	getConfig(): AutoSummarizeConfig & Required<Omit<AutoSummarizeConfig, "enabled">> {
+		return { ...this.config };
+	}
+	/**
+	 * Update configuration. Only the fields present (not undefined) are changed.
+	 * Emits "auto-summarize:toggled" if the enabled state actually changed.
+	 *
+	 * All numeric fields are validated before anything is written, so a rejected
+	 * update leaves the configuration untouched.
+	 *
+	 * @throws Error if `threshold` or `minToolsUsed` is negative or NaN
+	 */
+	updateConfig(config: Partial<AutoSummarizeConfig>): void {
+		if (config.threshold !== undefined) {
+			AutoSummarizeService.assertNonNegative(config.threshold, "Threshold must be non-negative");
+		}
+		if (config.minToolsUsed !== undefined) {
+			AutoSummarizeService.assertNonNegative(config.minToolsUsed, "minToolsUsed must be non-negative");
+		}
+		const previousEnabled = this.config.enabled;
+		if (config.enabled !== undefined) {
+			this.config.enabled = config.enabled;
+		}
+		if (config.threshold !== undefined) {
+			this.config.threshold = config.threshold;
+		}
+		if (config.minToolsUsed !== undefined) {
+			this.config.minToolsUsed = config.minToolsUsed;
+		}
+		if (config.collapseContext !== undefined) {
+			this.config.collapseContext = config.collapseContext;
+		}
+		// Emit event if enabled state changed
+		if (this.config.enabled !== previousEnabled) {
+			this.emitToggled(previousEnabled);
+		}
+	}
+	/**
+	 * Get current threshold value.
+	 */
+	getThreshold(): number {
+		return this.config.threshold;
+	}
+	/**
+	 * Set token threshold.
+	 *
+	 * @throws Error if `threshold` is negative or NaN
+	 */
+	setThreshold(threshold: number): void {
+		AutoSummarizeService.assertNonNegative(threshold, "Threshold must be non-negative");
+		this.config.threshold = threshold;
+	}
+	/**
+	 * Get current minToolsUsed value.
+	 */
+	getMinToolsUsed(): number {
+		return this.config.minToolsUsed;
+	}
+	/**
+	 * Set minimum tools threshold.
+	 *
+	 * @throws Error if `minTools` is negative or NaN
+	 */
+	setMinToolsUsed(minTools: number): void {
+		AutoSummarizeService.assertNonNegative(minTools, "minToolsUsed must be non-negative");
+		this.config.minToolsUsed = minTools;
+	}
+	/**
+	 * Check if context should be collapsed after summarization.
+	 */
+	shouldCollapseContext(): boolean {
+		return this.config.collapseContext;
+	}
+	/**
+	 * Set (or replace) the event emitter used for toggle events.
+	 */
+	setEventEmitter(eventEmitter: AutoSummarizeEventEmitter): void {
+		this.eventEmitter = eventEmitter;
+	}
+}
+/**
+ * Decision result returned by AutoSummarizeService.getAutoSummarizeDecision().
+ *
+ * `reason` is a human-readable explanation; `trigger` names the rule that
+ * fired and is undefined whenever `shouldSummarize` is false. `tokenCount`
+ * and `toolsUsed` are the values measured from the task result (0 when the
+ * result does not report them).
+ */
+export interface AutoSummarizeDecision {
+	shouldSummarize: boolean;
+	reason: string;
+	trigger: AutoSummarizeTrigger | undefined;
+	tokenCount: number;
+	toolsUsed: number;
+}
+/**
+ * Factory helper that builds a new AutoSummarizeService.
+ *
+ * @param options - Optional initial configuration and event emitter, passed to the constructor unchanged
+ * @returns A newly constructed service instance
+ */
+export function createAutoSummarizeService(
+	options?: AutoSummarizeServiceOptions,
+): AutoSummarizeService {
+	const service = new AutoSummarizeService(options);
+	return service;
+}

package/src/runtime/background-runner.ts CHANGED Viewed

@@ -24,6 +24,7 @@ import { directTeamAndWorkflowFromRun } from "./direct-run.ts";
 import { expandParallelResearchWorkflow } from "./parallel-research.ts";
 import { writeAsyncStartMarker } from "./async-marker.ts";
 import { startParentGuard, stopParentGuard } from "./parent-guard.ts";
+import { logInternalError } from "../utils/internal-error.ts";
 /**
  * Heartbeat mechanism: periodically write a heartbeat file so the stale reconciler
@@ -127,6 +128,8 @@ function setupUnhandledRejectionGuard(state: { cwd?: string; runId?: string; eve
 }
 async function main(): Promise<void> {
+	// FIX: Store logFd so it can be closed on exit to prevent file descriptor leak
+	let logFd: number | undefined;
 	// Redirect console to background.log since stdio is "ignore" in detached mode.
 	// Must be BEFORE any console.log/console.error calls.
 	const _cwd = argValue("--cwd");
@@ -134,13 +137,17 @@ async function main(): Promise<void> {
 	if (_cwd && _runId) {
 		try {
 			const logPath = path.join(_cwd, ".crew/state/runs", _runId, "background.log");
-			const logFd = fs.openSync(logPath, "a");
+			logFd = fs.openSync(logPath, "a");
 			const origWrite = (prefix: string) => (data: any, ...args: any[]) => {
 				const msg = [data, ...args].map(String).join(" ") + "\n";
-				fs.writeSync(logFd, msg);
+				fs.writeSync(logFd!, msg);
 			};
 			console.log = origWrite("OUT");
 			console.error = origWrite("ERR");
+			// FIX: Close logFd on process exit to prevent file descriptor leak
+			process.on("exit", () => {
+				try { if (logFd !== undefined) fs.closeSync(logFd); } catch { /* ignore */ }
+			});
 		} catch { /* best-effort */ }
 	}
@@ -317,7 +324,7 @@ async function main(): Promise<void> {
 			if (loaded) {
 				// LAZY: live-agent-manager only needed on failure cleanup path; avoid module load at hot path.
 				const { terminateLiveAgentsForRun } = await import("./live-agent-manager.ts");
-				void terminateLiveAgentsForRun(loaded.manifest.runId, "failed", appendEvent, loaded.manifest.eventsPath).catch(() => {});
+				void terminateLiveAgentsForRun(loaded.manifest.runId, "failed", appendEvent, loaded.manifest.eventsPath).catch((error) => logInternalError("background-runner.terminate", error, `runId=${loaded.manifest.runId}`));
 			}
 		} catch { /* best-effort */ }
 		const message = error instanceof Error ? error.message : String(error);