npm - @agwab/pi-workflow - Versions diffs - 0.1.2 → 0.2.1 - Mend

@agwab/pi-workflow 0.1.2 → 0.2.1

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (41)

package/README.md +9 -13
package/dist/compiler.d.ts +5 -5
package/dist/compiler.js +82 -24
package/dist/dynamic-generated-task-runtime.d.ts +2 -0
package/dist/dynamic-generated-task-runtime.js +21 -8
package/dist/engine.d.ts +6 -5
package/dist/engine.js +39 -54
package/dist/extension.js +211 -24
package/dist/store.d.ts +3 -1
package/dist/store.js +135 -38
package/dist/subagent-backend.d.ts +4 -0
package/dist/subagent-backend.js +128 -4
package/dist/types.d.ts +5 -0
package/dist/workflow-progress-health.d.ts +37 -0
package/dist/workflow-progress-health.js +296 -0
package/dist/workflow-runtime.d.ts +8 -0
package/dist/workflow-runtime.js +63 -10
package/dist/workflow-view.d.ts +2 -0
package/dist/workflow-view.js +97 -18
package/dist/workflow-web-source.js +32 -14
package/docs/usage.md +12 -1
package/package.json +6 -6
package/src/compiler.ts +136 -41
package/src/dynamic-generated-task-runtime.ts +47 -12
package/src/engine.ts +55 -100
package/src/extension.ts +270 -34
package/src/store.ts +180 -44
package/src/subagent-backend.ts +170 -6
package/src/types.ts +10 -0
package/src/workflow-progress-health.ts +461 -0
package/src/workflow-runtime.ts +85 -13
package/src/workflow-view.ts +186 -41
package/src/workflow-web-source.ts +192 -69
package/workflows/deep-research/helpers/claim-evidence-gate.mjs +111 -37
package/workflows/deep-research/helpers/final-audit-packet.mjs +191 -14
package/workflows/deep-research/helpers/normalize-input-packet.mjs +159 -50
package/workflows/deep-research/helpers/render-executive.mjs +671 -37
package/workflows/deep-research/helpers/sanitize-verification-candidates.mjs +624 -0
package/workflows/deep-research/schemas/deep-research-executive-render-control.schema.json +2 -0
package/workflows/deep-research/schemas/deep-research-final-synthesis-control.schema.json +110 -0
package/workflows/deep-research/spec.json +41 -11

package/src/subagent-backend.ts CHANGED

@@ -17,6 +17,7 @@ import {
 	resolve,
 	sep,
 } from "node:path";
+import { availableParallelism } from "node:os";
 import { fileURLToPath } from "node:url";
 import type {
@@ -55,6 +56,10 @@ const FETCH_CONTENT_CACHE_ENV = "PI_WORKFLOW_FETCH_CONTENT_CACHE";
 const LEGACY_FETCH_CACHE_ENV = "PI_WORKFLOW_FETCH_CACHE";
 const DEFAULT_TRANSIENT_MODEL_FAILURE_RETRIES = 5;
 const DEFAULT_ARTIFACT_OUTPUT_RETRIES = 2;
+const MAX_CONCURRENT_LAUNCHES_ENV = "PI_WORKFLOW_MAX_CONCURRENT_LAUNCHES";
+const DEFAULT_LAUNCH_SLOT_RELEASE_DELAY_MS = 3_000;
+const MIN_TRANSIENT_RETRY_JITTER_MS = 1_000;
+const MAX_TRANSIENT_RETRY_JITTER_MS = 5_000;
 const MODULE_PATH = fileURLToPath(import.meta.url);
 const MODULE_DIR = dirname(MODULE_PATH);
 const BUNDLED_PI_WEB_ACCESS_EXTENSION = bundledNodeModulePath(
@@ -175,6 +180,103 @@ async function loadSubagentApi(): Promise<SubagentApi> {
 	return cachedSubagentApi;
 }
+let launchSlotReleaseDelayMs = DEFAULT_LAUNCH_SLOT_RELEASE_DELAY_MS;
+let transientRetryJitterForTests: (() => number) | undefined;
+const launchWaitQueue: Array<() => void> = [];
+let activeLaunchSlots = 0;
+function resolveMaxConcurrentLaunches(): number {
+	const override = Number.parseInt(
+		process.env[MAX_CONCURRENT_LAUNCHES_ENV] ?? "",
+		10,
+	);
+	if (Number.isFinite(override)) return Math.max(1, Math.floor(override));
+	return Math.max(2, Math.floor(availableParallelism() / 2));
+}
+function isLaunchGateSaturated(): boolean {
+	return activeLaunchSlots >= resolveMaxConcurrentLaunches();
+}
+async function acquireLaunchSlot(): Promise<() => void> {
+	if (!isLaunchGateSaturated()) {
+		activeLaunchSlots += 1;
+		return releaseLaunchSlot;
+	}
+	await new Promise<void>((resolveWait) => launchWaitQueue.push(resolveWait));
+	return releaseLaunchSlot;
+}
+function releaseLaunchSlot(): void {
+	const next = launchWaitQueue.shift();
+	if (next) {
+		// Transfer the occupied slot directly to the queued launcher.
+		next();
+		return;
+	}
+	activeLaunchSlots = Math.max(0, activeLaunchSlots - 1);
+}
+function releaseLaunchSlotAfterDelay(
+	delayMs: number,
+	release: () => void,
+): void {
+	if (delayMs <= 0) {
+		release();
+		return;
+	}
+	const timer = setTimeout(release, delayMs);
+	timer.unref?.();
+}
+async function runWithLaunchSlot<T>(action: () => Promise<T>): Promise<T> {
+	const release = await acquireLaunchSlot();
+	let holdAfterReturn = false;
+	try {
+		const result = await action();
+		holdAfterReturn = true;
+		return result;
+	} finally {
+		releaseLaunchSlotAfterDelay(
+			holdAfterReturn ? launchSlotReleaseDelayMs : 0,
+			release,
+		);
+	}
+}
+function transientRetryJitterMs(): number {
+	if (transientRetryJitterForTests) return transientRetryJitterForTests();
+	return (
+		MIN_TRANSIENT_RETRY_JITTER_MS +
+		Math.floor(
+			Math.random() *
+				(MAX_TRANSIENT_RETRY_JITTER_MS - MIN_TRANSIENT_RETRY_JITTER_MS + 1),
+		)
+	);
+}
+function sleep(ms: number): Promise<void> {
+	return new Promise((resolve) => setTimeout(resolve, ms));
+}
+export function setSubagentLaunchControlsForTests(options?: {
+	releaseDelayMs?: number;
+	retryJitterMs?: number | (() => number);
+}): void {
+	launchSlotReleaseDelayMs =
+		options?.releaseDelayMs === undefined
+			? DEFAULT_LAUNCH_SLOT_RELEASE_DELAY_MS
+			: Math.max(0, Math.floor(options.releaseDelayMs));
+	transientRetryJitterForTests =
+		options?.retryJitterMs === undefined
+			? undefined
+			: typeof options.retryJitterMs === "function"
+				? options.retryJitterMs
+				: () => Math.max(0, Math.floor(options.retryJitterMs as number));
+	activeLaunchSlots = 0;
+	while (launchWaitQueue.length > 0) launchWaitQueue.shift()?.();
+}
 export async function cleanupSubagentRun(
 	_cwd: string,
 	run: WorkflowRunRecord,
@@ -212,6 +314,14 @@ export async function launchSubagentTask(
 		};
 	}
+	if ((task.launchRetry?.attempts ?? 0) > 0) {
+		const jitterMs = transientRetryJitterMs();
+		task.statusDetail = "retry_model_failure";
+		task.lastMessage = `waiting ${jitterMs}ms before retrying transient-model launch`;
+		await writeRunRecord(cwd, run);
+		if (jitterMs > 0) await sleep(jitterMs);
+	}
 	const systemPromptFile = fromProjectPath(cwd, task.files.systemPrompt);
 	const taskPromptFile = fromProjectPath(cwd, task.files.taskPrompt);
 	const outputFile = fromProjectPath(cwd, task.files.output);
@@ -267,7 +377,11 @@ export async function launchSubagentTask(
 		};
 		subagentOptions.extensions = extensions;
 		if (captureToolCallsEnabled()) subagentOptions.captureToolCalls = true;
-		launched = await api.runSubagent(subagentOptions);
+		if (isLaunchGateSaturated()) {
+			task.lastMessage = `waiting for pi-subagent launch slot (${resolveMaxConcurrentLaunches()} max)`;
+			await writeRunRecord(cwd, run).catch(() => undefined);
+		}
+		launched = await runWithLaunchSlot(() => api.runSubagent(subagentOptions));
 	} catch (error) {
 		task.status = "pending";
 		task.statusDetail = "pending";
@@ -432,12 +546,29 @@ async function materializeTerminalSubagentResult(
 		artifactRoot,
 	);
 	const outputText = await readFile(outputFile, "utf8").catch(() => "");
+	const stderrText = await readFile(stderrFile, "utf8").catch(() => "");
 	const outputBytes = Buffer.byteLength(outputText, "utf8");
-	const statusInfo = workflowStatusFromSubagent(
+	let statusInfo = workflowStatusFromSubagent(
 		snapshot,
 		subagentResult,
 		outputBytes,
 	);
+	const deterministicBootFailure = classifyDeterministicBootFailure({
+		statusInfo,
+		stderrText,
+		outputBytes,
+		contextLengthExceeded: Boolean(
+			(subagentResult?.metadata as any)?.contextLengthExceeded ??
+				snapshot.metadata?.contextLengthExceeded,
+		),
+	});
+	if (deterministicBootFailure) {
+		statusInfo = {
+			status: "failed",
+			failureKind: "deterministic_boot",
+			errorMessage: deterministicBootFailure,
+		};
+	}
 	const completedAt =
 		typeof subagentResult?.completedAt === "string"
 			? subagentResult.completedAt
@@ -1005,6 +1136,36 @@ function failArtifactGraphTask(
 	return true;
 }
+function classifyDeterministicBootFailure(options: {
+	statusInfo: {
+		status: WorkflowTaskRunRecord["status"];
+		failureKind?: string;
+		errorMessage?: string;
+	};
+	stderrText: string;
+	outputBytes: number;
+	contextLengthExceeded: boolean;
+}): string | undefined {
+	if (
+		options.statusInfo.status !== "failed" ||
+		options.statusInfo.failureKind !== "model" ||
+		options.outputBytes !== 0 ||
+		options.contextLengthExceeded
+	) {
+		return undefined;
+	}
+	const text = options.stderrText;
+	const deterministicPattern =
+		/(Failed to load extension|Cannot find module|(?:failed to load|invalid|missing) (?:workflow )?config(?:uration)?|config(?:uration)? (?:error|failed|invalid))/i;
+	if (!deterministicPattern.test(text)) return undefined;
+	const excerpt =
+		text
+			.split(/\r?\n/)
+			.map((line) => line.trim())
+			.find((line) => deterministicPattern.test(line)) ?? text.trim();
+	return `deterministic-boot failure: ${excerpt.slice(0, 500)}`;
+}
 function shouldRetryTransientModelFailure(
 	statusInfo: {
 		status: WorkflowTaskRunRecord["status"];
@@ -1056,14 +1217,14 @@ function retryOrFailTransientSubagentFailure(
 	if (!exhausted) {
 		task.status = "pending";
 		task.statusDetail = "retry_model_failure";
-		task.lastMessage = `${options.message}; retrying transient model failure (${attempt}/${maxAttempts})`;
+		task.lastMessage = `${options.message}; retrying transient-model failure (${attempt}/${maxAttempts})`;
 		return true;
 	}
 	task.status = "failed";
 	task.statusDetail = task.launchRetry.reason ?? "model_exhausted";
 	task.exitCode = 1;
 	task.completedAt = nowIso();
-	task.lastMessage = `${options.message}; transient model failure retries exhausted (${maxAttempts})`;
+	task.lastMessage = `${options.message}; transient-model failure retries exhausted (${maxAttempts})`;
 	return true;
 }
@@ -1317,7 +1478,10 @@ async function workflowTaskExtensions(
 			},
 		});
 		const capturedProviderExtensions = new Set(
-			workflowWebSourceProviderExtensions(tools, compiledTask.runtime.toolProviders),
+			workflowWebSourceProviderExtensions(
+				tools,
+				compiledTask.runtime.toolProviders,
+			),
 		);
 		extensions = uniqueStrings([
 			...extensions.filter(
@@ -1673,7 +1837,7 @@ function buildSystemPrompt(task: CompiledTask): string {
 		enabledTools.includes("workflow_web_source_read")
 			? "Workflow web-source tools return compact source cards. Preserve sourceRef values in structured outputs. Use workflow_web_source_read for exact evidence snippets; when several snippets are needed from the same sourceRef, batch them with queries:[...] or reads:[...] instead of making repeated calls. If the exact quote is unknown, pass claim plus 2-6 distinctive terms to harvest a candidate source window and preserve its match metadata. Do not read workflow cache files directly."
 			: !enabledTools.includes("get_search_content") &&
-				  (enabledTools.includes("web_search") ||
+					(enabledTools.includes("web_search") ||
 						enabledTools.includes("fetch_content"))
 				? "Full cached search-content hydration is unavailable here. Use web_search/fetch_content results and report evidence gaps instead of broad raw document retrieval."
 				: undefined,

package/src/types.ts CHANGED

@@ -1,3 +1,9 @@
+import type {
+	WorkflowModelInfo,
+	WorkflowRuntimeDefaults,
+	WorkflowRuntimeThinkingResolution,
+} from "./workflow-runtime.js";
 export const THINKING_LEVELS = [
 	"off",
 	"minimal",
@@ -284,6 +290,7 @@ export interface PermissionPreview {
 export interface CompiledTaskRuntime {
 	model?: string;
 	thinking?: ThinkingLevel;
+	thinkingResolution?: WorkflowRuntimeThinkingResolution;
 	fast?: FastMode;
 	approvalMode: ApprovalMode;
 	tools?: string[];
@@ -469,6 +476,8 @@ export interface CompiledDynamicWorkflowTask {
 	helpers: Record<string, CompiledDynamicWorkflowHelper>;
 	workflows: Record<string, CompiledDynamicNestedWorkflow>;
 	decisionLoop?: CompiledDynamicDecisionLoop;
+	runtimeOverrides?: WorkflowRuntimeDefaults;
+	availableModels?: WorkflowModelInfo[];
 }
 export interface CompiledArtifactGraphTask {
@@ -572,6 +581,7 @@ export interface WorkflowTaskRunRecord {
 	runtime: {
 		model?: string;
 		thinking?: ThinkingLevel;
+		thinkingResolution?: WorkflowRuntimeThinkingResolution;
 		fast?: FastMode;
 		approvalMode: ApprovalMode;
 		maxRuntimeMs?: number;