npm - @agwab/pi-workflow - Versions diffs - 0.1.2 → 0.2.1 - Mend

@agwab/pi-workflow 0.1.2 → 0.2.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (41) hide show

package/README.md +9 -13
package/dist/compiler.d.ts +5 -5
package/dist/compiler.js +82 -24
package/dist/dynamic-generated-task-runtime.d.ts +2 -0
package/dist/dynamic-generated-task-runtime.js +21 -8
package/dist/engine.d.ts +6 -5
package/dist/engine.js +39 -54
package/dist/extension.js +211 -24
package/dist/store.d.ts +3 -1
package/dist/store.js +135 -38
package/dist/subagent-backend.d.ts +4 -0
package/dist/subagent-backend.js +128 -4
package/dist/types.d.ts +5 -0
package/dist/workflow-progress-health.d.ts +37 -0
package/dist/workflow-progress-health.js +296 -0
package/dist/workflow-runtime.d.ts +8 -0
package/dist/workflow-runtime.js +63 -10
package/dist/workflow-view.d.ts +2 -0
package/dist/workflow-view.js +97 -18
package/dist/workflow-web-source.js +32 -14
package/docs/usage.md +12 -1
package/package.json +6 -6
package/src/compiler.ts +136 -41
package/src/dynamic-generated-task-runtime.ts +47 -12
package/src/engine.ts +55 -100
package/src/extension.ts +270 -34
package/src/store.ts +180 -44
package/src/subagent-backend.ts +170 -6
package/src/types.ts +10 -0
package/src/workflow-progress-health.ts +461 -0
package/src/workflow-runtime.ts +85 -13
package/src/workflow-view.ts +186 -41
package/src/workflow-web-source.ts +192 -69
package/workflows/deep-research/helpers/claim-evidence-gate.mjs +111 -37
package/workflows/deep-research/helpers/final-audit-packet.mjs +191 -14
package/workflows/deep-research/helpers/normalize-input-packet.mjs +159 -50
package/workflows/deep-research/helpers/render-executive.mjs +671 -37
package/workflows/deep-research/helpers/sanitize-verification-candidates.mjs +624 -0
package/workflows/deep-research/schemas/deep-research-executive-render-control.schema.json +2 -0
package/workflows/deep-research/schemas/deep-research-final-synthesis-control.schema.json +110 -0
package/workflows/deep-research/spec.json +41 -11

package/src/workflow-progress-health.ts ADDED Viewed

@@ -0,0 +1,461 @@
+import type {
+	TaskRunStatus,
+	WorkflowRunRecord,
+	WorkflowRunStatus,
+	WorkflowTaskRunRecord,
+} from "./types.js";
+export type WorkflowHealthState =
+	| "completed"
+	| "pending"
+	| "active"
+	| "long-tail"
+	| "stalled"
+	| "likely-stuck"
+	| "needs-action";
+export type WorkflowHealthTone =
+	| "success"
+	| "accent"
+	| "warning"
+	| "error"
+	| "dim";
+export type WorkflowDurationClass = "short" | "medium" | "long";
+export type WorkflowHealthSuggestion = "wait" | "inspect" | "resume" | "review";
+export interface WorkflowHealthTaskSummary {
+	taskId?: string;
+	displayName?: string;
+	stageId?: string;
+	status?: TaskRunStatus;
+	elapsedMs?: number;
+}
+export interface WorkflowProgressHealth {
+	state: WorkflowHealthState;
+	label: string;
+	summary: string;
+	tone: WorkflowHealthTone;
+	suggestion: WorkflowHealthSuggestion;
+	reason: string;
+	durationClass?: WorkflowDurationClass;
+	currentTask?: WorkflowHealthTaskSummary;
+	lastActivityAt?: string;
+	lastActivityAgeMs?: number;
+	heartbeatAt?: string;
+	heartbeatAgeMs?: number;
+}
+type TaskHealthInput = Pick<
+	WorkflowTaskRunRecord,
+	| "taskId"
+	| "specId"
+	| "displayName"
+	| "status"
+	| "statusDetail"
+	| "stageId"
+	| "kind"
+	| "startedAt"
+	| "lastMessage"
+	| "runtime"
+	| "backendHandle"
+	| "pid"
+>;
+type RunHealthInput = Pick<
+	WorkflowRunRecord,
+	"status" | "taskSummary" | "createdAt" | "updatedAt"
+> & {
+	tasks?: TaskHealthInput[];
+};
+type RunningTaskContext = {
+	task: TaskHealthInput;
+	nowMs: number;
+	durationClass: WorkflowDurationClass;
+	elapsedMs?: number;
+	activityAt?: string;
+	lastActivityAgeMs?: number;
+	heartbeatAt?: string;
+	heartbeatAgeMs?: number;
+	hasBackendSignal: boolean;
+	staleMs: number;
+};
+export interface WorkflowHealthOptions {
+	nowMs?: number;
+}
+const ACTIVE_ACTIVITY_MS = 2 * 60_000;
+const LONG_TAIL_ELAPSED_MS = 8 * 60_000;
+const STALL_BY_DURATION: Record<WorkflowDurationClass, number> = {
+	short: 5 * 60_000,
+	medium: 10 * 60_000,
+	long: 20 * 60_000,
+};
+const STUCK_BY_DURATION: Record<WorkflowDurationClass, number> = {
+	short: 15 * 60_000,
+	medium: 30 * 60_000,
+	long: 60 * 60_000,
+};
+export function diagnoseWorkflowRunHealth(
+	run: RunHealthInput,
+	options: WorkflowHealthOptions = {},
+): WorkflowProgressHealth {
+	const nowMs = options.nowMs ?? Date.now();
+	const runningTask = currentRunningTask(run.tasks ?? []);
+	if (runningTask)
+		return diagnoseWorkflowTaskHealth(runningTask, run, { nowMs });
+	const problem = (run.tasks ?? []).find((task) =>
+		isProblemStatus(task.status),
+	);
+	if (problem) return problemRunHealth(problem, nowMs);
+	if (isProblemStatus(run.status)) return problemWorkflowHealth(run.status);
+	if (run.status === "completed") return completedWorkflowHealth();
+	return waitingWorkflowHealth(run, nowMs);
+}
+export function diagnoseWorkflowTaskHealth(
+	task: TaskHealthInput,
+	run?: Pick<WorkflowRunRecord, "updatedAt">,
+	options: WorkflowHealthOptions = {},
+): WorkflowProgressHealth {
+	const nowMs = options.nowMs ?? Date.now();
+	if (task.status !== "running") return terminalTaskHealth(task, nowMs);
+	return runningTaskHealth(runningContext(task, run, nowMs));
+}
+export function classifyWorkflowTaskDuration(
+	task: Pick<
+		WorkflowTaskRunRecord,
+		"stageId" | "displayName" | "specId" | "kind" | "statusDetail" | "runtime"
+	>,
+): WorkflowDurationClass {
+	const text = [
+		task.stageId,
+		task.displayName,
+		task.specId,
+		task.kind,
+		task.statusDetail,
+	]
+		.filter(Boolean)
+		.join(" ")
+		.toLowerCase();
+	if (/\b(render|helper|support|schema|partition|gate)\b/.test(text))
+		return "short";
+	if (
+		/\b(research|audit|synthesis|review|verify|verifier|normalize|plan|impact|spec)\b/.test(
+			text,
+		)
+	)
+		return "long";
+	const maxRuntimeMs = task.runtime?.maxRuntimeMs;
+	if (maxRuntimeMs !== undefined && Number.isFinite(maxRuntimeMs)) {
+		if (maxRuntimeMs <= 5 * 60_000) return "short";
+		if (maxRuntimeMs >= 60 * 60_000) return "long";
+	}
+	return "medium";
+}
+function currentRunningTask(
+	tasks: TaskHealthInput[],
+): TaskHealthInput | undefined {
+	return tasks
+		.filter((task) => task.status === "running")
+		.sort(
+			(left, right) =>
+				(parseTime(left.startedAt) ?? Number.POSITIVE_INFINITY) -
+				(parseTime(right.startedAt) ?? Number.POSITIVE_INFINITY),
+		)[0];
+}
+function completedWorkflowHealth(): WorkflowProgressHealth {
+	return {
+		state: "completed",
+		label: "completed",
+		summary: "run completed",
+		tone: "success",
+		suggestion: "review",
+		reason: "all tasks reached a terminal successful state",
+	};
+}
+function problemWorkflowHealth(
+	status: WorkflowRunStatus,
+): WorkflowProgressHealth {
+	return {
+		state: "needs-action",
+		label: "needs action",
+		summary: `run ${status}`,
+		tone: "error",
+		suggestion: "inspect",
+		reason: `workflow status is ${status}`,
+	};
+}
+function problemRunHealth(
+	task: TaskHealthInput,
+	nowMs: number,
+): WorkflowProgressHealth {
+	return {
+		state: "needs-action",
+		label: "needs action",
+		summary: `${task.displayName ?? task.taskId ?? "task"} needs attention`,
+		tone: "error",
+		suggestion: "inspect",
+		reason: task.lastMessage ?? task.statusDetail ?? "task did not complete",
+		currentTask: taskSummary(task, nowMs),
+	};
+}
+function waitingWorkflowHealth(
+	run: RunHealthInput,
+	nowMs: number,
+): WorkflowProgressHealth {
+	const hasPending = run.taskSummary.pending > 0;
+	return {
+		state: hasPending ? "pending" : "active",
+		label: hasPending ? "pending" : "active",
+		summary: hasPending
+			? "waiting for the next schedulable task"
+			: "run is active",
+		tone: hasPending ? "dim" : "accent",
+		suggestion: "wait",
+		reason: hasPending
+			? "no task is currently running"
+			: "workflow is still in progress",
+		lastActivityAt: run.updatedAt,
+		lastActivityAgeMs: ageMs(run.updatedAt, nowMs),
+	};
+}
+function runningTaskHealth(
+	context: RunningTaskContext,
+): WorkflowProgressHealth {
+	return (
+		runtimeExceededHealth(context) ??
+		staleRunningHealth(context) ??
+		longTailHealth(context) ??
+		activeRunningHealth(context)
+	);
+}
+function runtimeExceededHealth(
+	context: RunningTaskContext,
+): WorkflowProgressHealth | undefined {
+	const maxRuntimeMs = context.task.runtime?.maxRuntimeMs;
+	const hasElapsed = context.elapsedMs !== undefined;
+	const hasBudget = maxRuntimeMs !== undefined && Number.isFinite(maxRuntimeMs);
+	if (!hasElapsed || !hasBudget) return undefined;
+	if (maxRuntimeMs <= 0 || context.elapsedMs! <= maxRuntimeMs) return undefined;
+	return runningHealth(context, {
+		state: "likely-stuck",
+		label: "runtime exceeded",
+		summary: "task exceeded its runtime budget",
+		tone: "error",
+		suggestion: "resume",
+		reason: "elapsed time is past runtime.maxRuntimeMs",
+	});
+}
+function staleRunningHealth(
+	context: RunningTaskContext,
+): WorkflowProgressHealth | undefined {
+	if (
+		context.staleMs >= STUCK_BY_DURATION[context.durationClass] &&
+		!context.hasBackendSignal
+	) {
+		return runningHealth(context, {
+			state: "likely-stuck",
+			label: "likely stuck",
+			summary: "no fresh backend or activity signal",
+			tone: "error",
+			suggestion: "resume",
+			reason: "running task has no backend signal and activity is stale",
+		});
+	}
+	if (context.staleMs < STALL_BY_DURATION[context.durationClass])
+		return undefined;
+	return runningHealth(context, {
+		state: "stalled",
+		label: "possibly stalled",
+		summary: "no recent visible progress",
+		tone: "warning",
+		suggestion: "inspect",
+		reason: context.hasBackendSignal
+			? "backend signal exists, but activity is stale"
+			: "activity is stale",
+	});
+}
+function longTailHealth(
+	context: RunningTaskContext,
+): WorkflowProgressHealth | undefined {
+	const isLongTail =
+		context.durationClass === "long" &&
+		context.elapsedMs !== undefined &&
+		context.elapsedMs >= LONG_TAIL_ELAPSED_MS;
+	if (!isLongTail) return undefined;
+	return runningHealth(context, {
+		state: "long-tail",
+		label: "long-tail active",
+		summary: "slow task with fresh liveness signals",
+		tone: "accent",
+		suggestion: "wait",
+		reason:
+			context.staleMs <= ACTIVE_ACTIVITY_MS
+				? "liveness signal is fresh"
+				: "long-running stage is still within the stale threshold",
+	});
+}
+function activeRunningHealth(
+	context: RunningTaskContext,
+): WorkflowProgressHealth {
+	return runningHealth(context, {
+		state: "active",
+		label: "active",
+		summary: "task is running",
+		tone: "accent",
+		suggestion: "wait",
+		reason:
+			context.staleMs <= ACTIVE_ACTIVITY_MS
+				? "liveness signal is fresh"
+				: "activity remains within the expected window",
+	});
+}
+function runningContext(
+	task: TaskHealthInput,
+	run: Pick<WorkflowRunRecord, "updatedAt"> | undefined,
+	nowMs: number,
+): RunningTaskContext {
+	const durationClass = classifyWorkflowTaskDuration(task);
+	const startedAtMs = parseTime(task.startedAt);
+	const heartbeatAt = parseHeartbeatAt(task.lastMessage);
+	const activityAt = latestIso([heartbeatAt, run?.updatedAt, task.startedAt]);
+	const lastActivityAgeMs = ageMs(activityAt, nowMs);
+	return {
+		task,
+		nowMs,
+		durationClass,
+		elapsedMs:
+			startedAtMs === undefined ? undefined : Math.max(0, nowMs - startedAtMs),
+		activityAt,
+		lastActivityAgeMs,
+		heartbeatAt,
+		heartbeatAgeMs: ageMs(heartbeatAt, nowMs),
+		hasBackendSignal: Boolean(task.backendHandle || task.pid || heartbeatAt),
+		staleMs: lastActivityAgeMs ?? Number.POSITIVE_INFINITY,
+	};
+}
+function terminalTaskHealth(
+	task: TaskHealthInput,
+	nowMs: number,
+): WorkflowProgressHealth {
+	if (task.status === "completed" || task.status === "skipped") {
+		return {
+			state: "completed",
+			label: task.status === "skipped" ? "skipped" : "completed",
+			summary: task.status === "skipped" ? "task skipped" : "task completed",
+			tone: "success",
+			suggestion: "review",
+			reason: task.statusDetail,
+			currentTask: taskSummary(task, nowMs),
+		};
+	}
+	if (task.status === "pending") {
+		return {
+			state: "pending",
+			label: "pending",
+			summary: "waiting for dependencies or scheduler",
+			tone: "dim",
+			suggestion: "wait",
+			reason: task.statusDetail,
+			currentTask: taskSummary(task, nowMs),
+		};
+	}
+	return {
+		state: "needs-action",
+		label: "needs action",
+		summary: `${task.status} task needs attention`,
+		tone: "error",
+		suggestion: "inspect",
+		reason: task.lastMessage ?? task.statusDetail,
+		currentTask: taskSummary(task, nowMs),
+	};
+}
+function runningHealth(
+	context: RunningTaskContext,
+	health: Pick<
+		WorkflowProgressHealth,
+		"state" | "label" | "summary" | "tone" | "suggestion" | "reason"
+	>,
+): WorkflowProgressHealth {
+	return {
+		...health,
+		durationClass: context.durationClass,
+		currentTask: taskSummary(context.task, context.nowMs),
+		lastActivityAt: context.activityAt,
+		lastActivityAgeMs: context.lastActivityAgeMs,
+		heartbeatAt: context.heartbeatAt,
+		heartbeatAgeMs: context.heartbeatAgeMs,
+	};
+}
+function taskSummary(
+	task: TaskHealthInput,
+	nowMs: number,
+): WorkflowHealthTaskSummary {
+	const startedAtMs = parseTime(task.startedAt);
+	return {
+		taskId: task.taskId,
+		displayName: task.displayName,
+		stageId: task.stageId,
+		status: task.status,
+		...(startedAtMs === undefined
+			? {}
+			: { elapsedMs: Math.max(0, nowMs - startedAtMs) }),
+	};
+}
+function isProblemStatus(status: TaskRunStatus | WorkflowRunStatus): boolean {
+	return (
+		status === "failed" || status === "blocked" || status === "interrupted"
+	);
+}
+function parseHeartbeatAt(message: string | undefined): string | undefined {
+	if (!message) return undefined;
+	const match = /heartbeat\s+(\d{4}-\d{2}-\d{2}T\S+?Z)/i.exec(message);
+	if (!match) return undefined;
+	const value = match[1];
+	return parseTime(value) === undefined ? undefined : value;
+}
+function latestIso(values: Array<string | undefined>): string | undefined {
+	let latest: string | undefined;
+	let latestMs = Number.NEGATIVE_INFINITY;
+	for (const value of values) {
+		const time = parseTime(value);
+		if (time === undefined || time <= latestMs) continue;
+		latest = value;
+		latestMs = time;
+	}
+	return latest;
+}
+function ageMs(value: string | undefined, nowMs: number): number | undefined {
+	const time = parseTime(value);
+	return time === undefined ? undefined : Math.max(0, nowMs - time);
+}
+function parseTime(value: string | undefined): number | undefined {
+	if (!value) return undefined;
+	const parsed = Date.parse(value);
+	return Number.isFinite(parsed) ? parsed : undefined;
+}

package/src/workflow-runtime.ts CHANGED Viewed

@@ -17,9 +17,16 @@ export interface WorkflowRuntimeDefaults {
 	thinking?: ThinkingLevel;
 }
+export interface WorkflowRuntimeThinkingResolution {
+	requested?: ThinkingLevel;
+	resolved?: ThinkingLevel;
+	reason?: string;
+}
 export interface WorkflowRuntimeResolutionInput {
 	model?: string;
 	thinking?: ThinkingLevel;
+	thinkingResolution?: WorkflowRuntimeThinkingResolution;
 }
 export interface WorkflowRuntimeResolutionContext {
@@ -39,6 +46,41 @@ export interface ResolveWorkflowRuntimeOptions {
 	prompt?: WorkflowRuntimePrompt;
 }
+export type WorkflowRuntimeLayer = WorkflowRuntimeDefaults | undefined;
+export function selectWorkflowRuntime(
+	...layers: WorkflowRuntimeLayer[]
+): WorkflowRuntimeResolutionInput {
+	const modelLayer = layers.find((layer) => modelOf(layer));
+	const model = modelOf(modelLayer);
+	let thinking: ThinkingLevel | undefined;
+	for (const layer of layers) {
+		if (!layer) continue;
+		if (layer.thinking) {
+			thinking = layer.thinking;
+			break;
+		}
+		const layerModel = modelOf(layer);
+		const modelThinking = layerModel
+			? splitKnownThinkingSuffix(layerModel).thinking
+			: undefined;
+		if (modelThinking) {
+			thinking = modelThinking;
+			break;
+		}
+	}
+	return {
+		...(model ? { model } : {}),
+		...(thinking ? { thinking } : {}),
+	};
+}
+function modelOf(layer: WorkflowRuntimeLayer): string | undefined {
+	return typeof layer?.model === "string" && layer.model.trim()
+		? layer.model.trim()
+		: undefined;
+}
 export function toWorkflowModelInfo(model: {
 	provider: string;
 	id: string;
@@ -66,7 +108,7 @@ export async function resolveWorkflowRuntime(
 	const model = await resolveModel(baseModel, context, options);
 	const effectiveThinking =
 		runtime.thinking ?? thinking ?? options.defaults?.thinking;
-	const resolvedThinking = await resolveThinking(
+	const thinkingResolution = await resolveThinking(
 		model,
 		effectiveThinking,
 		context,
@@ -74,7 +116,10 @@ export async function resolveWorkflowRuntime(
 	);
 	return {
 		...(model ? { model } : {}),
-		...(resolvedThinking ? { thinking: resolvedThinking } : {}),
+		...(thinkingResolution?.resolved
+			? { thinking: thinkingResolution.resolved }
+			: {}),
+		...(thinkingResolution ? { thinkingResolution } : {}),
 	};
 }
@@ -208,36 +253,63 @@ async function resolveThinking(
 	requested: ThinkingLevel | undefined,
 	context: WorkflowRuntimeResolutionContext,
 	options: ResolveWorkflowRuntimeOptions,
-): Promise<ThinkingLevel | undefined> {
+): Promise<WorkflowRuntimeThinkingResolution | undefined> {
 	if (!requested) return undefined;
 	const model = findModelInfo(modelId, options.availableModels ?? []);
 	const supported = getSupportedThinkingLevels(model);
-	if (supported.includes(requested)) return requested;
+	if (supported.includes(requested)) {
+		return { requested, resolved: requested };
+	}
-	if (!options.prompt) {
-		const modelLabel = modelId ?? "selected model";
+	if (supported.length === 0) {
 		throw new Error(
-			`${modelLabel} does not support reasoning level "${requested}" for ${context.taskKey}. Supported: ${supported.join(", ") || "none"}`,
+			`${modelId ?? "selected model"} does not expose any supported reasoning levels for ${context.taskKey}`,
 		);
 	}
-	if (supported.length === 0) {
+	const downgradeOptions = lowerOrEqualSupportedThinking(requested, supported);
+	if (downgradeOptions.length === 0) {
+		const modelLabel = modelId ?? "selected model";
 		throw new Error(
-			`${modelId ?? "selected model"} does not expose any supported reasoning levels for ${context.taskKey}`,
+			`${modelLabel} does not support reasoning level "${requested}" for ${context.taskKey}, and no lower-or-equal fallback is available. Supported: ${supported.join(", ") || "none"}`,
 		);
 	}
+	if (!options.prompt) {
+		const resolved = downgradeOptions[downgradeOptions.length - 1]!;
+		return {
+			requested,
+			resolved,
+			reason: `requested ${requested} is unsupported by ${modelId ?? "selected model"}; using ${resolved}`,
+		};
+	}
 	const selected = await options.prompt.select(
-		`${modelId ?? "Selected model"} does not support reasoning "${requested}" for ${context.taskKey}. Choose a supported level.`,
-		supported,
+		`${modelId ?? "Selected model"} does not support reasoning "${requested}" for ${context.taskKey}. Choose a supported lower-or-equal level.`,
+		downgradeOptions,
 	);
 	if (!selected)
 		throw new Error(`Reasoning selection cancelled for ${context.taskKey}`);
-	if (!isThinkingLevel(selected))
+	if (!isThinkingLevel(selected) || !downgradeOptions.includes(selected))
 		throw new Error(
 			`Invalid reasoning selection "${selected}" for ${context.taskKey}`,
 		);
-	return selected;
+	return {
+		requested,
+		resolved: selected,
+		reason: `selected supported reasoning ${selected} for unsupported request ${requested}`,
+	};
+}
+function lowerOrEqualSupportedThinking(
+	requested: ThinkingLevel,
+	supported: ThinkingLevel[],
+): ThinkingLevel[] {
+	const requestedIndex = THINKING_LEVELS.indexOf(requested);
+	if (requestedIndex < 0) return [];
+	return THINKING_LEVELS.slice(0, requestedIndex + 1).filter((level) =>
+		supported.includes(level),
+	);
 }
 function findModelInfo(