npm - @agwab/pi-workflow - Versions diffs - 0.2.1 → 0.4.0 - Mend

@agwab/pi-workflow 0.2.1 → 0.4.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (119)

package/README.md +3 -1
package/dist/artifact-graph-runtime.d.ts +1 -1
package/dist/artifact-graph-runtime.js +10 -5
package/dist/artifact-graph-schema.js +127 -5
package/dist/compiler.js +52 -19
package/dist/dynamic-generated-task-runtime.js +3 -1
package/dist/dynamic-profiles.d.ts +1 -1
package/dist/engine-run-graph.d.ts +3 -0
package/dist/engine-run-graph.js +194 -4
package/dist/engine.d.ts +5 -0
package/dist/engine.js +389 -41
package/dist/extension.d.ts +2 -1
package/dist/extension.js +30 -8
package/dist/index.d.ts +11 -3
package/dist/index.js +6 -1
package/dist/prompt-json.d.ts +7 -0
package/dist/prompt-json.js +13 -0
package/dist/roles.d.ts +1 -1
package/dist/roles.js +5 -8
package/dist/store.d.ts +20 -1
package/dist/store.js +139 -35
package/dist/strings.d.ts +11 -0
package/dist/strings.js +24 -0
package/dist/subagent-backend.js +710 -40
package/dist/types.d.ts +107 -1
package/dist/verification-ontology.d.ts +31 -0
package/dist/verification-ontology.js +66 -0
package/dist/workflow-artifact-tool.js +5 -6
package/dist/workflow-artifacts.d.ts +7 -0
package/dist/workflow-artifacts.js +55 -4
package/dist/workflow-fetch-cache-extension.d.ts +1 -0
package/dist/workflow-fetch-cache-extension.js +57 -9
package/dist/workflow-metrics.d.ts +113 -0
package/dist/workflow-metrics.js +272 -0
package/dist/workflow-output-artifacts.js +5 -3
package/dist/workflow-partial-output.d.ts +45 -0
package/dist/workflow-partial-output.js +205 -0
package/dist/workflow-progress-health.js +42 -10
package/dist/workflow-runtime.js +10 -1
package/dist/workflow-view.js +3 -1
package/dist/workflow-web-source-extension.js +194 -52
package/dist/workflow-web-source.d.ts +2 -1
package/dist/workflow-web-source.js +109 -30
package/docs/usage.md +76 -29
package/node_modules/@agwab/pi-subagent/README.md +3 -3
package/node_modules/@agwab/pi-subagent/api.mjs +1 -0
package/node_modules/@agwab/pi-subagent/docs/usage.md +63 -12
package/node_modules/@agwab/pi-subagent/package.json +2 -2
package/node_modules/@agwab/pi-subagent/src/api.ts +54 -1
package/node_modules/@agwab/pi-subagent/src/artifacts/registry.ts +9 -4
package/node_modules/@agwab/pi-subagent/src/artifacts/result.ts +8 -0
package/node_modules/@agwab/pi-subagent/src/core/constants.ts +9 -0
package/node_modules/@agwab/pi-subagent/src/core/validation.ts +21 -0
package/node_modules/@agwab/pi-subagent/src/index.ts +1046 -576
package/node_modules/@agwab/pi-subagent/src/orchestrate/async.ts +279 -156
package/node_modules/@agwab/pi-subagent/src/orchestrate/interrupt.ts +165 -89
package/node_modules/@agwab/pi-subagent/src/orchestrate/reconcile.ts +111 -65
package/node_modules/@agwab/pi-subagent/src/orchestrate/run-ref.ts +219 -0
package/node_modules/@agwab/pi-subagent/src/orchestrate/run.ts +88 -8
package/node_modules/@agwab/pi-subagent/src/orchestrate/status.ts +614 -298
package/node_modules/@agwab/pi-subagent/src/panel.ts +1356 -560
package/node_modules/@agwab/pi-subagent/src/runners/headless-model.ts +53 -5
package/node_modules/@agwab/pi-subagent/src/runners/tmux.ts +13 -6
package/package.json +2 -2
package/skills/workflow-guide/SKILL.md +1 -0
package/src/artifact-graph-runtime.ts +19 -13
package/src/artifact-graph-schema.ts +143 -3
package/src/cli.mjs +52 -0
package/src/compiler.ts +63 -18
package/src/dynamic-generated-task-runtime.ts +3 -1
package/src/dynamic-profiles.ts +1 -1
package/src/engine-run-graph.ts +246 -4
package/src/engine.ts +545 -38
package/src/extension.ts +36 -6
package/src/index.ts +52 -1
package/src/prompt-json.ts +13 -0
package/src/roles.ts +6 -9
package/src/store.ts +194 -42
package/src/strings.ts +38 -0
package/src/subagent-backend.ts +921 -62
package/src/types.ts +116 -2
package/src/verification-ontology.ts +88 -0
package/src/workflow-artifact-tool.ts +5 -7
package/src/workflow-artifacts.ts +83 -3
package/src/workflow-fetch-cache-extension.ts +78 -13
package/src/workflow-metrics.ts +478 -0
package/src/workflow-output-artifacts.ts +5 -3
package/src/workflow-partial-output.ts +299 -0
package/src/workflow-progress-health.ts +47 -15
package/src/workflow-runtime.ts +18 -2
package/src/workflow-view.ts +2 -1
package/src/workflow-web-source-extension.ts +654 -232
package/src/workflow-web-source.ts +153 -39
package/workflows/README.md +7 -25
package/workflows/deep-research/batched-verification.spec.json +253 -0
package/workflows/deep-research/helpers/batch-verification-candidates.mjs +136 -0
package/workflows/deep-research/helpers/claim-evidence-gate.mjs +229 -36
package/workflows/deep-research/helpers/final-audit-packet.mjs +1 -4
package/workflows/deep-research/helpers/normalize-input-packet.mjs +81 -2
package/workflows/deep-research/helpers/render-executive.mjs +40 -26
package/workflows/deep-research/helpers/sanitize-verification-candidates.mjs +89 -15
package/workflows/deep-research/helpers/shadow-select-verification.mjs +229 -0
package/workflows/deep-research/helpers/verification-ontology.mjs +77 -0
package/workflows/deep-research/schemas/deep-research-executive-render-control.schema.json +3 -3
package/workflows/deep-research/schemas/deep-research-research-questions-control.schema.json +38 -0
package/workflows/deep-research/schemas/deep-research-sanitize-claims-control.schema.json +63 -0
package/workflows/deep-research/schemas/deep-research-verify-claims-batch-control.schema.json +47 -0
package/workflows/deep-research/schemas/deep-research-verify-claims-control.schema.json +13 -3
package/workflows/deep-research/spec.json +32 -12
package/workflows/impact-review/spec.json +3 -3
package/workflows/spec-review/helpers/spec-review-pipeline.mjs +1 -8
package/dist/dynamic-loader.d.ts +0 -25
package/dist/dynamic-loader.js +0 -13
package/skills/workflow-guide/scaffolds/dag-required-reads/spec.json.validate.stderr +0 -0
package/skills/workflow-guide/scaffolds/dag-required-reads/spec.json.validate.stdout +0 -13
package/src/dynamic-loader.ts +0 -49
package/workflows/impact-review/schemas/docs-release-impact-control.schema.json +0 -42
package/workflows/impact-review/schemas/security-performance-impact-control.schema.json +0 -42
package/workflows/impact-review/schemas/state-data-impact-control.schema.json +0 -42

package/src/types.ts CHANGED

@@ -203,7 +203,14 @@ export interface ArtifactGraphStageSpec {
 	maxRuntimeMs?: number;
 	maxConcurrency?: number;
 	maxItems?: number;
-	from?: string | string[] | { source: string; path: string };
+	from?:
+		| string
+		| string[]
+		| {
+				source: string;
+				path: string;
+				streaming?: { enabled: true; minChunk?: number };
+		  };
 	after?: string | string[];
 	sourcePolicy?: "success" | "partial" | "require-success";
 	sourceProjection?: {
@@ -213,12 +220,14 @@ export interface ArtifactGraphStageSpec {
 	inputPolicy?: {
 		requiredReads?: string[];
 		enforcement?: "fail";
+		artifactAccess?: "enabled" | "none";
 	};
 	output?: {
 		controlSchema?: string;
 		analysis?: { required?: boolean };
 		refs?: { required?: boolean; minItems?: number };
 		maxDigestChars?: number;
+		partial?: { paths: string[] };
 	};
 	each?: Record<string, unknown>;
 	stages?: ArtifactGraphStageSpec[];
@@ -490,8 +499,10 @@ export interface CompiledArtifactGraphTask {
 		controlSchema?: string;
 		controlSchemaPath?: string;
 		maxDigestChars?: number;
+		partial?: { paths: string[] };
 	};
 	requiredReads: string[];
+	artifactAccess: "enabled" | "none";
 	sourceProjection?: {
 		include?: string[];
 		maxChars?: number;
@@ -542,6 +553,13 @@ export interface CompiledTask {
 		branchId?: string;
 		outputProfile?: string;
 	};
+	foreachGenerated?: {
+		placeholderSpecId: string;
+		itemHash?: string;
+		itemSourceSpecId?: string;
+		itemSourceKind?: "control" | "partial";
+		itemRef?: string;
+	};
 	loopChild?: CompiledLoopChildTaskRef;
 	loopPlaceholder?: {
 		loopId: string;
@@ -568,6 +586,89 @@ export type WorkflowRunStatus =
 	| "failed"
 	| "interrupted";
+export interface WorkflowTaskUsageValues {
+	inputTokens?: number | null;
+	outputTokens?: number | null;
+	totalTokens?: number | null;
+	cachedInputTokens?: number | null;
+	cacheCreationInputTokens?: number | null;
+	cacheReadInputTokens?: number | null;
+	reasoningTokens?: number | null;
+	costUsd?: number | null;
+}
+export interface WorkflowTaskUsageAttemptRecord
+	extends WorkflowTaskUsageValues {
+	source: string;
+	capturedAt: string;
+	provider?: string;
+	model?: string;
+	thinking?: ThinkingLevel | string;
+	backendRunId?: string;
+	backendAttemptId?: string;
+	unavailable?: true;
+	raw?: unknown;
+}
+export interface WorkflowTaskUsageAggregateRecord
+	extends WorkflowTaskUsageValues {
+	attempts: number;
+	incomplete?: boolean;
+}
+export interface WorkflowTaskUsageRecord extends WorkflowTaskUsageValues {
+	source: "pi-subagent";
+	capturedAt: string;
+	provider?: string;
+	model?: string;
+	thinking?: ThinkingLevel | string;
+	incomplete?: boolean;
+	aggregate?: WorkflowTaskUsageAggregateRecord;
+	attempts?: WorkflowTaskUsageAttemptRecord[];
+}
+export interface WorkflowTaskTimingAttemptRecord {
+	source: string;
+	capturedAt: string;
+	backendRunId?: string;
+	backendAttemptId?: string;
+	launchQueuedAt?: string;
+	launchStartedAt?: string;
+	launchCompletedAt?: string;
+	launchWaitMs?: number;
+	launchDurationMs?: number;
+	executionStartedAt?: string;
+	executionCompletedAt?: string;
+	executionMs?: number | null;
+	totalMs?: number;
+}
+export interface WorkflowTaskTimingAggregateRecord {
+	attempts: number;
+	launchWaitMs?: number | null;
+	launchDurationMs?: number | null;
+	executionMs?: number | null;
+	totalMs?: number | null;
+	incomplete?: boolean;
+}
+export interface WorkflowTaskTimingRecord {
+	source: "pi-workflow";
+	capturedAt: string;
+	launchQueuedAt?: string;
+	launchStartedAt?: string;
+	launchCompletedAt?: string;
+	launchWaitMs?: number;
+	launchDurationMs?: number;
+	launchSlotReleaseDelayMs?: number;
+	executionStartedAt?: string;
+	executionCompletedAt?: string;
+	executionMs?: number | null;
+	totalMs?: number;
+	aggregate?: WorkflowTaskTimingAggregateRecord;
+	attempts?: WorkflowTaskTimingAttemptRecord[];
+}
 export interface WorkflowTaskRunRecord {
 	taskId: string;
 	specId: string;
@@ -606,6 +707,8 @@ export interface WorkflowTaskRunRecord {
 	startedAt?: string;
 	completedAt?: string;
 	elapsedMs?: number;
+	usage?: WorkflowTaskUsageRecord;
+	timing?: WorkflowTaskTimingRecord;
 	exitCode?: number;
 	files: {
 		systemPrompt: string;
@@ -634,6 +737,13 @@ export interface WorkflowTaskRunRecord {
 		branchId?: string;
 		outputProfile?: string;
 	};
+	foreachGenerated?: {
+		placeholderSpecId: string;
+		itemHash?: string;
+		itemSourceSpecId?: string;
+		itemSourceKind?: "control" | "partial";
+		itemRef?: string;
+	};
 	launchRetry?: {
 		attempts: number;
 		maxAttempts?: number;
@@ -724,7 +834,11 @@ export interface WorkflowIndexRecord {
 		rootRunId?: string;
 		round?: number;
 		fanout?: unknown[];
-		tasks: Array<{
+		/**
+		 * Deprecated compatibility projection. New index writes omit task rows;
+		 * consumers that need task-level details should load runJson/run.json.
+		 */
+		tasks?: Array<{
 			taskId: string;
 			displayName: string;
 			agent: string;

package/src/verification-ontology.ts ADDED

@@ -0,0 +1,88 @@
+export const VERIFICATION_STATUS = Object.freeze({
+	VERIFIED: "verified",
+	PARTIALLY_SUPPORTED: "partially_supported",
+	UNSUPPORTED: "unsupported",
+	CONFLICTING: "conflicting",
+	VERIFICATION_BLOCKED: "verification_blocked",
+	UNVERIFIED: "unverified",
+} as const);
+export type VerificationStatus =
+	(typeof VERIFICATION_STATUS)[keyof typeof VERIFICATION_STATUS];
+export type TerminalVerificationStatus = Exclude<
+	VerificationStatus,
+	(typeof VERIFICATION_STATUS)["UNVERIFIED"]
+>;
+export const VERIFICATION_STATUS_VALUES = Object.freeze([
+	VERIFICATION_STATUS.VERIFIED,
+	VERIFICATION_STATUS.PARTIALLY_SUPPORTED,
+	VERIFICATION_STATUS.UNSUPPORTED,
+	VERIFICATION_STATUS.CONFLICTING,
+	VERIFICATION_STATUS.VERIFICATION_BLOCKED,
+] as const satisfies readonly TerminalVerificationStatus[]);
+export const VERIFICATION_STATUS_BUCKETS = Object.freeze({
+	[VERIFICATION_STATUS.VERIFIED]: "verified",
+	[VERIFICATION_STATUS.PARTIALLY_SUPPORTED]: "partiallySupported",
+	[VERIFICATION_STATUS.UNSUPPORTED]: "unsupported",
+	[VERIFICATION_STATUS.CONFLICTING]: "conflicting",
+	[VERIFICATION_STATUS.VERIFICATION_BLOCKED]: "verificationBlocked",
+} as const satisfies Record<TerminalVerificationStatus, string>);
+export const VERIFICATION_STATUS_LABELS = Object.freeze({
+	[VERIFICATION_STATUS.VERIFIED]: "verified",
+	[VERIFICATION_STATUS.PARTIALLY_SUPPORTED]: "partially supported",
+	[VERIFICATION_STATUS.UNSUPPORTED]: "unsupported",
+	[VERIFICATION_STATUS.CONFLICTING]: "conflicting",
+	[VERIFICATION_STATUS.VERIFICATION_BLOCKED]: "verification blocked",
+	[VERIFICATION_STATUS.UNVERIFIED]: "unverified",
+} as const satisfies Record<VerificationStatus, string>);
+export function canonicalVerificationStatus(
+	status: unknown,
+): VerificationStatus {
+	const text = String(status ?? "").trim();
+	if (!text) return VERIFICATION_STATUS.UNVERIFIED;
+	if (text === "partiallySupported") {
+		return VERIFICATION_STATUS.PARTIALLY_SUPPORTED;
+	}
+	if (text === "verificationBlocked" || text === "blocked") {
+		return VERIFICATION_STATUS.VERIFICATION_BLOCKED;
+	}
+	return Object.values(VERIFICATION_STATUS).includes(text as VerificationStatus)
+		? (text as VerificationStatus)
+		: VERIFICATION_STATUS.UNVERIFIED;
+}
+export function verificationStatusBucket(status: unknown): string {
+	const canonical = canonicalVerificationStatus(status);
+	return canonical in VERIFICATION_STATUS_BUCKETS
+		? VERIFICATION_STATUS_BUCKETS[canonical as TerminalVerificationStatus]
+		: "other";
+}
+export function isVerifiedStatus(status: unknown): boolean {
+	return canonicalVerificationStatus(status) === VERIFICATION_STATUS.VERIFIED;
+}
+export function isVerificationBlockedStatus(status: unknown): boolean {
+	return (
+		canonicalVerificationStatus(status) ===
+		VERIFICATION_STATUS.VERIFICATION_BLOCKED
+	);
+}
+const NON_VERIFIED_TERMINAL_STATUSES = new Set<VerificationStatus>([
+	VERIFICATION_STATUS.PARTIALLY_SUPPORTED,
+	VERIFICATION_STATUS.UNSUPPORTED,
+	VERIFICATION_STATUS.CONFLICTING,
+	VERIFICATION_STATUS.VERIFICATION_BLOCKED,
+]);
+export function isNonVerifiedTerminalStatus(status: unknown): boolean {
+	return NON_VERIFIED_TERMINAL_STATUSES.has(
+		canonicalVerificationStatus(status),
+	);
+}

package/src/workflow-artifact-tool.ts CHANGED

@@ -147,8 +147,7 @@ const WORKFLOW_ARTIFACT_KIND_SET = new Set<string>(WORKFLOW_ARTIFACT_KINDS);
 const DEFAULT_MAX_BYTES = 50 * 1024;
 const DEFAULT_MAX_LINES = 2000;
 const SOURCE_NAME_PATTERN = /^[A-Za-z0-9_.:-]+$/;
-const SIMPLE_JSON_PATH_PATTERN =
-	/^(\$|\$(\.[A-Za-z0-9_-]+(\[(\*|\d+|\d*:\d*)\])?)+)$/;
+const SIMPLE_JSON_PATH_PATTERN = /^(\$|\$(\.[A-Za-z0-9_-]+)+)$/;
 const JSON_PATH_SEGMENT_ALIASES: Record<string, string> = {
 	axes: "researchAxes",
 	claimVerdicts: "claimVerdictLedger",
@@ -466,15 +465,14 @@ async function readProjectedWorkflowArtifact(options: {
 		path: effectivePath,
 	});
 	const serialized = JSON.stringify(sliced.value, null, 2);
+	const maxChars = options.maxChars ?? DEFAULT_MAX_BYTES;
 	const preview =
-		options.maxChars !== undefined && serialized.length > options.maxChars
-			? serialized.slice(0, options.maxChars)
-			: serialized;
+		serialized.length > maxChars ? serialized.slice(0, maxChars) : serialized;
 	const projection: WorkflowArtifactProjectionMetadata = {
 		path: effectivePath,
 		valueType: jsonValueType(resolved),
 		...(options.maxItems === undefined ? {} : { maxItems: options.maxItems }),
-		...(options.maxChars === undefined ? {} : { maxChars: options.maxChars }),
+		maxChars,
 		...(sliced.totalItems === undefined
 			? {}
 			: { totalItems: sliced.totalItems }),
@@ -810,7 +808,7 @@ function normalizeProjectionPath(value: unknown): string | undefined {
 	if (path === undefined) return undefined;
 	if (!SIMPLE_JSON_PATH_PATTERN.test(path)) {
 		throw new Error(
-			"path must be $ or a simple dot JSON path like $.claims.items",
+			"path must be $ or a simple dot JSON path like $.claims.items; array selectors are not supported",
 		);
 	}
 	return path;

package/src/workflow-artifacts.ts CHANGED

@@ -9,6 +9,7 @@ interface WorkflowTelemetryAccumulator {
 	launchRetries: number;
 	resumeEvents: number;
 	resumedTasks: number;
+	contextLimitFailures: number;
 	retryReasons: WorkflowTelemetrySummary["retryReasons"];
 	resumeStatusCounts: StatusCounts;
 	outputRepairCounts: OutputRepairCounts;
@@ -18,6 +19,13 @@ export interface WorkflowTelemetrySummary {
 	taskCount: number;
 	wallClockMs: number | null;
 	statusCounts: StatusCounts;
+	completion: {
+		health: "clean" | "repaired" | "incomplete";
+		clean: boolean;
+		repaired: boolean;
+		repairEvents: number;
+		contextLimitFailures: number;
+	};
 	retryCounts: { output: number; launch: number };
 	retryReasons: {
 		output: Record<string, number>;
@@ -77,10 +85,23 @@ export function summarizeWorkflowTelemetry(
 		stage.outputBytes += taskOutputBytes;
 	}
+	const repairEvents =
+		accumulator.outputRetries +
+		accumulator.launchRetries +
+		accumulator.resumeEvents;
+	const health = completionHealth(tasks, repairEvents, accumulator);
 	return {
 		taskCount: tasks.length,
 		wallClockMs: durationBetween(run.createdAt, run.updatedAt),
 		statusCounts,
+		completion: {
+			health,
+			clean: health === "clean",
+			repaired: health === "repaired",
+			repairEvents,
+			contextLimitFailures: accumulator.contextLimitFailures,
+		},
 		retryCounts: {
 			output: accumulator.outputRetries,
 			launch: accumulator.launchRetries,
@@ -103,6 +124,7 @@ function createWorkflowTelemetryAccumulator(): WorkflowTelemetryAccumulator {
 		launchRetries: 0,
 		resumeEvents: 0,
 		resumedTasks: 0,
+		contextLimitFailures: 0,
 		retryReasons: { output: {}, launch: {} },
 		resumeStatusCounts: {},
 		outputRepairCounts: { sameSession: 0, newSession: 0, unknown: 0 },
@@ -113,6 +135,7 @@ function accumulateTaskReliability(
 	task: Partial<WorkflowTaskRunRecord>,
 	accumulator: WorkflowTelemetryAccumulator,
 ): void {
+	if (taskHasContextLimitFailure(task)) accumulator.contextLimitFailures += 1;
 	const currentOutputAttempts = positiveCount(task.outputRetry?.attempts);
 	accumulator.outputRetries += currentOutputAttempts;
 	if (currentOutputAttempts > 0) {
@@ -137,17 +160,40 @@ function accumulateTaskReliability(
 	for (const event of resumeEvents) accumulateResumeEvent(event, accumulator);
 }
+function completionHealth(
+	tasks: Array<Partial<WorkflowTaskRunRecord>>,
+	repairEvents: number,
+	accumulator: WorkflowTelemetryAccumulator,
+): WorkflowTelemetrySummary["completion"]["health"] {
+	const allCompleted =
+		tasks.length > 0 && tasks.every((task) => task.status === "completed");
+	if (!allCompleted) return "incomplete";
+	return repairEvents === 0 && accumulator.contextLimitFailures === 0
+		? "clean"
+		: "repaired";
+}
 function accumulateResumeEvent(
 	event: NonNullable<WorkflowTaskRunRecord["resumeEvents"]>[number],
 	accumulator: WorkflowTelemetryAccumulator,
 ): void {
 	accumulator.resumeStatusCounts[event.fromStatus] =
 		(accumulator.resumeStatusCounts[event.fromStatus] ?? 0) + 1;
+	if (resumeEventHasContextLimitFailure(event))
+		accumulator.contextLimitFailures += 1;
 	const previousOutputAttempts = positiveCount(event.outputRetryAttempts);
 	accumulator.outputRetries += previousOutputAttempts;
-	if (previousOutputAttempts === 0) return;
-	countReason(accumulator.retryReasons.output, event.outputRetryReason);
-	countRepairMode(accumulator.outputRepairCounts, event.outputRetryRepairMode);
+	if (previousOutputAttempts > 0) {
+		countReason(accumulator.retryReasons.output, event.outputRetryReason);
+		countRepairMode(
+			accumulator.outputRepairCounts,
+			event.outputRetryRepairMode,
+		);
+	}
+	const previousLaunchAttempts = positiveCount(event.launchRetryAttempts);
+	accumulator.launchRetries += previousLaunchAttempts;
+	if (previousLaunchAttempts > 0)
+		countReason(accumulator.retryReasons.launch, event.launchRetryReason);
 }
 function positiveCount(value: number | undefined): number {
@@ -172,6 +218,40 @@ function countRepairMode(
 	else counts.unknown += 1;
 }
+function taskHasContextLimitFailure(
+	task: Partial<WorkflowTaskRunRecord>,
+): boolean {
+	return [
+		task.statusDetail,
+		task.lastMessage,
+		task.outputRetry?.reason,
+		task.outputRetry?.message,
+		task.launchRetry?.reason,
+		task.launchRetry?.message,
+	].some(isContextLimitText);
+}
+function resumeEventHasContextLimitFailure(
+	event: NonNullable<WorkflowTaskRunRecord["resumeEvents"]>[number],
+): boolean {
+	return [
+		event.fromStatusDetail,
+		event.lastMessage,
+		event.outputRetryReason,
+		event.launchRetryReason,
+	].some(isContextLimitText);
+}
+function isContextLimitText(value: string | undefined): boolean {
+	const text = value?.toLowerCase() ?? "";
+	return (
+		text.includes("context_or_request_too_large") ||
+		/context (window|length)|maximum context|request too large|token limit/.test(
+			text,
+		)
+	);
+}
 export interface SourceContextPacket {
 	tasks: SourceContextTask[];
 	byStage: Record<

package/src/workflow-fetch-cache-extension.ts CHANGED

@@ -18,6 +18,7 @@ export interface WorkflowFetchCacheConfig {
 	runId: string;
 	taskId: string;
 	cacheDir: string;
+	maxInlineChars?: number;
 }
 export interface WorkflowFetchCacheExtensionWrapperOptions {
@@ -83,7 +84,7 @@ export function registerWorkflowFetchCacheExtension(
 	webAccessExtension: WebAccessExtension,
 	storage: WebAccessStorage,
 ): void {
-	let capturedFetchData: Record<string, unknown> | undefined;
+	const capturedFetchDataByResponseId = new Map<string, Record<string, unknown>>();
 	const adapter = new Proxy(pi, {
 		get(target, property, receiver) {
 			if (property === "registerTool") {
@@ -97,32 +98,43 @@ export function registerWorkflowFetchCacheExtension(
 						execute: async (toolCallId, params, signal, onUpdate) => {
 							const cacheKey = cacheKeyForParams(params);
 							if (!cacheKey) {
-								return await tool.execute!(
-									toolCallId,
-									params,
-									signal,
-									onUpdate,
+								return capFetchContentInlineResult(
+									await tool.execute!(
+										toolCallId,
+										params,
+										signal,
+										onUpdate,
+									),
+									config.maxInlineChars,
 								);
 							}
 							const hit = await readCacheRecord(config, cacheKey.key);
 							if (hit) {
 								await recordCacheEvent(config, "hit", cacheKey);
-								return materializeCacheHit(pi, storage, hit);
+								return capFetchContentInlineResult(
+									materializeCacheHit(pi, storage, hit),
+									config.maxInlineChars,
+								);
 							}
 							await recordCacheEvent(config, "miss", cacheKey);
-							capturedFetchData = undefined;
 							const result = await tool.execute!(
 								toolCallId,
 								params,
 								signal,
 								onUpdate,
 							);
-							const storedData = capturedFetchData;
-							capturedFetchData = undefined;
+							const responseId = stringValue(result.details?.responseId);
+							const storedData = responseId
+								? capturedFetchDataByResponseId.get(responseId)
+								: undefined;
+							if (responseId) capturedFetchDataByResponseId.delete(responseId);
 							const writeReason = cacheWriteSkipReason(result, storedData);
 							if (writeReason) {
 								await recordCacheEvent(config, "skip", cacheKey, writeReason);
-								return result;
+								return capFetchContentInlineResult(
+									result,
+									config.maxInlineChars,
+								);
 							}
 							await writeCacheRecord(config, {
 								schema: WORKFLOW_FETCH_CONTENT_CACHE_SCHEMA,
@@ -134,7 +146,10 @@ export function registerWorkflowFetchCacheExtension(
 								storedData: storedData!,
 							});
 							await recordCacheEvent(config, "write", cacheKey);
-							return withCacheDetails(result, { hit: false });
+							return capFetchContentInlineResult(
+								withCacheDetails(result, { hit: false }),
+								config.maxInlineChars,
+							);
 						},
 					});
 				};
@@ -142,7 +157,10 @@ export function registerWorkflowFetchCacheExtension(
 			if (property === "appendEntry") {
 				return (type: string, data: unknown) => {
 					if (type === "web-search-results" && isFetchStoredData(data)) {
-						capturedFetchData = cloneJsonObject(data);
+						const cloned = cloneJsonObject(data);
+						const responseId = stringValue(cloned?.id);
+						if (responseId && cloned)
+							capturedFetchDataByResponseId.set(responseId, cloned);
 					}
 					return pi.appendEntry?.(type, data);
 				};
@@ -300,6 +318,49 @@ function withCacheDetails(
 	};
 }
+function capFetchContentInlineResult(
+	result: ToolResult,
+	maxInlineChars: number | undefined,
+): ToolResult {
+	const maxChars = normalizeInlineCharCap(maxInlineChars);
+	if (maxChars === undefined || !Array.isArray(result.content)) return result;
+	let truncated = false;
+	const content = result.content.map((entry) => {
+		if (entry.type !== "text" || typeof entry.text !== "string")
+			return entry;
+		if (entry.text.length <= maxChars) return entry;
+		truncated = true;
+		return {
+			...entry,
+			text:
+				entry.text.slice(0, maxChars) +
+				`\n\n[Workflow inline fetch content capped at ${maxChars} chars; full source content remains in workflow source cache.]`,
+		};
+	});
+	if (!truncated) return result;
+	return {
+		...result,
+		content,
+		details: {
+			...(result.details ?? {}),
+			truncated: true,
+			workflowInlineContentCap: {
+				type: "fetch_content",
+				maxChars,
+				truncated: true,
+			},
+		},
+	};
+}
+function normalizeInlineCharCap(value: number | undefined): number | undefined {
+	if (value === undefined || !Number.isFinite(value)) return undefined;
+	const cap = Math.floor(value);
+	return cap > 0 ? cap : undefined;
+}
 function cacheWriteSkipReason(
 	result: ToolResult,
 	storedData: Record<string, unknown> | undefined,
@@ -366,6 +427,10 @@ function cloneJsonObject(value: unknown): Record<string, unknown> | undefined {
 	return JSON.parse(JSON.stringify(value)) as Record<string, unknown>;
 }
+function stringValue(value: unknown): string | undefined {
+	return typeof value === "string" && value ? value : undefined;
+}
 function isFetchStoredData(value: unknown): value is Record<string, unknown> {
 	return isRecord(value) && value.type === "fetch" && Array.isArray(value.urls);
 }