npm - @agwab/pi-workflow - Versions diffs - 0.2.1 → 0.4.0 - Mend

@agwab/pi-workflow 0.2.1 → 0.4.0

This diff shows the changes between publicly available versions of a package that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Files changed (119)

package/README.md +3 -1
package/dist/artifact-graph-runtime.d.ts +1 -1
package/dist/artifact-graph-runtime.js +10 -5
package/dist/artifact-graph-schema.js +127 -5
package/dist/compiler.js +52 -19
package/dist/dynamic-generated-task-runtime.js +3 -1
package/dist/dynamic-profiles.d.ts +1 -1
package/dist/engine-run-graph.d.ts +3 -0
package/dist/engine-run-graph.js +194 -4
package/dist/engine.d.ts +5 -0
package/dist/engine.js +389 -41
package/dist/extension.d.ts +2 -1
package/dist/extension.js +30 -8
package/dist/index.d.ts +11 -3
package/dist/index.js +6 -1
package/dist/prompt-json.d.ts +7 -0
package/dist/prompt-json.js +13 -0
package/dist/roles.d.ts +1 -1
package/dist/roles.js +5 -8
package/dist/store.d.ts +20 -1
package/dist/store.js +139 -35
package/dist/strings.d.ts +11 -0
package/dist/strings.js +24 -0
package/dist/subagent-backend.js +710 -40
package/dist/types.d.ts +107 -1
package/dist/verification-ontology.d.ts +31 -0
package/dist/verification-ontology.js +66 -0
package/dist/workflow-artifact-tool.js +5 -6
package/dist/workflow-artifacts.d.ts +7 -0
package/dist/workflow-artifacts.js +55 -4
package/dist/workflow-fetch-cache-extension.d.ts +1 -0
package/dist/workflow-fetch-cache-extension.js +57 -9
package/dist/workflow-metrics.d.ts +113 -0
package/dist/workflow-metrics.js +272 -0
package/dist/workflow-output-artifacts.js +5 -3
package/dist/workflow-partial-output.d.ts +45 -0
package/dist/workflow-partial-output.js +205 -0
package/dist/workflow-progress-health.js +42 -10
package/dist/workflow-runtime.js +10 -1
package/dist/workflow-view.js +3 -1
package/dist/workflow-web-source-extension.js +194 -52
package/dist/workflow-web-source.d.ts +2 -1
package/dist/workflow-web-source.js +109 -30
package/docs/usage.md +76 -29
package/node_modules/@agwab/pi-subagent/README.md +3 -3
package/node_modules/@agwab/pi-subagent/api.mjs +1 -0
package/node_modules/@agwab/pi-subagent/docs/usage.md +63 -12
package/node_modules/@agwab/pi-subagent/package.json +2 -2
package/node_modules/@agwab/pi-subagent/src/api.ts +54 -1
package/node_modules/@agwab/pi-subagent/src/artifacts/registry.ts +9 -4
package/node_modules/@agwab/pi-subagent/src/artifacts/result.ts +8 -0
package/node_modules/@agwab/pi-subagent/src/core/constants.ts +9 -0
package/node_modules/@agwab/pi-subagent/src/core/validation.ts +21 -0
package/node_modules/@agwab/pi-subagent/src/index.ts +1046 -576
package/node_modules/@agwab/pi-subagent/src/orchestrate/async.ts +279 -156
package/node_modules/@agwab/pi-subagent/src/orchestrate/interrupt.ts +165 -89
package/node_modules/@agwab/pi-subagent/src/orchestrate/reconcile.ts +111 -65
package/node_modules/@agwab/pi-subagent/src/orchestrate/run-ref.ts +219 -0
package/node_modules/@agwab/pi-subagent/src/orchestrate/run.ts +88 -8
package/node_modules/@agwab/pi-subagent/src/orchestrate/status.ts +614 -298
package/node_modules/@agwab/pi-subagent/src/panel.ts +1356 -560
package/node_modules/@agwab/pi-subagent/src/runners/headless-model.ts +53 -5
package/node_modules/@agwab/pi-subagent/src/runners/tmux.ts +13 -6
package/package.json +2 -2
package/skills/workflow-guide/SKILL.md +1 -0
package/src/artifact-graph-runtime.ts +19 -13
package/src/artifact-graph-schema.ts +143 -3
package/src/cli.mjs +52 -0
package/src/compiler.ts +63 -18
package/src/dynamic-generated-task-runtime.ts +3 -1
package/src/dynamic-profiles.ts +1 -1
package/src/engine-run-graph.ts +246 -4
package/src/engine.ts +545 -38
package/src/extension.ts +36 -6
package/src/index.ts +52 -1
package/src/prompt-json.ts +13 -0
package/src/roles.ts +6 -9
package/src/store.ts +194 -42
package/src/strings.ts +38 -0
package/src/subagent-backend.ts +921 -62
package/src/types.ts +116 -2
package/src/verification-ontology.ts +88 -0
package/src/workflow-artifact-tool.ts +5 -7
package/src/workflow-artifacts.ts +83 -3
package/src/workflow-fetch-cache-extension.ts +78 -13
package/src/workflow-metrics.ts +478 -0
package/src/workflow-output-artifacts.ts +5 -3
package/src/workflow-partial-output.ts +299 -0
package/src/workflow-progress-health.ts +47 -15
package/src/workflow-runtime.ts +18 -2
package/src/workflow-view.ts +2 -1
package/src/workflow-web-source-extension.ts +654 -232
package/src/workflow-web-source.ts +153 -39
package/workflows/README.md +7 -25
package/workflows/deep-research/batched-verification.spec.json +253 -0
package/workflows/deep-research/helpers/batch-verification-candidates.mjs +136 -0
package/workflows/deep-research/helpers/claim-evidence-gate.mjs +229 -36
package/workflows/deep-research/helpers/final-audit-packet.mjs +1 -4
package/workflows/deep-research/helpers/normalize-input-packet.mjs +81 -2
package/workflows/deep-research/helpers/render-executive.mjs +40 -26
package/workflows/deep-research/helpers/sanitize-verification-candidates.mjs +89 -15
package/workflows/deep-research/helpers/shadow-select-verification.mjs +229 -0
package/workflows/deep-research/helpers/verification-ontology.mjs +77 -0
package/workflows/deep-research/schemas/deep-research-executive-render-control.schema.json +3 -3
package/workflows/deep-research/schemas/deep-research-research-questions-control.schema.json +38 -0
package/workflows/deep-research/schemas/deep-research-sanitize-claims-control.schema.json +63 -0
package/workflows/deep-research/schemas/deep-research-verify-claims-batch-control.schema.json +47 -0
package/workflows/deep-research/schemas/deep-research-verify-claims-control.schema.json +13 -3
package/workflows/deep-research/spec.json +32 -12
package/workflows/impact-review/spec.json +3 -3
package/workflows/spec-review/helpers/spec-review-pipeline.mjs +1 -8
package/dist/dynamic-loader.d.ts +0 -25
package/dist/dynamic-loader.js +0 -13
package/skills/workflow-guide/scaffolds/dag-required-reads/spec.json.validate.stderr +0 -0
package/skills/workflow-guide/scaffolds/dag-required-reads/spec.json.validate.stdout +0 -13
package/src/dynamic-loader.ts +0 -49
package/workflows/impact-review/schemas/docs-release-impact-control.schema.json +0 -42
package/workflows/impact-review/schemas/security-performance-impact-control.schema.json +0 -42
package/workflows/impact-review/schemas/state-data-impact-control.schema.json +0 -42

package/dist/workflow-view.js CHANGED Viewed

@@ -953,12 +953,14 @@ function statusForSummary(summary) {
         return "running";
     if (summary.blocked > 0)
         return "blocked";
-    if (summary.failed > 0 || summary.interrupted > 0)
+    if (summary.failed > 0)
         return "failed";
     if (summary.pending > 0)
         return "pending";
     if (summary.total > 0 && summary.completed === summary.total)
         return "completed";
+    if (summary.interrupted > 0)
+        return "interrupted";
     return "interrupted";
 }
 function taskElapsed(task) {

package/dist/workflow-web-source-extension.js CHANGED Viewed

@@ -72,14 +72,26 @@ export function registerWorkflowWebSourceExtension(pi, config, providerExtension
         name: "workflow_web_fetch_source",
         description: "Fetch one or more URLs into the workflow web-source cache and return compact source cards with sourceRefs.",
         parameters: Type.Object({
-            url: Type.Optional(Type.String({ description: "Single URL to fetch into the workflow web-source cache." })),
-            urls: Type.Optional(Type.Array(Type.String(), { description: "Multiple URLs to fetch in one tool call. Prefer this over repeated fetch calls when caching several promising sources." })),
+            url: Type.Optional(Type.String({
+                description: "Single URL to fetch into the workflow web-source cache.",
+            })),
+            urls: Type.Optional(Type.Array(Type.String(), {
+                description: "Multiple URLs to fetch in one tool call. Prefer this over repeated fetch calls when caching several promising sources.",
+            })),
             sources: Type.Optional(Type.Array(Type.Object({
-                url: Type.String({ description: "URL to fetch into the workflow web-source cache." }),
+                url: Type.String({
+                    description: "URL to fetch into the workflow web-source cache.",
+                }),
                 title: Type.Optional(Type.String({ description: "Optional source title override." })),
-            }), { description: "Multiple URL/title objects to fetch in one tool call." })),
-            title: Type.Optional(Type.String({ description: "Optional source title override for single-url fetches." })),
-            titles: Type.Optional(Type.Array(Type.String(), { description: "Optional title overrides paired by index with urls." })),
+            }), {
+                description: "Multiple URL/title objects to fetch in one tool call.",
+            })),
+            title: Type.Optional(Type.String({
+                description: "Optional source title override for single-url fetches.",
+            })),
+            titles: Type.Optional(Type.Array(Type.String(), {
+                description: "Optional title overrides paired by index with urls.",
+            })),
         }),
         execute: async (toolCallId, params, signal, onUpdate, ctx) => {
             const batchRequested = fetchSourceBatchRequested(params);
@@ -101,8 +113,12 @@ export function registerWorkflowWebSourceExtension(pi, config, providerExtension
                         url: sanitizeUrlForModel(request.url),
                         status: typeof payload.status === "string" ? payload.status : "unknown",
                         ...(typeof payload.code === "string" ? { code: payload.code } : {}),
-                        ...(typeof payload.message === "string" ? { message: payload.message } : {}),
-                        ...(typeof card?.sourceRef === "string" ? { sourceRef: card.sourceRef } : {}),
+                        ...(typeof payload.message === "string"
+                            ? { message: payload.message }
+                            : {}),
+                        ...(typeof card?.sourceRef === "string"
+                            ? { sourceRef: card.sourceRef }
+                            : {}),
                         ...(card ? { cardIndex: cards.length - 1 } : {}),
                     });
                 }
@@ -159,10 +175,15 @@ export function registerWorkflowWebSourceExtension(pi, config, providerExtension
                 url: existing.redactedUrl,
                 visibleChars: budget.used,
             });
-            return toolResultFromJson({ status: "ok", tool: "workflow_web_fetch_source", card });
+            return toolResultFromJson({
+                status: "ok",
+                tool: "workflow_web_fetch_source",
+                card,
+            });
         }
         const fetchKey = sourceUrlCacheKey(fetchUrl);
-        const cachedFailure = fetchFailures.get(fetchKey) ?? await readDurableFetchFailure(config, fetchKey);
+        const cachedFailure = fetchFailures.get(fetchKey) ??
+            (await readDurableFetchFailure(config, fetchKey));
         if (cachedFailure) {
             fetchFailures.set(fetchKey, cachedFailure);
             await recordWorkflowWebSourceEvent(config, "fetch_negative_cache_hit", {
@@ -178,25 +199,43 @@ export function registerWorkflowWebSourceExtension(pi, config, providerExtension
             if (!source)
                 return result;
             sourceCache.set(source.sourceRef, source);
-            const card = buildWorkflowWebSourceCard({ source, policy, budget, duplicate: true });
+            const card = buildWorkflowWebSourceCard({
+                source,
+                policy,
+                budget,
+                duplicate: true,
+            });
             await recordWorkflowWebSourceEvent(config, "fetch_duplicate", {
                 sourceRef: source.sourceRef,
                 url: source.redactedUrl,
                 visibleChars: budget.used,
             });
-            return toolResultFromJson({ status: "ok", tool: "workflow_web_fetch_source", card });
+            return toolResultFromJson({
+                status: "ok",
+                tool: "workflow_web_fetch_source",
+                card,
+            });
         }
         const fetchPromise = withWorkflowWebFetchLock(config, fetchKey, signal, async () => {
             const lockedExisting = await findWorkflowWebSourceByUrl(config, fetchUrl);
             if (lockedExisting) {
                 sourceCache.set(lockedExisting.sourceRef, lockedExisting);
-                const card = buildWorkflowWebSourceCard({ source: lockedExisting, policy, budget, duplicate: true });
+                const card = buildWorkflowWebSourceCard({
+                    source: lockedExisting,
+                    policy,
+                    budget,
+                    duplicate: true,
+                });
                 await recordWorkflowWebSourceEvent(config, "fetch_duplicate", {
                     sourceRef: lockedExisting.sourceRef,
                     url: lockedExisting.redactedUrl,
                     visibleChars: budget.used,
                 });
-                return toolResultFromJson({ status: "ok", tool: "workflow_web_fetch_source", card });
+                return toolResultFromJson({
+                    status: "ok",
+                    tool: "workflow_web_fetch_source",
+                    card,
+                });
             }
             const lockedFailure = await readDurableFetchFailure(config, fetchKey);
             if (lockedFailure) {
@@ -221,7 +260,10 @@ export function registerWorkflowWebSourceExtension(pi, config, providerExtension
                     return await cachedFetchFailureResult(config, fetchFailures, fetchKey, {
                         code: "blocked_url",
                         message: "URL was blocked by workflow web-source security policy before content fetch.",
-                        extra: { reason: safeFetch.reason, url: sanitizeUrlForModel(safeFetch.url) },
+                        extra: {
+                            reason: safeFetch.reason,
+                            url: sanitizeUrlForModel(safeFetch.url),
+                        },
                         reason: safeFetch.reason,
                     });
                 }
@@ -311,10 +353,16 @@ export function registerWorkflowWebSourceExtension(pi, config, providerExtension
                 textChars: source.textChars,
                 visibleChars: budget.used,
             });
-            return toolResultFromJson({ status: "ok", tool: "workflow_web_fetch_source", card });
+            return toolResultFromJson({
+                status: "ok",
+                tool: "workflow_web_fetch_source",
+                card,
+            });
         }).catch(async (error) => {
             const message = error instanceof Error ? error.message : "workflow_web_fetch_failed";
-            const code = message === "fetch_lock_timeout" ? "fetch_lock_timeout" : "workflow_web_fetch_failed";
+            const code = message === "fetch_lock_timeout"
+                ? "fetch_lock_timeout"
+                : "workflow_web_fetch_failed";
             await recordWorkflowWebSourceEvent(config, "fetch_failed", {
                 url: sanitizeUrlForModel(fetchUrl),
                 code,
@@ -335,23 +383,47 @@ export function registerWorkflowWebSourceExtension(pi, config, providerExtension
         name: "workflow_web_source_read",
         description: "Read one or more narrow exact/fuzzy/term-matched snippets from a cached workflow web source by sourceRef.",
         parameters: Type.Object({
-            sourceRef: Type.String({ description: "Opaque sourceRef returned by workflow_web_fetch_source." }),
-            query: Type.Optional(Type.String({ description: "Exact or fuzzy text to locate in the cached source." })),
-            queries: Type.Optional(Type.Array(Type.String(), { description: "Multiple exact/fuzzy texts to locate in one cached source. Prefer this over repeated calls when reading several snippets from the same sourceRef." })),
-            exact: Type.Optional(Type.String({ description: "Exact text to locate in the cached source." })),
-            exactTexts: Type.Optional(Type.Array(Type.String(), { description: "Multiple exact texts to locate in one cached source." })),
-            claim: Type.Optional(Type.String({ description: "Claim to locate when the exact quote is not known. Use with terms for deterministic quote harvesting." })),
-            terms: Type.Optional(Type.Array(Type.String(), { description: "Important terms that should co-occur in the returned source window." })),
+            sourceRef: Type.String({
+                description: "Opaque sourceRef returned by workflow_web_fetch_source.",
+            }),
+            query: Type.Optional(Type.String({
+                description: "Exact or fuzzy text to locate in the cached source.",
+            })),
+            queries: Type.Optional(Type.Array(Type.String(), {
+                description: "Multiple exact/fuzzy texts to locate in one cached source. Prefer this over repeated calls when reading several snippets from the same sourceRef.",
+            })),
+            exact: Type.Optional(Type.String({
+                description: "Exact text to locate in the cached source.",
+            })),
+            exactTexts: Type.Optional(Type.Array(Type.String(), {
+                description: "Multiple exact texts to locate in one cached source.",
+            })),
+            claim: Type.Optional(Type.String({
+                description: "Claim to locate when the exact quote is not known. Use with terms for deterministic quote harvesting.",
+            })),
+            terms: Type.Optional(Type.Array(Type.String(), {
+                description: "Important terms that should co-occur in the returned source window.",
+            })),
             reads: Type.Optional(Type.Array(Type.Object({
                 query: Type.Optional(Type.String({ description: "Exact or fuzzy text to locate." })),
                 exact: Type.Optional(Type.String({ description: "Exact text to locate." })),
                 exactText: Type.Optional(Type.String({ description: "Exact text to locate." })),
                 text: Type.Optional(Type.String({ description: "Text to locate." })),
-                claim: Type.Optional(Type.String({ description: "Claim to locate when exact quote is unknown." })),
-                terms: Type.Optional(Type.Array(Type.String(), { description: "Important terms for deterministic quote harvesting." })),
-                maxChars: Type.Optional(Type.Number({ description: "Maximum visible snippet characters for this read." })),
-            }), { description: "Mixed batch reads for one sourceRef; each item can use query or claim+terms." })),
-            maxChars: Type.Optional(Type.Number({ description: "Maximum visible snippet characters per query." })),
+                claim: Type.Optional(Type.String({
+                    description: "Claim to locate when exact quote is unknown.",
+                })),
+                terms: Type.Optional(Type.Array(Type.String(), {
+                    description: "Important terms for deterministic quote harvesting.",
+                })),
+                maxChars: Type.Optional(Type.Number({
+                    description: "Maximum visible snippet characters for this read.",
+                })),
+            }), {
+                description: "Mixed batch reads for one sourceRef; each item can use query or claim+terms.",
+            })),
+            maxChars: Type.Optional(Type.Number({
+                description: "Maximum visible snippet characters per query.",
+            })),
         }),
         execute: async (_toolCallId, params) => {
             const sourceRef = stringParam(params, "sourceRef") ?? stringParam(params, "source_ref");
@@ -361,7 +433,9 @@ export function registerWorkflowWebSourceExtension(pi, config, providerExtension
             }
             const source = await readCachedWorkflowWebSource(sourceRef);
             if (!source) {
-                await recordWorkflowWebSourceEvent(config, "source_read_missing", { sourceRef });
+                await recordWorkflowWebSourceEvent(config, "source_read_missing", {
+                    sourceRef,
+                });
                 return errorToolResult("source_not_found", "No cached workflow web source exists for sourceRef.", {
                     sourceRef,
                 });
@@ -391,6 +465,7 @@ export function registerWorkflowWebSourceExtension(pi, config, providerExtension
                     missingTerms: read.missingTerms,
                     coverageRatio: read.coverageRatio,
                     candidateOnly: read.candidateOnly,
+                    truncated: read.truncated,
                     quote: status === "budget_exhausted" ? undefined : read.quote,
                     startOffset: read.startOffset,
                     endOffset: read.endOffset,
@@ -420,25 +495,33 @@ export function registerWorkflowWebSourceExtension(pi, config, providerExtension
                     missingTerms: result.missingTerms,
                     coverageRatio: result.coverageRatio,
                     candidateOnly: result.candidateOnly,
+                    truncated: result.truncated,
                     quote: result.status === "budget_exhausted" ? undefined : result.quote,
                     startOffset: result.startOffset,
                     endOffset: result.endOffset,
-                    budget: budgetSnapshot(result.status === "budget_exhausted"),
+                    budget: budgetSnapshot(result.status === "budget_exhausted" ||
+                        result.status === "truncated"),
                     next: result.status === "budget_exhausted"
                         ? "Visible web-source budget is exhausted for this task; cite the sourceRef as an evidence gap or use a smaller query in a fresh task."
-                        : undefined,
+                        : result.status === "truncated"
+                            ? "The matched web-source snippet was truncated by the visible budget or maxChars; use a smaller exact query or a fresh task if the full quote is required."
+                            : undefined,
                 });
             }
+            const hasBudgetExhaustedRead = results.some((result) => result.status === "budget_exhausted");
+            const hasTruncatedRead = results.some((result) => result.status === "truncated");
             return toolResultFromJson({
                 status: responseStatus,
                 tool: "workflow_web_source_read",
                 sourceRef,
                 url: source.redactedUrl,
                 results,
-                budget: budgetSnapshot(results.some((result) => result.status === "budget_exhausted")),
-                next: responseStatus === "budget_exhausted"
+                budget: budgetSnapshot(hasBudgetExhaustedRead || hasTruncatedRead),
+                next: hasBudgetExhaustedRead
                     ? "Visible web-source budget is exhausted for this task; cite missing quotes as evidence gaps or use smaller query batches in a fresh task."
-                    : undefined,
+                    : hasTruncatedRead
+                        ? "One or more matched web-source snippets were truncated by the visible budget or maxChars; use smaller exact queries or a fresh task if full quotes are required."
+                        : undefined,
             });
         },
     });
@@ -525,8 +608,8 @@ async function cachedFetchFailureResult(config, cache, key, failure) {
     }
     return errorToolResult(failure.code, failure.message, failure.extra);
 }
-const FETCH_LOCK_STALE_MS = 60_000;
-const FETCH_LOCK_WAIT_MS = 75_000;
+const FETCH_LOCK_STALE_MS = 4 * 60_000;
+const FETCH_LOCK_WAIT_MS = 5 * 60_000;
 async function withWorkflowWebFetchLock(config, key, signal, fn) {
     const release = await acquireWorkflowWebFetchLock(config, key, signal);
     try {
@@ -544,10 +627,11 @@ async function acquireWorkflowWebFetchLock(config, key, signal) {
         if (signal?.aborted)
             throw new Error("aborted");
         try {
+            const ownerId = `${process.pid}:${Date.now()}:${Math.random().toString(36).slice(2)}`;
             await mkdir(lockDir);
-            await writeFile(resolve(lockDir, "owner.json"), `${JSON.stringify({ pid: process.pid, createdAt: new Date().toISOString(), key }, null, 2)}\n`, "utf8");
+            await writeFile(resolve(lockDir, "owner.json"), `${JSON.stringify({ ownerId, pid: process.pid, createdAt: new Date().toISOString(), key }, null, 2)}\n`, "utf8");
             return async () => {
-                await rm(lockDir, { recursive: true, force: true });
+                await releaseWorkflowWebFetchLock(lockDir, ownerId);
             };
         }
         catch (error) {
@@ -561,6 +645,17 @@ async function acquireWorkflowWebFetchLock(config, key, signal) {
         }
     }
 }
+async function releaseWorkflowWebFetchLock(lockDir, ownerId) {
+    try {
+        const current = await readFetchLockOwner(lockDir);
+        if (current?.ownerId !== ownerId)
+            return;
+        await rm(lockDir, { recursive: true, force: true });
+    }
+    catch {
+        // Missing or unreadable lock will be retried by the caller.
+    }
+}
 async function removeStaleFetchLock(lockDir) {
     try {
         const current = await stat(lockDir);
@@ -572,6 +667,17 @@ async function removeStaleFetchLock(lockDir) {
         // Missing or unreadable lock will be retried by the caller.
     }
 }
+async function readFetchLockOwner(lockDir) {
+    try {
+        const parsed = JSON.parse(await readFile(resolve(lockDir, "owner.json"), "utf8"));
+        return isRecord(parsed) && typeof parsed.ownerId === "string"
+            ? { ownerId: parsed.ownerId }
+            : undefined;
+    }
+    catch {
+        return undefined;
+    }
+}
 async function readDurableFetchFailure(config, key) {
     try {
         const parsed = JSON.parse(await readFile(fetchFailurePath(config, key), "utf8"));
@@ -596,7 +702,9 @@ function normalizeFetchFailure(value) {
         message: value.message,
         extra,
         ...(typeof value.reason === "string" ? { reason: value.reason } : {}),
-        ...(typeof value.createdAt === "string" ? { createdAt: value.createdAt } : {}),
+        ...(typeof value.createdAt === "string"
+            ? { createdAt: value.createdAt }
+            : {}),
     };
 }
 function fetchLockPath(config, key) {
@@ -621,7 +729,9 @@ function shouldCacheFetchFailure(reason) {
         reason === "unsupported_content_type");
 }
 function shouldCacheFetchFailureInMemory(reason) {
-    return reason === "empty_source" || reason === "dns_resolution_failed" || reason.includes("ENOTFOUND");
+    return (reason === "empty_source" ||
+        reason === "dns_resolution_failed" ||
+        reason.includes("ENOTFOUND"));
 }
 const WORKFLOW_WEB_FETCH_TIMEOUT_MS = 30_000;
 const WORKFLOW_WEB_FETCH_MAX_CHARS = 1_000_000;
@@ -636,12 +746,20 @@ async function safeFetchWorkflowWebText(url, security, signal) {
             return response;
         if (response.status >= 300 && response.status < 400) {
             if (!response.location)
-                return { ok: false, reason: "redirect_without_location", url: checked.normalizedUrl };
+                return {
+                    ok: false,
+                    reason: "redirect_without_location",
+                    url: checked.normalizedUrl,
+                };
             current = new URL(response.location, checked.normalizedUrl).href;
             continue;
         }
         if (response.status < 200 || response.status >= 300) {
-            return { ok: false, reason: `http_${response.status}`, url: checked.normalizedUrl };
+            return {
+                ok: false,
+                reason: `http_${response.status}`,
+                url: checked.normalizedUrl,
+            };
         }
         const extracted = extractWorkflowWebResponseText(response.text, response.contentType);
         return {
@@ -675,13 +793,17 @@ function safeFetchOnce(url, security, signal) {
                 lookupPublicAddress(hostname, security)
                     .then((address) => {
                     if (isLookupAllOptions(options)) {
-                        callback(null, [{ address: address.address, family: address.family }]);
+                        callback(null, [
+                            { address: address.address, family: address.family },
+                        ]);
                         return;
                     }
                     callback(null, address.address, address.family);
                 })
                     .catch((error) => {
-                    const reason = error instanceof Error ? error.message : "dns_resolution_failed";
+                    const reason = error instanceof Error
+                        ? error.message
+                        : "dns_resolution_failed";
                     callback(new Error(reason), "", 4);
                 });
             },
@@ -693,7 +815,10 @@ function safeFetchOnce(url, security, signal) {
                 ? res.headers["content-type"][0]
                 : res.headers["content-type"];
             const status = res.statusCode ?? 0;
-            if (status >= 200 && status < 300 && contentType && !isWorkflowWebTextContentType(contentType)) {
+            if (status >= 200 &&
+                status < 300 &&
+                contentType &&
+                !isWorkflowWebTextContentType(contentType)) {
                 res.resume();
                 settle({ ok: false, reason: "unsupported_content_type", url });
                 return;
@@ -772,7 +897,10 @@ async function validateResolvedHost(url, security) {
         return { ok: false, reason: "invalid_url", url };
     }
     try {
-        const addresses = await lookup(parsed.hostname, { all: true, verbatim: true });
+        const addresses = await lookup(parsed.hostname, {
+            all: true,
+            verbatim: true,
+        });
         for (const address of addresses) {
             const reason = privateIpReason(address.address);
             if (reason)
@@ -800,7 +928,8 @@ function privateIpReason(address) {
     }
     if (isIP(lower) === 4) {
         const parts = lower.split(".").map((part) => Number(part));
-        if (parts.length !== 4 || parts.some((part) => !Number.isInteger(part) || part < 0 || part > 255))
+        if (parts.length !== 4 ||
+            parts.some((part) => !Number.isInteger(part) || part < 0 || part > 255))
             return "private_host_blocked";
         const [a, b, c, d] = parts;
         if (a === 0 || a === 10 || a === 127 || a >= 224)
@@ -961,7 +1090,9 @@ function fetchSourceRequestsFromParams(params) {
     const titles = Array.isArray(params.titles) ? params.titles : [];
     if (Array.isArray(params.sources)) {
         for (const source of params.sources) {
-            if (!isRecord(source) || typeof source.url !== "string" || !source.url.trim())
+            if (!isRecord(source) ||
+                typeof source.url !== "string" ||
+                !source.url.trim())
                 continue;
             requests.push({
                 url: source.url.trim(),
@@ -978,7 +1109,9 @@ function fetchSourceRequestsFromParams(params) {
             const title = titles[index];
             requests.push({
                 url: url.trim(),
-                ...(typeof title === "string" && title.trim() ? { title: title.trim() } : {}),
+                ...(typeof title === "string" && title.trim()
+                    ? { title: title.trim() }
+                    : {}),
             });
         }
     }
@@ -1086,12 +1219,18 @@ function dedupeSourceReadRequests(requests) {
     return deduped;
 }
 function sourceReadBatchRequested(params) {
-    return ((isRecord(params) && Array.isArray(params.reads) && params.reads.length > 0) ||
+    return ((isRecord(params) &&
+        Array.isArray(params.reads) &&
+        params.reads.length > 0) ||
         stringArrayParam(params, "queries").length > 0 ||
         stringArrayParam(params, "exactTexts").length > 0 ||
         stringArrayParam(params, "texts").length > 0);
 }
 function sourceReadResponseStatus(read) {
+    if (read.status === "truncated" && !read.quote)
+        return "budget_exhausted";
+    if (read.status === "truncated")
+        return "truncated";
     if (read.status === "matched" && !read.quote)
         return "budget_exhausted";
     if (read.status === "matched" && read.candidateOnly)
@@ -1105,6 +1244,8 @@ function aggregateSourceReadStatus(statuses) {
         return "ok";
     if (statuses.every((status) => status === "candidate"))
         return "candidate";
+    if (statuses.every((status) => status === "truncated"))
+        return "truncated";
     if (statuses.every((status) => status === "not_found"))
         return "not_found";
     if (statuses.every((status) => status === "budget_exhausted"))
@@ -1140,7 +1281,8 @@ function isWorkflowWebTextContentType(contentType) {
     return /^(text\/|application\/(json|xml|xhtml\+xml|ld\+json)|[^;]+\+json\b|[^;]+\+xml\b)/i.test(contentType.trim());
 }
 function extractWorkflowWebResponseText(text, contentType) {
-    const looksHtml = /html/i.test(contentType ?? "") || /<html[\s>]|<body[\s>]|<title[\s>]/i.test(text);
+    const looksHtml = /html/i.test(contentType ?? "") ||
+        /<html[\s>]|<body[\s>]|<title[\s>]/i.test(text);
     if (!looksHtml) {
         return { text, title: titleFromPlainText(text) };
     }

package/dist/workflow-web-source.d.ts CHANGED Viewed

@@ -67,7 +67,7 @@ export interface WorkflowWebSourceReadRequest {
     maxChars?: number;
 }
 export interface WorkflowWebSourceReadResult {
-    status: "matched" | "not_found";
+    status: "matched" | "truncated" | "not_found";
     matchType?: "exact" | "normalized" | "terms";
     quote?: string;
     startOffset?: number;
@@ -77,6 +77,7 @@ export interface WorkflowWebSourceReadResult {
     missingTerms?: string[];
     coverageRatio?: number;
     candidateOnly?: boolean;
+    truncated?: boolean;
 }
 export interface WorkflowWebSourceCard {
     sourceRef: string;