npm - pi-web-toolkit - Versions diffs - 0.1.1 → 0.2.0 - Mend

pi-web-toolkit 0.1.1 → 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (18)

package/README.md +89 -43
package/docs/agents/domain.md +51 -0
package/docs/agents/issue-tracker.md +22 -0
package/docs/agents/triage-labels.md +15 -0
package/docs/guide.md +1 -1
package/docs/tools.md +6 -2
package/extensions/utils/agent-browser.ts +179 -0
package/extensions/utils/cli-runner.ts +108 -0
package/extensions/utils/content-preview.ts +493 -0
package/extensions/utils/output-sink.ts +67 -0
package/extensions/utils/render-helpers.ts +77 -0
package/extensions/utils/scrapling.ts +39 -24
package/extensions/utils/tool-factory.ts +79 -0
package/extensions/web_batch_fetch.ts +155 -47
package/extensions/web_browse.ts +158 -256
package/extensions/web_fetch.ts +83 -42
package/extensions/web_search.ts +140 -56
package/package.json +9 -1

package/extensions/utils/scrapling.ts CHANGED

@@ -1,4 +1,4 @@
-import { spawn } from "node:child_process";
+import { runCLI } from "./cli-runner";
 /**
  * Run a scrapling CLI command with optional abort signal.
@@ -7,30 +7,45 @@ export function runScrapling(
   args: string[],
   signal?: AbortSignal,
 ): Promise<{ stdout: string; stderr: string; exitCode: number }> {
-  return new Promise((resolve) => {
-    const proc = spawn("scrapling", args, { shell: false, stdio: ["ignore", "pipe", "pipe"] });
-    let stdout = "";
-    let stderr = "";
+  return runCLI({ command: "scrapling", args, signal });
+}
+/**
+ * Run scrapling fetch with automatic fallback to HTTP GET on failure.
+ *
+ * @param url       Target URL
+ * @param tmpFile   Output markdown file path
+ * @param options   { selector?: string; stealthy?: boolean; noGetFallback?: boolean }
+ * @param signal    Optional AbortSignal
+ * @returns         { ok: true } or { ok: false, stderr: string }
+ */
+export async function runScraplingWithFallback(
+  url: string,
+  tmpFile: string,
+  options: { selector?: string; stealthy?: boolean; noGetFallback?: boolean },
+  signal?: AbortSignal,
+): Promise<{ ok: boolean; stderr?: string }> {
+  const cmd = options.stealthy ? "stealthy-fetch" : "fetch";
+  const args = ["extract", cmd, url, tmpFile, "--ai-targeted"];
+  if (options.selector) {
+    args.push("--css-selector", options.selector);
+  }
-    proc.stdout.on("data", (data) => {
-      stdout += data.toString();
-    });
-    proc.stderr.on("data", (data) => {
-      stderr += data.toString();
-    });
-    proc.on("close", (code, closeSignal) => {
-      const exitCode = code ?? 1;
-      const signalMessage = closeSignal ? `Process terminated by ${closeSignal}` : "";
-      resolve({ stdout, stderr: stderr || signalMessage, exitCode });
-    });
-    proc.on("error", (err) => resolve({ stdout, stderr: err.message, exitCode: 1 }));
+  const result = await runScrapling(args, signal);
+  if (result.exitCode === 0) {
+    return { ok: true };
+  }
-    if (signal) {
-      const kill = () => {
-        proc.kill("SIGTERM");
-      };
-      if (signal.aborted) kill();
-      else signal.addEventListener("abort", kill, { once: true });
+  if (!options.noGetFallback) {
+    const fallback = await runScrapling(
+      ["extract", "get", url, tmpFile, "--ai-targeted"],
+      signal,
+    );
+    if (fallback.exitCode === 0) {
+      return { ok: true };
     }
-  });
+    return { ok: false, stderr: result.stderr || fallback.stderr };
+  }
+  return { ok: false, stderr: result.stderr };
 }

package/extensions/utils/tool-factory.ts ADDED

@@ -0,0 +1,79 @@
+/**
+ * Tool factory — separates execution from TUI rendering
+ *
+ * Provides a defineWebTool helper that wraps tool definitions with
+ * consistent base behaviour, while letting each tool supply its own
+ * execution logic and optional custom renderers.
+ */
+import { defineTool, formatSize } from "@earendil-works/pi-coding-agent";
+import { Text } from "@earendil-works/pi-tui";
+/**
+ * Shared render utilities for custom renderResult implementations.
+ */
+export const RenderUtils = {
+  /** Truncate preview text to maxLen, adding ellipsis. */
+  truncatePreview(text: string, maxLen: number): string {
+    if (text.length <= maxLen) return text;
+    return text.slice(0, maxLen).replace(/\s+\S*$/, "") + "...";
+  },
+  /** Render the "Full output: path" line. */
+  fullOutputLine(path: string | undefined, theme: any): string {
+    return path ? `\n${theme.fg("accent", `Full output: ${path}`)}` : "";
+  },
+  /** Format a byte count using the shared formatter. */
+  formatBytes(bytes: number): string {
+    return formatSize(bytes);
+  },
+};
+/**
+ * Default renderCall implementation: shows tool name and first string argument.
+ */
+export function defaultRenderCall(name: string, args: Record<string, unknown>, theme: any): Text {
+  let text = theme.fg("toolTitle", theme.bold(`${name} `));
+  const firstString = Object.values(args).find((v) => typeof v === "string");
+  if (firstString) {
+    text += theme.fg("muted", firstString as string);
+  }
+  return new Text(text, 0, 0);
+}
+/**
+ * Default renderResult implementation: shows success and full output path.
+ */
+export function defaultRenderResult(
+  result: { content: Array<{ type: "text"; text: string }>; details?: unknown },
+  state: { expanded: boolean; isPartial: boolean },
+  theme: any,
+): Text {
+  if (state.isPartial) {
+    return new Text(theme.fg("warning", "Running..."), 0, 0);
+  }
+  const details = result.details as { fullOutputPath?: string } | undefined;
+  let text = theme.fg("success", "✓ Done");
+  if (state.expanded && details?.fullOutputPath) {
+    text += `\n${theme.fg("accent", `Full output: ${details.fullOutputPath}`)}`;
+  }
+  return new Text(text, 0, 0);
+}
+/**
+ * Register a web tool with consistent base behaviour.
+ *
+ * This is a thin wrapper around defineTool that applies default
+ * renderCall/renderResult when the tool does not supply its own.
+ *
+ * NOTE: The pi framework's TypeBox types make strict typing here difficult.
+ * Callers should rely on type inference at the call site.
+ */
+export function defineWebTool(def: any) {
+  return defineTool({
+    ...def,
+    renderCall: def.renderCall ?? ((args: any, theme: any) => defaultRenderCall(def.name, args, theme)),
+    renderResult: def.renderResult ?? ((result: any, state: any, theme: any) => defaultRenderResult(result, state, theme)),
+  });
+}

package/extensions/web_batch_fetch.ts CHANGED

@@ -14,7 +14,6 @@
 import {
   defineTool,
   type ExtensionAPI,
-  truncateHead,
   formatSize,
   DEFAULT_MAX_BYTES,
   DEFAULT_MAX_LINES,
@@ -24,7 +23,10 @@ import { Type, type Static } from "typebox";
 import * as fs from "node:fs";
 import * as os from "node:os";
 import * as path from "node:path";
-import { runScrapling } from "./utils/scrapling";
+import { runScraplingWithFallback } from "./utils/scrapling";
+import { extractPreview } from "./utils/content-preview";
+import { writeWithFallback } from "./utils/output-sink";
+import { abbreviateUrl, getErrorText, normalizeWhitespace } from "./utils/render-helpers";
 interface FetchTask {
   url: string;
@@ -37,18 +39,15 @@ async function fetchOne(
   stealthy: boolean,
   signal?: AbortSignal,
 ): Promise<{ url: string; content: string; size: number; ok: boolean; error?: string }> {
-  const cmd = stealthy ? "stealthy-fetch" : "fetch";
-  const args = ["extract", cmd, task.url, task.tmpFile, "--ai-targeted"];
-  if (selector) args.push("--css-selector", selector);
+  const { ok: fetchOk, stderr } = await runScraplingWithFallback(
+    task.url,
+    task.tmpFile,
+    { selector, stealthy },
+    signal,
+  );
-  const { stderr, exitCode } = await runScrapling(args, signal);
-  if (exitCode !== 0) {
-    // Fallback to GET
-    const fallback = await runScrapling(["extract", "get", task.url, task.tmpFile, "--ai-targeted"], signal);
-    if (fallback.exitCode !== 0) {
-      return { url: task.url, content: "", size: 0, ok: false, error: stderr || fallback.stderr };
-    }
+  if (!fetchOk) {
+    return { url: task.url, content: "", size: 0, ok: false, error: stderr };
   }
   try {
@@ -84,9 +83,9 @@ async function mapWithConcurrencyLimit<TIn, TOut>(
 export const WebBatchFetchParamsSchema = Type.Object({
   urls: Type.Array(Type.String(), {
-    description: "List of URLs to fetch (2–5 recommended)",
+    description: "List of URLs to fetch (2–5 recommended, max 15)",
     minItems: 1,
-    maxItems: 10,
+    maxItems: 15,
   }),
   selector: Type.Optional(Type.String({
     description: "CSS selector applied to ALL pages to extract only relevant content",
@@ -117,11 +116,12 @@ const webBatchFetchTool = defineTool({
   ].join(" "),
   promptSnippet: "Fetch multiple URLs in parallel for research",
   promptGuidelines: [
-    "Use web_batch_fetch when web_search returns multiple (2–5) relevant pages and the agent needs to read them all.",
+    "Use web_batch_fetch when web_search returns multiple (2–5) relevant pages and the agent needs to read them all at once.",
+    "Prefer web_batch_fetch over repeated web_fetch calls when reading multiple pages for comparison or synthesis.",
     "Use web_batch_fetch for cross-referencing sources, comparing implementations, or synthesizing research from multiple sites.",
     "For a single URL, always use web_fetch — it supports per-URL selectors and stealthy mode.",
     "If a page in the batch fails, the tool reports the error but continues with the others.",
-    "Keep batch sizes small (≤5) to avoid overwhelming the browser and token budget.",
+    "Keep batch sizes reasonable (≤8) to avoid overwhelming the browser and token budget.",
   ],
   parameters: WebBatchFetchParamsSchema,
@@ -132,17 +132,48 @@ const webBatchFetchTool = defineTool({
       tmpFile: path.join(tmpDir, `page-${i}.md`),
     }));
     let fullOutputPath: string | undefined;
+    const concurrency = Math.floor(Math.min(5, Math.max(1, params.max_concurrency ?? 3)));
-    try {
-      const concurrency = Math.floor(Math.min(5, Math.max(1, params.max_concurrency ?? 3)));
-      onUpdate?.({ content: [{ type: "text", text: `Fetching ${tasks.length} pages with concurrency ${concurrency}...` }], details: {} });
+    // Progress tracking for live UI updates
+    const progressItems = tasks.map((t) => ({
+      url: t.url,
+      status: "fetching" as "fetching" | "done" | "error",
+      size: 0,
+      error: "",
+    }));
+    const sendProgress = () => {
+      const completed = progressItems.filter((p) => p.status !== "fetching").length;
+      const succeeded = progressItems.filter((p) => p.status === "done").length;
+      const failed = progressItems.filter((p) => p.status === "error").length;
+      onUpdate?.({
+        content: [{ type: "text", text: `Fetching ${tasks.length} pages (${completed}/${tasks.length})...` }],
+        details: {
+          progress: {
+            total: tasks.length,
+            completed,
+            succeeded,
+            failed,
+            items: progressItems.map((p) => ({ ...p })),
+          },
+        },
+      });
+    };
+    sendProgress();
+    try {
       const results = await mapWithConcurrencyLimit(
         tasks,
         concurrency,
         (task, index) => {
-          onUpdate?.({ content: [{ type: "text", text: `Fetching ${task.url} (${index + 1}/${tasks.length})...` }], details: {} });
-          return fetchOne(task, params.selector, params.stealthy ?? false, signal);
+          return fetchOne(task, params.selector, params.stealthy ?? false, signal).then((res) => {
+            progressItems[index].status = res.ok ? "done" : "error";
+            progressItems[index].size = res.size;
+            progressItems[index].error = res.error || "";
+            sendProgress();
+            return res;
+          });
         },
       );
@@ -166,27 +197,24 @@ const webBatchFetchTool = defineTool({
       }
       const rawText = lines.join("\n");
-      const truncation = truncateHead(rawText, {
-        maxLines: DEFAULT_MAX_LINES,
-        maxBytes: DEFAULT_MAX_BYTES,
+      const sink = await writeWithFallback(rawText, {
+        tmpPrefix: "pi-web-batch-",
       });
+      fullOutputPath = sink.fullOutputPath;
-      let finalText = truncation.content;
-      if (truncation.truncated) {
-        const fullOutputDir = await fs.promises.mkdtemp(path.join(os.tmpdir(), "pi-web-batch-"));
-        fullOutputPath = path.join(fullOutputDir, "output.txt");
-        await fs.promises.writeFile(fullOutputPath, rawText, "utf-8");
-        finalText += `\n\n[Output truncated: ${truncation.outputLines} of ${truncation.totalLines} lines (${formatSize(truncation.outputBytes)} of ${formatSize(truncation.totalBytes)}). Full output saved to: ${fullOutputPath}]`;
-      }
-      onUpdate?.({ content: [{ type: "text", text: `Batch complete: ${successCount}/${results.length} succeeded` }], details: {} });
       return {
-        content: [{ type: "text", text: finalText }],
+        content: [{ type: "text", text: sink.text }],
         details: {
           urls: params.urls,
           succeeded: successCount,
           failed: results.length - successCount,
-          results: results.map((r) => ({ url: r.url, ok: r.ok, size: r.size })),
+          results: results.map((r) => ({
+            url: r.url,
+            ok: r.ok,
+            size: r.size,
+            preview: r.ok ? extractPreview(r.content, 200) : undefined,
+            error: r.error,
+          })),
           fullOutputPath,
         },
       };
@@ -206,40 +234,120 @@ const webBatchFetchTool = defineTool({
   renderCall(args, theme) {
     let text = theme.fg("toolTitle", theme.bold("web_batch_fetch "));
     text += theme.fg("muted", `${args.urls?.length ?? 0} URLs`);
+    if (args.max_concurrency) {
+      text += theme.fg("dim", ` concurrency=${args.max_concurrency}`);
+    }
     if (args.selector) {
       text += theme.fg("dim", ` selector=${args.selector}`);
     }
     return new Text(text, 0, 0);
   },
-  renderResult(result, { expanded, isPartial }, theme) {
+  renderResult(result, { expanded, isPartial }, theme, context) {
+    const isError = context?.isError ?? false;
     if (isPartial) {
+      const progress = (result.details as any)?.progress;
+      if (progress) {
+        const { total, completed, succeeded, failed, items } = progress;
+        const barWidth = 15;
+        const filled = Math.round((completed / total) * barWidth);
+        const bar = "█".repeat(filled) + "░".repeat(barWidth - filled);
+        let text = `${theme.fg("warning", "Batch fetching")}  [${theme.fg("accent", bar.slice(0, filled))}${theme.fg("dim", bar.slice(filled))}]  ${theme.fg("muted", `${completed}/${total}`)}`;
+        if (failed > 0) {
+          text += ` ${theme.fg("error", `(${failed} failed)`)}`;
+        }
+        for (const item of items) {
+          const icon = item.status === "done"
+            ? theme.fg("success", "✓")
+            : item.status === "error"
+              ? theme.fg("error", "✗")
+              : theme.fg("warning", "⏳");
+          let line = `\n  ${icon} ${theme.fg("dim", abbreviateUrl(item.url, 50))}`;
+          if (item.status === "done" && item.size > 0) {
+            line += theme.fg("muted", ` ${formatSize(item.size)}`);
+          } else if (item.status === "error" && item.error) {
+            const err = item.error.slice(0, 80);
+            line += theme.fg("dim", ` ${err}${item.error.length > 80 ? "..." : ""}`);
+          } else if (item.status === "fetching") {
+            line += theme.fg("muted", " fetching...");
+          }
+          text += line;
+        }
+        return new Text(text, 0, 0);
+      }
       return new Text(theme.fg("warning", "Batch fetching..."), 0, 0);
     }
     const details = result.details as {
       succeeded?: number;
       failed?: number;
       urls?: string[];
-      results?: Array<{ url: string; ok: boolean; size?: number }>;
+      results?: Array<{ url: string; ok: boolean; size?: number; preview?: string; error?: string }>;
       fullOutputPath?: string;
     } | undefined;
+    if (isError) {
+      const errText = getErrorText(result);
+      let text = theme.fg("error", "✗ Batch failed");
+      if (details?.urls) {
+        text += `  ${theme.fg("dim", `${details.urls.length} URLs`)}`;
+      }
+      text += `\n\n  ${theme.fg("toolOutput", errText)}`;
+      return new Text(text, 0, 0);
+    }
     const total = details?.urls?.length ?? 0;
     const ok = details?.succeeded ?? 0;
+    const failed = details?.failed ?? 0;
     let text = theme.fg("success", `✓ ${ok}/${total} fetched`);
-    if (details?.failed) {
-      text += theme.fg("error", ` (${details.failed} failed)`);
+    if (failed > 0) {
+      text += theme.fg("error", ` (${failed} failed)`);
     }
-    if (expanded && details?.results) {
-      for (const r of details.results) {
-        text += `\n  ${r.ok ? theme.fg("success", "✓") : theme.fg("error", "✗")} ${theme.fg("dim", r.url)}`;
-        if (r.size) {
-          text += theme.fg("muted", ` ${formatSize(r.size)}`);
+    if (!expanded) {
+      const successes = (details?.results ?? []).filter((r) => r.ok);
+      const top3 = successes.slice(0, 3);
+      for (let i = 0; i < top3.length; i++) {
+        const r = top3[i];
+        text += `\n  [${i + 1}] ${theme.fg("toolTitle", abbreviateUrl(r.url, 40))} ${theme.fg("muted", `(${formatSize(r.size ?? 0)})`)}`;
+        if (r.preview) {
+          const snippet = normalizeWhitespace(r.preview);
+          const short = snippet.length > 80 ? snippet.slice(0, 80).replace(/\s+\S*$/, "") + "..." : snippet;
+          text += `\n    ${theme.fg("muted", short)}`;
         }
       }
+      if (successes.length > 3) {
+        text += `\n  ${theme.fg("muted", `... and ${successes.length - 3} more (Ctrl+O for full list)`)}`;
+      }
     }
-    if (expanded && details?.fullOutputPath) {
-      text += `\n${theme.fg("dim", `Full output: ${details.fullOutputPath}`)}`;
+    if (expanded && details?.results) {
+      const successes = details.results.filter((r) => r.ok);
+      const failures = details.results.filter((r) => !r.ok);
+      for (let i = 0; i < successes.length; i++) {
+        const r = successes[i];
+        text += `\n[${i + 1}] ${theme.fg("toolTitle", abbreviateUrl(r.url))} ${theme.fg("muted", `| ${formatSize(r.size ?? 0)}`)}`;
+        if (r.preview) {
+          text += `\n    ${theme.fg("muted", normalizeWhitespace(r.preview))}`;
+        }
+        text += "\n";
+      }
+      if (failures.length > 0) {
+        text += `\n${theme.fg("error", "Failed:")}`;
+        for (const r of failures) {
+          text += `\n  ${theme.fg("error", "✗")} ${theme.fg("dim", r.url)} ${theme.fg("dim", r.error ?? "")}`;
+        }
+      }
+      if (details?.fullOutputPath) {
+        text += `\n\n${theme.fg("accent", `Full output: ${details.fullOutputPath}`)}`;
+      }
     }
     return new Text(text, 0, 0);
   },
 });