npm - @demigodmode/pi-web-agent - Versions diffs - 1.2.0 → 1.3.0 - Mend

@demigodmode/pi-web-agent 1.2.0 → 1.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (16) hide show

package/CHANGELOG.md +16 -0
package/README.md +4 -4
package/dist/backends/doctor.js +3 -0
package/dist/fetch/headless-fetch.d.ts +2 -1
package/dist/fetch/headless-fetch.js +11 -7
package/dist/orchestration/candidate-selector.d.ts +2 -1
package/dist/orchestration/candidate-selector.js +28 -9
package/dist/orchestration/direct-url.d.ts +1 -0
package/dist/orchestration/direct-url.js +47 -0
package/dist/orchestration/index.js +5 -1
package/dist/orchestration/research-orchestrator.d.ts +5 -2
package/dist/orchestration/research-orchestrator.js +97 -27
package/dist/orchestration/research-worker.js +3 -13
package/dist/orchestration/source-profile.d.ts +8 -0
package/dist/orchestration/source-profile.js +60 -0
package/package.json +2 -2

package/CHANGELOG.md CHANGED Viewed

@@ -18,6 +18,22 @@ The format is intentionally simple and release-oriented.
 ### Breaking
 - None.
+## [1.3.0] - 2026-06-04
+### Added
+- Added direct URL handling in `web_explore` so linked pages are read before search results.
+- Added forum/thread source classification for Reddit-style discussions, forums, Stack Overflow, and GitHub issues/discussions.
+- Added Playwright-managed Chromium fallback when no local Chromium-family browser is detected.
+### Changed
+- Discussion-oriented queries now prefer forum/thread results over generic pages.
+- `/web-agent doctor` now reports the local-browser headless backend and managed Chromium fallback.
+### Fixed
+- Preserved direct/thread fetch gaps in bounded research results so unreadable thread sources get explicit caveats.
+### Breaking
+- None.
 ## [1.2.0] - 2026-06-01
 ### Added
 - Added backend provider and fallback editing to `/web-agent settings`.

package/README.md CHANGED Viewed

@@ -8,7 +8,7 @@
 Most agent web tools blur search, fetch, browser rendering, and research into one vague thing. `pi-web-agent` exposes one public research tool, `web_explore`, and keeps search/fetch/headless work inside that bounded workflow.
-The point is keeping the model-facing boundary simple: ask `web_explore` to research a question, and it handles discovery, HTTP reads, targeted browser rendering, source ranking, and caveats internally.
+The point is keeping the model-facing boundary simple: ask `web_explore` to research a question, and it handles direct links, discovery, HTTP reads, targeted browser rendering, source ranking, and caveats internally.
 That sounds obvious, but a lot of agent tooling gets fuzzy right there. This package is meant to be stricter about what it actually did and more willing to say when a read was not good enough to trust.
@@ -20,9 +20,9 @@ Compatibility notice: current `pi-web-agent` requires Pi 0.74+ because Pi packag
 pi install npm:@demigodmode/pi-web-agent
 ```
-After installing, reload or restart Pi. Run `/web-agent` for the action menu, or `/web-agent doctor` to check whether the package loaded cleanly and whether headless rendering can find a browser.
+After installing, reload or restart Pi. Run `/web-agent` for the action menu, or `/web-agent doctor` to check whether the package loaded cleanly and which web backends are configured.
-Headless rendering currently requires a detectable Chromium-family browser: Chrome, Chromium, Edge, or Brave. Firefox/Safari-only systems can still use search and plain HTTP reads, but browser-rendered fallback pages need a supported Chromium-family browser for now.
+Headless rendering first tries a detectable Chromium-family browser: Chrome, Chromium, Edge, or Brave. If none is found, it falls back to Playwright-managed Chromium and still launches headless. Firefox/Safari-only systems can still use search and plain HTTP reads; browser-rendered fallback uses Chromium.
 Later on, update installed packages with:
@@ -109,7 +109,7 @@ Example:
 }
 ```
-Backend config is also supported. Defaults remain DuckDuckGo search, plain HTTP fetch, and local browser headless fallback.
+Backend config is also supported. Defaults remain DuckDuckGo search, plain HTTP fetch, and local-browser headless fallback with managed Chromium fallback configured.
 Backend settings can be changed from:

package/dist/backends/doctor.js CHANGED Viewed

@@ -83,5 +83,8 @@ export async function checkBackendHealth(config, { fetchImpl = fetch, timeoutMs
     if (config.fetch.fallback) {
         lines.push(`fetch fallback: ${config.fetch.fallback}`);
     }
+    if (config.headless.provider === 'local-browser') {
+        lines.push('headless backend: local-browser (managed Chromium fallback configured)');
+    }
     return lines;
 }

package/dist/fetch/headless-fetch.d.ts CHANGED Viewed

@@ -6,7 +6,8 @@ export declare function headlessFetch(url: string, { configuredPath, resolveBrow
         configuredPath?: string;
     }) => Promise<BrowserResolutionResult>;
     launchBrowser?: (options: {
-        executablePath: string;
+        executablePath?: string;
+        headless: true;
     }) => Promise<{
         newContext: () => Promise<{
             newPage: () => Promise<any>;

package/dist/fetch/headless-fetch.js CHANGED Viewed

@@ -1,4 +1,4 @@
-import { chromium } from 'playwright-core';
+import { chromium } from 'playwright';
 import { extractReadableContentSafely } from '../extract/readability.js';
 import { resolveBrowserExecutable } from './browser-resolution.js';
 function cleanupRenderedText(text) {
@@ -7,9 +7,9 @@ function cleanupRenderedText(text) {
     cleaned = cleaned.replace(/\s+/g, ' ').trim();
     return cleaned;
 }
-export async function headlessFetch(url, { configuredPath, resolveBrowser = (options) => resolveBrowserExecutable({ configuredPath: options?.configuredPath }), launchBrowser = ({ executablePath }) => chromium.launch({ executablePath, headless: true }), now = () => Date.now() } = {}) {
+export async function headlessFetch(url, { configuredPath, resolveBrowser = (options) => resolveBrowserExecutable({ configuredPath: options?.configuredPath }), launchBrowser = ({ executablePath, headless }) => chromium.launch(executablePath ? { executablePath, headless } : { headless }), now = () => Date.now() } = {}) {
     const resolved = await resolveBrowser({ configuredPath });
-    if (!resolved.ok) {
+    if (!resolved.ok && resolved.error.code === 'CONFIGURED_BROWSER_NOT_FOUND') {
         return {
             status: 'error',
             url,
@@ -17,11 +17,15 @@ export async function headlessFetch(url, { configuredPath, resolveBrowser = (opt
             error: resolved.error
         };
     }
+    const browserName = resolved.ok ? resolved.browser : 'chromium';
+    const launchOptions = resolved.ok
+        ? { executablePath: resolved.executablePath, headless: true }
+        : { headless: true };
     let browser;
     let context;
     let page;
     try {
-        browser = await launchBrowser({ executablePath: resolved.executablePath });
+        browser = await launchBrowser(launchOptions);
         context = await browser.newContext();
         page = await context.newPage();
         const startedAt = now();
@@ -42,7 +46,7 @@ export async function headlessFetch(url, { configuredPath, resolveBrowser = (opt
                 metadata: {
                     method: 'headless',
                     cacheHit: false,
-                    browser: resolved.browser,
+                    browser: browserName,
                     navigationMs: finishedAt - startedAt
                 },
                 error: {
@@ -58,7 +62,7 @@ export async function headlessFetch(url, { configuredPath, resolveBrowser = (opt
             metadata: {
                 method: 'headless',
                 cacheHit: false,
-                browser: resolved.browser,
+                browser: browserName,
                 navigationMs: finishedAt - startedAt,
                 truncated: cleanedContent.text.length >= 4000
             }
@@ -71,7 +75,7 @@ export async function headlessFetch(url, { configuredPath, resolveBrowser = (opt
             metadata: {
                 method: 'headless',
                 cacheHit: false,
-                browser: resolved.browser
+                browser: browserName
             },
             error: {
                 code: 'HEADLESS_NAVIGATION_FAILED',

package/dist/orchestration/candidate-selector.d.ts CHANGED Viewed

@@ -1,5 +1,6 @@
 import type { SearchResult } from '../types.js';
-export declare function selectCandidates({ results, seenUrls, maxCandidates }: {
+export declare function selectCandidates({ query, results, seenUrls, maxCandidates }: {
+    query?: string;
     results: SearchResult[];
     seenUrls: Set<string>;
     maxCandidates: number;

package/dist/orchestration/candidate-selector.js CHANGED Viewed

@@ -1,16 +1,35 @@
-function candidateScore(result) {
+import { classifySourceProfile } from './source-profile.js';
+/**
+ * Reports whether the query text contains one of the discussion keywords
+ * (case-insensitive substring match). A missing query counts as "no".
+ */
+function wantsDiscussionSources(query = '') {
+    const discussionHint = /reddit|forum|forums|discussion|thread|comments|community|user experience|people recommend/i;
+    return discussionHint.test(query);
+}
+function candidateScore(result, query) {
     const url = result.url.toLowerCase();
-    if (url.includes('playwright.dev/docs') || url.includes('vitest.dev/guide') || url.includes('learn.microsoft.com'))
+    const profile = classifySourceProfile(result.url);
+    const wantsThreads = wantsDiscussionSources(query);
+    if (profile.kind === 'official-docs')
         return 0;
-    if (url.includes('github.com/') && (url.includes('/issues/') || url.includes('/discussions/')))
+    if (profile.kind === 'official-api')
         return 1;
-    if (url.includes('github.com/'))
+    if (wantsThreads) {
+        if (profile.kind === 'forum-thread')
+            return 2;
+        if (profile.kind === 'issue-thread')
+            return 3;
+        if (url.includes('github.com/'))
+            return 4;
+        if (profile.kind === 'package-page')
+            return 6;
+        return 5;
+    }
+    if (profile.kind === 'issue-thread')
         return 2;
-    if (url.includes('npmjs.com/package/'))
-        return 4;
-    return 3;
+    if (url.includes('github.com/'))
+        return 3;
+    if (profile.kind === 'package-page')
+        return 5;
+    return 4;
 }
-export function selectCandidates({ results, seenUrls, maxCandidates }) {
+export function selectCandidates({ query, results, seenUrls, maxCandidates }) {
     const deduped = new Map();
     for (const result of results) {
         if (seenUrls.has(result.url))
@@ -19,6 +38,6 @@ export function selectCandidates({ results, seenUrls, maxCandidates }) {
             deduped.set(result.url, result);
     }
     return [...deduped.values()]
-        .sort((left, right) => candidateScore(left) - candidateScore(right))
+        .sort((left, right) => candidateScore(left, query) - candidateScore(right, query))
         .slice(0, maxCandidates);
 }

package/dist/orchestration/direct-url.d.ts ADDED Viewed

	@@ -0,0 +1 @@
1	+ export declare function extractDirectUrls(query: string): string[];

package/dist/orchestration/direct-url.js ADDED Viewed

@@ -0,0 +1,47 @@
+// Query-string keys treated as tracking noise. Lookups are done with the
+// lowercased parameter name, so entries are kept lowercase.
+const TRACKING_PARAMS = new Set([
+    'utm_source', 'utm_medium', 'utm_campaign', 'utm_term',
+    'utm_content', 'utm_name', 'fbclid', 'gclid'
+]);
+/**
+ * Removes punctuation that trails a URL candidate lifted out of free text,
+ * such as the period ending a sentence or a bracket closing a parenthetical.
+ *
+ * A trailing ')' is kept when it closes a '(' that is part of the URL itself
+ * (for example `.../wiki/Foo_(bar)`); it is stripped only while the candidate
+ * holds more ')' than '('. The previous guard compared lastIndexOf('(') with
+ * lastIndexOf(')'), which can never succeed when ')' is the final character,
+ * so balanced URLs lost their closing paren.
+ *
+ * @param raw - URL candidate exactly as matched in the query text.
+ * @returns The trimmed candidate without trailing sentence punctuation.
+ */
+function stripTrailingPunctuation(raw) {
+    let next = raw.trim();
+    while (/[),.;!?\]]$/.test(next)) {
+        if (next.endsWith(')')) {
+            const opens = next.split('(').length - 1;
+            const closes = next.split(')').length - 1;
+            // Every ')' has a matching '(': this one belongs to the URL.
+            if (closes <= opens)
+                break;
+        }
+        next = next.slice(0, -1);
+    }
+    return next;
+}
+/**
+ * Canonicalizes a URL candidate found in query text.
+ *
+ * Trailing punctuation is stripped first, then the value is parsed. Only
+ * http/https URLs are accepted. Query parameters listed in TRACKING_PARAMS
+ * (matched case-insensitively) and the fragment are removed, and a single
+ * trailing slash on the serialized result is dropped.
+ *
+ * @returns The normalized URL string, or undefined when the candidate does
+ *          not parse or uses another scheme.
+ */
+function normalizeDirectUrl(raw) {
+    let parsed;
+    try {
+        parsed = new URL(stripTrailingPunctuation(raw));
+    }
+    catch {
+        return undefined;
+    }
+    if (!['http:', 'https:'].includes(parsed.protocol))
+        return undefined;
+    // Snapshot the keys before deleting so the live iterator is not disturbed.
+    const trackingKeys = Array.from(parsed.searchParams.keys())
+        .filter((key) => TRACKING_PARAMS.has(key.toLowerCase()));
+    for (const key of trackingKeys)
+        parsed.searchParams.delete(key);
+    parsed.hash = '';
+    return parsed.toString().replace(/\/$/, '');
+}
+/**
+ * Collects the http(s) URLs mentioned in a query string.
+ *
+ * Each whitespace-delimited `http://` / `https://` run is normalized;
+ * candidates that fail normalization are dropped and duplicates collapse to
+ * one entry. Order follows first appearance in the query.
+ */
+export function extractDirectUrls(query) {
+    const candidates = query.match(/https?:\/\/\S+/gi) ?? [];
+    const normalized = candidates
+        .map((candidate) => normalizeDirectUrl(candidate))
+        .filter((url) => Boolean(url));
+    return Array.from(new Set(normalized));
+}

package/dist/orchestration/index.js CHANGED Viewed

@@ -7,5 +7,9 @@ export function createResearchWorkflow({ backendConfig, search, fetchPage, headl
     const resolvedFetchPage = fetchPage ?? backends.fetchPage;
     const resolvedHeadlessFetch = headlessFetch ?? backends.headlessFetch;
     const worker = createResearchWorker({ search: resolvedSearch, fetchPage: resolvedFetchPage });
-    return createResearchOrchestrator({ worker, headlessFetch: resolvedHeadlessFetch });
+    return createResearchOrchestrator({
+        worker,
+        fetchDirect: resolvedFetchPage,
+        headlessFetch: resolvedHeadlessFetch
+    });
 }

package/dist/orchestration/research-orchestrator.d.ts CHANGED Viewed

@@ -1,6 +1,6 @@
-import type { WebFetchHeadlessResponse } from '../types.js';
+import type { WebFetchHeadlessResponse, WebFetchResponse } from '../types.js';
 import type { ResearchEvidence, ResearchOrchestratorDecision, ResearchWorkerResult } from './research-types.js';
-export declare function createResearchOrchestrator({ worker, headlessFetch }: {
+export declare function createResearchOrchestrator({ worker, fetchDirect, headlessFetch }: {
     worker: {
         run: (input: {
             query: string;
@@ -8,6 +8,9 @@ export declare function createResearchOrchestrator({ worker, headlessFetch }: {
             maxFetches: number;
         }) => Promise<ResearchWorkerResult>;
     };
+    fetchDirect?: (input: {
+        url: string;
+    }) => Promise<WebFetchResponse>;
     headlessFetch: (input: {
         url: string;
     }) => Promise<WebFetchHeadlessResponse>;

package/dist/orchestration/research-orchestrator.js CHANGED Viewed

@@ -1,23 +1,13 @@
 import { rankEvidence } from './evidence-ranker.js';
 import { planSearchQueries } from './query-planner.js';
+import { classifySourceProfile } from './source-profile.js';
+import { extractDirectUrls } from './direct-url.js';
 import { decideNextResearchStep } from './stop-decider.js';
 const DEFAULT_MAX_PASSES = 3;
 const DEFAULT_MAX_FETCHES_PER_PASS = 4;
 const DEFAULT_MAX_HEADLESS_ATTEMPTS = 2;
 function classifyEvidenceUrl(url) {
-    if (url.includes('/docs/api/') || url.includes('/config/'))
-        return 'official-api';
-    if (url.includes('playwright.dev/docs') || url.includes('vitest.dev/guide/'))
-        return 'official-docs';
-    if (url.includes('github.com/vitest-dev/vitest') && url.includes('/docs/'))
-        return 'official-docs';
-    if (url.includes('learn.microsoft.com'))
-        return 'official-docs';
-    if (url.includes('github.com/') && url.includes('/issues/'))
-        return 'issue-thread';
-    if (url.includes('npmjs.com/package/'))
-        return 'package-page';
-    return 'community';
+    return classifySourceProfile(url).sourceKind;
 }
 function summarizeText(text, maxLength = 180) {
     return text.replace(/\s+/g, ' ').trim().slice(0, maxLength);
@@ -25,6 +15,20 @@ function summarizeText(text, maxLength = 180) {
 function isBotCheckContent({ title = '', text }) {
     return /performing security verification|security service|verify you are not a bot|just a moment|checking your browser/i.test(`${title}\n${text}`);
 }
+/**
+ * Converts a fetch response into an evidence record.
+ *
+ * Returns null when the response is not 'ok', has no non-blank text, or its
+ * title/text looks like a bot-check interstitial.
+ */
+function evidenceFromFetch(result) {
+    const content = result.status === 'ok' ? result.content : undefined;
+    if (!content?.text.trim())
+        return null;
+    const { title, text } = content;
+    if (isBotCheckContent({ title, text }))
+        return null;
+    const { url } = result;
+    return {
+        title: title ?? url,
+        url,
+        sourceKind: classifyEvidenceUrl(url),
+        method: result.metadata.method,
+        summary: summarizeText(text),
+        supports: [summarizeText(text, 120)]
+    };
+}
 function evidenceFromHeadless(result) {
     if (result.status !== 'ok' || !result.content?.text.trim())
         return null;
@@ -39,15 +43,28 @@ function evidenceFromHeadless(result) {
         supports: [summarizeText(result.content.text, 120)]
     };
 }
-function fallbackWorkerPass({ previousQueries, allGaps, allLowValueOutcomes, exhaustedBudget }) {
+function combinedWorkerPass({ lastPass, previousQueries, allGaps, allLowValueOutcomes, exhaustedBudget }) {
     return {
-        searchQueries: previousQueries,
-        evidence: [],
+        searchQueries: lastPass?.searchQueries ?? previousQueries,
+        evidence: lastPass?.evidence ?? [],
         gaps: allGaps,
         lowValueOutcomes: allLowValueOutcomes,
+        suggestedHeadlessUrl: lastPass?.suggestedHeadlessUrl,
         exhaustedBudget
     };
 }
+/**
+ * Builds the gap message for a direct URL that produced no usable evidence.
+ * URLs classified as 'forum-thread' get thread-specific wording.
+ */
+function directUnreadableMessage(url) {
+    const { kind } = classifySourceProfile(url);
+    if (kind === 'forum-thread') {
+        return `Thread source could not be read reliably: ${url}`;
+    }
+    return `Direct URL could not be read reliably: ${url}`;
+}
+/**
+ * Decides whether a direct fetch should be retried through the headless
+ * browser: always for 'needs_headless'; for an 'ok' response that yielded no
+ * evidence only when the URL's source profile prefers headless on weak
+ * reads; never for any other status.
+ */
+function shouldRetryDirectWithHeadless(result, evidence) {
+    switch (result.status) {
+        case 'needs_headless':
+            return true;
+        case 'ok':
+            return evidence
+                ? false
+                : classifySourceProfile(result.url).shouldPreferHeadlessWhenWeak;
+        default:
+            return false;
+    }
+}
 function buildMetadata({ previousQueries, allEvidence, allGaps, allLowValueOutcomes, headlessAttempts, exhaustedBudget }) {
     return {
         searchPasses: previousQueries.length,
@@ -70,7 +87,7 @@ function decisionForAnswer(action, query, ranked) {
         followupQuery: query
     };
 }
-export function createResearchOrchestrator({ worker, headlessFetch }) {
+export function createResearchOrchestrator({ worker, fetchDirect, headlessFetch }) {
     return {
         async run({ query }) {
             const allEvidence = [];
@@ -80,6 +97,41 @@ export function createResearchOrchestrator({ worker, headlessFetch }) {
             const suggestedHeadlessUrls = [];
             let headlessAttempts = 0;
             let lastPass;
+            if (fetchDirect) {
+                for (const url of extractDirectUrls(query).slice(0, 3)) {
+                    const directResult = await fetchDirect({ url });
+                    const directEvidence = evidenceFromFetch(directResult);
+                    if (directEvidence) {
+                        allEvidence.push(directEvidence);
+                        continue;
+                    }
+                    if (shouldRetryDirectWithHeadless(directResult, directEvidence)) {
+                        if (headlessAttempts < DEFAULT_MAX_HEADLESS_ATTEMPTS) {
+                            headlessAttempts++;
+                            const headlessResult = await headlessFetch({ url: directResult.url });
+                            const headlessEvidence = evidenceFromHeadless(headlessResult);
+                            if (headlessEvidence) {
+                                allEvidence.push(headlessEvidence);
+                            }
+                            else {
+                                allGaps.push({ kind: 'fetch-failed', message: directUnreadableMessage(directResult.url) });
+                            }
+                        }
+                        else {
+                            allGaps.push({ kind: 'fetch-failed', message: directUnreadableMessage(directResult.url) });
+                        }
+                    }
+                    else if (directResult.status !== 'ok') {
+                        allGaps.push({
+                            kind: 'fetch-failed',
+                            message: directResult.error?.message ?? `Direct URL fetch failed for ${directResult.url}`
+                        });
+                    }
+                    else {
+                        allGaps.push({ kind: 'fetch-failed', message: directUnreadableMessage(directResult.url) });
+                    }
+                }
+            }
             for (let passIndex = 0; passIndex < DEFAULT_MAX_PASSES; passIndex++) {
                 const queries = planSearchQueries({
                     originalQuery: query,
@@ -127,7 +179,13 @@ export function createResearchOrchestrator({ worker, headlessFetch }) {
                             return {
                                 decision: decisionForAnswer(updatedDecision.action === 'answer' ? 'answer' : 'answer-with-caveat', query, updatedRanked),
                                 evidence: updatedRanked,
-                                workerPass: lastPass,
+                                workerPass: combinedWorkerPass({
+                                    lastPass,
+                                    previousQueries,
+                                    allGaps,
+                                    allLowValueOutcomes,
+                                    exhaustedBudget: updatedDecision.action !== 'answer'
+                                }),
                                 metadata: buildMetadata({
                                     previousQueries,
                                     allEvidence,
@@ -146,7 +204,13 @@ export function createResearchOrchestrator({ worker, headlessFetch }) {
                                 approvedEvidence: ranked
                             },
                             evidence: ranked,
-                            workerPass: lastPass,
+                            workerPass: combinedWorkerPass({
+                                lastPass,
+                                previousQueries,
+                                allGaps,
+                                allLowValueOutcomes,
+                                exhaustedBudget: false
+                            }),
                             metadata: buildMetadata({
                                 previousQueries,
                                 allEvidence,
@@ -161,7 +225,13 @@ export function createResearchOrchestrator({ worker, headlessFetch }) {
                         return {
                             decision: decisionForAnswer(decision.action, query, ranked),
                             evidence: ranked,
-                            workerPass: lastPass,
+                            workerPass: combinedWorkerPass({
+                                lastPass,
+                                previousQueries,
+                                allGaps,
+                                allLowValueOutcomes,
+                                exhaustedBudget: decision.action === 'answer-with-caveat'
+                            }),
                             metadata: buildMetadata({
                                 previousQueries,
                                 allEvidence,
@@ -178,13 +248,13 @@ export function createResearchOrchestrator({ worker, headlessFetch }) {
             return {
                 decision: decisionForAnswer('answer-with-caveat', query, ranked),
                 evidence: ranked,
-                workerPass: lastPass ??
-                    fallbackWorkerPass({
-                        previousQueries,
-                        allGaps,
-                        allLowValueOutcomes,
-                        exhaustedBudget: true
-                    }),
+                workerPass: combinedWorkerPass({
+                    lastPass,
+                    previousQueries,
+                    allGaps,
+                    allLowValueOutcomes,
+                    exhaustedBudget: true
+                }),
                 metadata: buildMetadata({
                     previousQueries,
                     allEvidence,

package/dist/orchestration/research-worker.js CHANGED Viewed

@@ -1,18 +1,7 @@
 import { selectCandidates } from './candidate-selector.js';
+import { classifySourceProfile } from './source-profile.js';
 function classifySource(url) {
-    if (url.includes('/docs/api/') || url.includes('/config/'))
-        return 'official-api';
-    if (url.includes('playwright.dev/docs') || url.includes('vitest.dev/guide/'))
-        return 'official-docs';
-    if (url.includes('github.com/vitest-dev/vitest') && url.includes('/docs/'))
-        return 'official-docs';
-    if (url.includes('learn.microsoft.com'))
-        return 'official-docs';
-    if (url.includes('github.com/') && url.includes('/issues/'))
-        return 'issue-thread';
-    if (url.includes('npmjs.com/package/'))
-        return 'package-page';
-    return 'community';
+    return classifySourceProfile(url).sourceKind;
 }
 function summarizeText(text, maxLength = 180) {
     return text.replace(/\s+/g, ' ').trim().slice(0, maxLength);
@@ -95,6 +84,7 @@ export function createResearchWorker({ search, fetchPage }) {
                 };
             }
             const candidates = selectCandidates({
+                query,
                 results: searchResult.results,
                 seenUrls: new Set(evidence.map((item) => item.url)),
                 maxCandidates: maxFetches

package/dist/orchestration/source-profile.d.ts ADDED Viewed

@@ -0,0 +1,8 @@
+import type { ResearchSourceKind } from './research-types.js';
+export type SourceProfileKind = 'official-docs' | 'official-api' | 'issue-thread' | 'forum-thread' | 'package-page' | 'community';
+export type SourceProfile = {
+    kind: SourceProfileKind;
+    sourceKind: ResearchSourceKind;
+    shouldPreferHeadlessWhenWeak: boolean;
+};
+export declare function classifySourceProfile(rawUrl: string): SourceProfile;

package/dist/orchestration/source-profile.js ADDED Viewed

@@ -0,0 +1,60 @@
+// Matches a hostname label equal to community/forum/forums/discuss/discourse
+// that is followed by a dot. isForumThread tests it against `${host}.`, so a
+// matching final label is caught as well as a leading or middle one.
+const COMMUNITY_FORUM_HOST_RE = /(^|\.)(community|forum|forums|discuss|discourse)\./;
+/** Bundles the three classification fields into a source-profile object. */
+function profile(kind, sourceKind, shouldPreferHeadlessWhenWeak) {
+    const built = {
+        kind,
+        sourceKind,
+        shouldPreferHeadlessWhenWeak
+    };
+    return built;
+}
+/** Parses rawUrl with the URL constructor; yields undefined instead of throwing. */
+function parseUrl(rawUrl) {
+    let parsed;
+    try {
+        parsed = new URL(rawUrl);
+    }
+    catch {
+        parsed = undefined;
+    }
+    return parsed;
+}
+/**
+ * True for the API-reference sections recognized here:
+ * playwright.dev under /docs/api/ and vitest.dev under /config/.
+ */
+function isOfficialApi(host, path) {
+    if (host === 'playwright.dev')
+        return path.startsWith('/docs/api/');
+    if (host === 'vitest.dev')
+        return path.startsWith('/config/');
+    return false;
+}
+/**
+ * True for the documentation locations recognized here: playwright.dev
+ * /docs/, vitest.dev /guide/, /docs/ paths inside github.com/vitest-dev/vitest,
+ * and any path on learn.microsoft.com.
+ */
+function isOfficialDocs(host, path) {
+    switch (host) {
+        case 'learn.microsoft.com':
+            return true;
+        case 'playwright.dev':
+            return path.startsWith('/docs/');
+        case 'vitest.dev':
+            return path.startsWith('/guide/');
+        case 'github.com':
+            return path.startsWith('/vitest-dev/vitest/') && path.includes('/docs/');
+        default:
+            return false;
+    }
+}
+/** True for github.com paths that contain an /issues/ or /discussions/ segment. */
+function isIssueThread(host, path) {
+    if (host !== 'github.com')
+        return false;
+    return ['/issues/', '/discussions/'].some((segment) => path.includes(segment));
+}
+/** True when the path contains one of the forum/thread path segments below. */
+function hasForumThreadPath(path) {
+    const threadSegments = ['/forum/', '/forums/', '/t/', '/topic/', '/threads/'];
+    return threadSegments.some((segment) => path.includes(segment));
+}
+/**
+ * True for reddit.com comment pages, stackoverflow.com question pages, and
+ * forum-style hosts (per COMMUNITY_FORUM_HOST_RE) whose path looks like a
+ * thread. `host` is compared exactly, so subdomains of reddit.com and
+ * stackoverflow.com do not match the first two rules.
+ */
+function isForumThread(host, path) {
+    const redditThread = host === 'reddit.com' && path.includes('/comments/');
+    if (redditThread)
+        return true;
+    const stackOverflowQuestion = host === 'stackoverflow.com' && path.startsWith('/questions/');
+    if (stackOverflowQuestion)
+        return true;
+    return COMMUNITY_FORUM_HOST_RE.test(`${host}.`) && hasForumThreadPath(path);
+}
+/**
+ * Classifies a URL into a source profile.
+ *
+ * The hostname is lowercased with a leading `www.` removed and the path is
+ * lowercased before matching. Rules are tried in order (official API,
+ * official docs, issue thread, forum thread, npm package page) and the first
+ * match wins. Unparseable URLs and URLs matching no rule are 'community'.
+ */
+export function classifySourceProfile(rawUrl) {
+    const fallback = () => profile('community', 'community', false);
+    const parsed = parseUrl(rawUrl);
+    if (!parsed)
+        return fallback();
+    const host = parsed.hostname.toLowerCase().replace(/^www\./, '');
+    const path = parsed.pathname.toLowerCase();
+    // Order matters: /docs/api/ must be tested before the broader /docs/ rule.
+    const rules = [
+        { matches: isOfficialApi, kind: 'official-api', sourceKind: 'official-api', headless: false },
+        { matches: isOfficialDocs, kind: 'official-docs', sourceKind: 'official-docs', headless: false },
+        { matches: isIssueThread, kind: 'issue-thread', sourceKind: 'issue-thread', headless: true },
+        { matches: isForumThread, kind: 'forum-thread', sourceKind: 'community', headless: true },
+        {
+            matches: (h, p) => h === 'npmjs.com' && p.startsWith('/package/'),
+            kind: 'package-page',
+            sourceKind: 'package-page',
+            headless: false
+        }
+    ];
+    const hit = rules.find((rule) => rule.matches(host, path));
+    return hit ? profile(hit.kind, hit.sourceKind, hit.headless) : fallback();
+}

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@demigodmode/pi-web-agent",
-  "version": "1.2.0",
+  "version": "1.3.0",
   "description": "Pi package for reliable web access with explicit search, fetch, and headless boundaries.",
   "type": "module",
   "main": "./dist/extension.js",
@@ -57,7 +57,7 @@
     "@mozilla/readability": "^0.6.0",
     "cheerio": "^1.1.0",
     "jsdom": "^26.0.0",
-    "playwright-core": "^1.54.0",
+    "playwright": "^1.60.0",
     "typebox": "^1.1.37"
   },
   "devDependencies": {