npm - @demigodmode/pi-web-agent - Versions diffs - 1.3.0 → 1.4.0 - Mend

@demigodmode/pi-web-agent 1.3.0 → 1.4.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (15)

package/CHANGELOG.md +14 -0
package/dist/orchestration/answer-synthesizer.d.ts +3 -1
package/dist/orchestration/answer-synthesizer.js +34 -4
package/dist/orchestration/evidence-quality.d.ts +26 -0
package/dist/orchestration/evidence-quality.js +62 -0
package/dist/orchestration/index.d.ts +1 -0
package/dist/orchestration/research-orchestrator.d.ts +2 -0
package/dist/orchestration/research-orchestrator.js +45 -15
package/dist/orchestration/research-worker.js +12 -0
package/dist/orchestration/stop-decider.d.ts +3 -1
package/dist/orchestration/stop-decider.js +31 -3
package/dist/tools/web-explore.d.ts +1 -0
package/dist/tools/web-explore.js +2 -1
package/dist/types.d.ts +1 -0
package/package.json +1 -1

package/CHANGELOG.md CHANGED

@@ -18,6 +18,20 @@ The format is intentionally simple and release-oriented.
 ### Breaking
 - None.
+## [1.4.0] - 2026-06-09
+### Added
+- Added evidence quality analysis for `web_explore`, including source diversity, unreadable source, bot-check, and possible conflict signals.
+### Changed
+- `web_explore` now uses source quality signals before deciding whether to answer, search again, or answer with a caveat.
+- Partial research caveats are now more specific when evidence is community-only, low-diversity, blocked, or cautionary.
+### Fixed
+- Nothing yet.
+### Breaking
+- None.
 ## [1.3.0] - 2026-06-04
 ### Added
 - Added direct URL handling in `web_explore` so linked pages are read before search results.

package/dist/orchestration/answer-synthesizer.d.ts CHANGED

@@ -1,7 +1,9 @@
 import type { ResearchEvidence } from './research-types.js';
-export declare function synthesizeAnswer({ evidence, partial }: {
+import type { EvidenceCaveatReason } from './evidence-quality.js';
+export declare function synthesizeAnswer({ evidence, partial, caveatReasons }: {
     evidence: ResearchEvidence[];
     partial: boolean;
+    caveatReasons?: EvidenceCaveatReason[];
 }): {
     findings: string[];
     caveat: string | undefined;

package/dist/orchestration/answer-synthesizer.js CHANGED

@@ -1,7 +1,39 @@
 function normalizeSummary(summary) {
     return summary.replace(/\s+/g, ' ').trim();
 }
-export function synthesizeAnswer({ evidence, partial }) {
+function sentenceForReason(reason) {
+    switch (reason) {
+        case 'community-only':
+            return 'the strongest readable sources were mostly community/practical context';
+        case 'low-diversity':
+            return 'the source set was narrow';
+        case 'unreadable-direct-source':
+            return 'one or more linked sources could not be read reliably';
+        case 'unreadable-thread-source':
+            return 'one or more thread sources could not be read reliably';
+        case 'possible-conflict':
+            return 'readable sources include cautionary or possibly conflicting guidance';
+        case 'bot-check':
+            return 'some candidate sources showed bot-check or security verification pages';
+    }
+}
+function joinReasons(reasons) {
+    if (reasons.length === 0)
+        return '';
+    if (reasons.length === 1)
+        return reasons[0];
+    return `${reasons.slice(0, -1).join(', ')}, and ${reasons.at(-1)}`;
+}
+function caveatText(partial, caveatReasons = []) {
+    if (!partial)
+        return undefined;
+    const specificReasons = caveatReasons.map(sentenceForReason);
+    if (specificReasons.length > 0) {
+        return `Evidence is partial: ${joinReasons(specificReasons)}.`;
+    }
+    return 'Evidence is partial, so this answer is based on the strongest source found within the bounded research budget.';
+}
+export function synthesizeAnswer({ evidence, partial, caveatReasons = [] }) {
     const findings = evidence.slice(0, 5).map((item) => {
         const summary = normalizeSummary(item.summary);
         return item.sourceKind === 'community' || item.sourceKind === 'issue-thread'
@@ -10,8 +42,6 @@ export function synthesizeAnswer({ evidence, partial }) {
     });
     return {
         findings,
-        caveat: partial
-            ? 'Evidence is partial, so this answer is based on the strongest source found within the bounded research budget.'
-            : undefined
+        caveat: caveatText(partial, caveatReasons)
     };
 }

package/dist/orchestration/evidence-quality.d.ts ADDED

@@ -0,0 +1,26 @@
+import type { ResearchEvidence, ResearchGap, ResearchLowValueOutcome } from './research-types.js';
+export type EvidenceCaveatReason = 'community-only' | 'low-diversity' | 'unreadable-direct-source' | 'unreadable-thread-source' | 'possible-conflict' | 'bot-check';
+export type EvidenceQualityReport = {
+    counts: {
+        total: number;
+        official: number;
+        community: number;
+        thread: number;
+        packagePage: number;
+        distinctHosts: number;
+    };
+    flags: {
+        hasOfficialEvidence: boolean;
+        hasOnlyCommunityEvidence: boolean;
+        hasLowDiversity: boolean;
+        hasUnreadableDirectSource: boolean;
+        hasUnreadableThreadSource: boolean;
+        hasPossibleConflict: boolean;
+    };
+    caveatReasons: EvidenceCaveatReason[];
+};
+export declare function analyzeEvidenceQuality({ evidence, gaps, lowValueOutcomes }: {
+    evidence: ResearchEvidence[];
+    gaps: ResearchGap[];
+    lowValueOutcomes: ResearchLowValueOutcome[];
+}): EvidenceQualityReport;

package/dist/orchestration/evidence-quality.js ADDED

@@ -0,0 +1,62 @@
+function hostname(url) {
+    try {
+        return new URL(url).hostname.toLowerCase().replace(/^www\./, '');
+    }
+    catch {
+        return url.toLowerCase();
+    }
+}
+function hasConflictMarkers(evidence) {
+    const combined = evidence
+        .flatMap((item) => [item.summary, ...item.supports])
+        .join('\n')
+        .toLowerCase();
+    const caution = /\bdeprecated\b|not recommended|use at your own risk|should not/.test(combined);
+    const positiveText = combined.replace(/not recommended/g, '');
+    const positive = /\brecommended\b/.test(positiveText);
+    return positive && caution;
+}
+function addReason(reasons, reason, enabled) {
+    if (enabled && !reasons.includes(reason))
+        reasons.push(reason);
+}
+export function analyzeEvidenceQuality({ evidence, gaps, lowValueOutcomes }) {
+    const official = evidence.filter((item) => item.sourceKind === 'official-docs' || item.sourceKind === 'official-api').length;
+    const community = evidence.filter((item) => item.sourceKind === 'community').length;
+    const thread = evidence.filter((item) => item.sourceKind === 'issue-thread' || item.sourceKind === 'official-discussion').length;
+    const packagePage = evidence.filter((item) => item.sourceKind === 'package-page').length;
+    const distinctHosts = new Set(evidence.map((item) => hostname(item.url))).size;
+    const hasOfficialEvidence = official > 0;
+    const hasOnlyCommunityEvidence = evidence.length > 0 && official === 0;
+    const hasLowDiversity = evidence.length > 1 && distinctHosts <= 1;
+    const hasUnreadableDirectSource = gaps.some((gap) => /Direct URL could not be read reliably/i.test(gap.message));
+    const hasUnreadableThreadSource = gaps.some((gap) => /Thread source could not be read reliably/i.test(gap.message));
+    const hasPossibleConflict = hasConflictMarkers(evidence);
+    const hasBotCheck = lowValueOutcomes.some((outcome) => outcome.kind === 'bot-check');
+    const caveatReasons = [];
+    addReason(caveatReasons, 'community-only', hasOnlyCommunityEvidence);
+    addReason(caveatReasons, 'low-diversity', hasLowDiversity);
+    addReason(caveatReasons, 'unreadable-direct-source', hasUnreadableDirectSource);
+    addReason(caveatReasons, 'unreadable-thread-source', hasUnreadableThreadSource);
+    addReason(caveatReasons, 'possible-conflict', hasPossibleConflict);
+    addReason(caveatReasons, 'bot-check', hasBotCheck);
+    return {
+        counts: {
+            total: evidence.length,
+            official,
+            community,
+            thread,
+            packagePage,
+            distinctHosts
+        },
+        flags: {
+            hasOfficialEvidence,
+            hasOnlyCommunityEvidence,
+            hasLowDiversity,
+            hasUnreadableDirectSource,
+            hasUnreadableThreadSource,
+            hasPossibleConflict
+        },
+        caveatReasons
+    };
+}

package/dist/orchestration/index.d.ts CHANGED

@@ -23,6 +23,7 @@ export declare function createResearchWorkflow({ backendConfig, search, fetchPag
             fetchedPages: number;
             headlessAttempts: number;
             exhaustedBudget: boolean;
+            caveatReasons: import("./evidence-quality.js").EvidenceCaveatReason[];
         };
     }>;
 };

package/dist/orchestration/research-orchestrator.d.ts CHANGED

@@ -1,5 +1,6 @@
 import type { WebFetchHeadlessResponse, WebFetchResponse } from '../types.js';
 import type { ResearchEvidence, ResearchOrchestratorDecision, ResearchWorkerResult } from './research-types.js';
+import { type EvidenceCaveatReason } from './evidence-quality.js';
 export declare function createResearchOrchestrator({ worker, fetchDirect, headlessFetch }: {
     worker: {
         run: (input: {
@@ -26,6 +27,7 @@ export declare function createResearchOrchestrator({ worker, fetchDirect, headle
             fetchedPages: number;
             headlessAttempts: number;
             exhaustedBudget: boolean;
+            caveatReasons: EvidenceCaveatReason[];
         };
     }>;
 };

package/dist/orchestration/research-orchestrator.js CHANGED

@@ -3,6 +3,7 @@ import { planSearchQueries } from './query-planner.js';
 import { classifySourceProfile } from './source-profile.js';
 import { extractDirectUrls } from './direct-url.js';
 import { decideNextResearchStep } from './stop-decider.js';
+import { analyzeEvidenceQuality } from './evidence-quality.js';
 const DEFAULT_MAX_PASSES = 3;
 const DEFAULT_MAX_FETCHES_PER_PASS = 4;
 const DEFAULT_MAX_HEADLESS_ATTEMPTS = 2;
@@ -65,15 +66,16 @@ function shouldRetryDirectWithHeadless(result, evidence) {
         return false;
     return classifySourceProfile(result.url).shouldPreferHeadlessWhenWeak;
 }
-function buildMetadata({ previousQueries, allEvidence, allGaps, allLowValueOutcomes, headlessAttempts, exhaustedBudget }) {
+function buildMetadata({ previousQueries, allEvidence, allGaps, allLowValueOutcomes, headlessAttempts, exhaustedBudget, caveatReasons = [] }) {
     return {
         searchPasses: previousQueries.length,
         fetchedPages: allEvidence.length + allGaps.length + allLowValueOutcomes.length,
         headlessAttempts,
-        exhaustedBudget
+        exhaustedBudget,
+        caveatReasons
     };
 }
-function decisionForAnswer(action, query, ranked) {
+function decisionForAnswer({ action, query, ranked, exhaustedBudget }) {
     if (action === 'answer') {
         return {
             action: 'answer',
@@ -83,7 +85,7 @@ function decisionForAnswer(action, query, ranked) {
     }
     return {
         action: 'research-again',
-        rationale: 'Research budget exhausted; answer with caveat.',
+        rationale: exhaustedBudget ? 'Research budget exhausted; answer with caveat.' : 'Evidence has quality caveats; answer with caveat.',
         followupQuery: query
     };
 }
@@ -153,13 +155,19 @@ export function createResearchOrchestrator({ worker, fetchDirect, headlessFetch
                     if (pass.suggestedHeadlessUrl)
                         suggestedHeadlessUrls.push(pass.suggestedHeadlessUrl);
                     const ranked = rankEvidence(allEvidence.filter((item) => item.sourceKind !== 'package-page'));
+                    const quality = analyzeEvidenceQuality({
+                        evidence: ranked,
+                        gaps: allGaps,
+                        lowValueOutcomes: allLowValueOutcomes
+                    });
                     const decision = decideNextResearchStep({
                         evidence: ranked,
                         suggestedHeadlessUrls,
                         passIndex,
                         maxPasses: DEFAULT_MAX_PASSES,
                         headlessAttempts,
-                        maxHeadlessAttempts: DEFAULT_MAX_HEADLESS_ATTEMPTS
+                        maxHeadlessAttempts: DEFAULT_MAX_HEADLESS_ATTEMPTS,
+                        quality
                     });
                     if (decision.action === 'headless') {
                         headlessAttempts++;
@@ -168,23 +176,35 @@ export function createResearchOrchestrator({ worker, fetchDirect, headlessFetch
                         if (headlessEvidence) {
                             allEvidence.push(headlessEvidence);
                             const updatedRanked = rankEvidence(allEvidence.filter((item) => item.sourceKind !== 'package-page'));
+                            const updatedQuality = analyzeEvidenceQuality({
+                                evidence: updatedRanked,
+                                gaps: allGaps,
+                                lowValueOutcomes: allLowValueOutcomes
+                            });
                             const updatedDecision = decideNextResearchStep({
                                 evidence: updatedRanked,
                                 suggestedHeadlessUrls: [],
                                 passIndex,
                                 maxPasses: DEFAULT_MAX_PASSES,
                                 headlessAttempts,
-                                maxHeadlessAttempts: DEFAULT_MAX_HEADLESS_ATTEMPTS
+                                maxHeadlessAttempts: DEFAULT_MAX_HEADLESS_ATTEMPTS,
+                                quality: updatedQuality
                             });
+                            const exhaustedBudget = updatedDecision.action !== 'answer' && passIndex + 1 >= DEFAULT_MAX_PASSES;
                             return {
-                                decision: decisionForAnswer(updatedDecision.action === 'answer' ? 'answer' : 'answer-with-caveat', query, updatedRanked),
+                                decision: decisionForAnswer({
+                                    action: updatedDecision.action === 'answer' ? 'answer' : 'answer-with-caveat',
+                                    query,
+                                    ranked: updatedRanked,
+                                    exhaustedBudget
+                                }),
                                 evidence: updatedRanked,
                                 workerPass: combinedWorkerPass({
                                     lastPass,
                                     previousQueries,
                                     allGaps,
                                     allLowValueOutcomes,
-                                    exhaustedBudget: updatedDecision.action !== 'answer'
+                                    exhaustedBudget
                                 }),
                                 metadata: buildMetadata({
                                     previousQueries,
@@ -192,7 +212,8 @@ export function createResearchOrchestrator({ worker, fetchDirect, headlessFetch
                                     allGaps,
                                     allLowValueOutcomes,
                                     headlessAttempts,
-                                    exhaustedBudget: updatedDecision.action !== 'answer'
+                                    exhaustedBudget,
+                                    caveatReasons: updatedQuality.caveatReasons
                                 })
                             };
                         }
@@ -217,20 +238,22 @@ export function createResearchOrchestrator({ worker, fetchDirect, headlessFetch
                                 allGaps,
                                 allLowValueOutcomes,
                                 headlessAttempts,
-                                exhaustedBudget: false
+                                exhaustedBudget: false,
+                                caveatReasons: quality.caveatReasons
                             })
                         };
                     }
                     if (decision.action === 'answer' || decision.action === 'answer-with-caveat') {
+                        const exhaustedBudget = decision.action === 'answer-with-caveat' && passIndex + 1 >= DEFAULT_MAX_PASSES;
                         return {
-                            decision: decisionForAnswer(decision.action, query, ranked),
+                            decision: decisionForAnswer({ action: decision.action, query, ranked, exhaustedBudget }),
                             evidence: ranked,
                             workerPass: combinedWorkerPass({
                                 lastPass,
                                 previousQueries,
                                 allGaps,
                                 allLowValueOutcomes,
-                                exhaustedBudget: decision.action === 'answer-with-caveat'
+                                exhaustedBudget
                             }),
                             metadata: buildMetadata({
                                 previousQueries,
@@ -238,15 +261,21 @@ export function createResearchOrchestrator({ worker, fetchDirect, headlessFetch
                                 allGaps,
                                 allLowValueOutcomes,
                                 headlessAttempts,
-                                exhaustedBudget: decision.action === 'answer-with-caveat'
+                                exhaustedBudget,
+                                caveatReasons: quality.caveatReasons
                             })
                         };
                     }
                 }
             }
             const ranked = rankEvidence(allEvidence.filter((item) => item.sourceKind !== 'package-page'));
+            const quality = analyzeEvidenceQuality({
+                evidence: ranked,
+                gaps: allGaps,
+                lowValueOutcomes: allLowValueOutcomes
+            });
             return {
-                decision: decisionForAnswer('answer-with-caveat', query, ranked),
+                decision: decisionForAnswer({ action: 'answer-with-caveat', query, ranked, exhaustedBudget: true }),
                 evidence: ranked,
                 workerPass: combinedWorkerPass({
                     lastPass,
@@ -261,7 +290,8 @@ export function createResearchOrchestrator({ worker, fetchDirect, headlessFetch
                     allGaps,
                     allLowValueOutcomes,
                     headlessAttempts,
-                    exhaustedBudget: true
+                    exhaustedBudget: true,
+                    caveatReasons: quality.caveatReasons
                 })
             };
         }

package/dist/orchestration/research-worker.js CHANGED

@@ -6,10 +6,15 @@ function classifySource(url) {
 function summarizeText(text, maxLength = 180) {
     return text.replace(/\s+/g, ' ').trim().slice(0, maxLength);
 }
+function isBotCheckContent({ title = '', text }) {
+    return /performing security verification|security service|verify you are not a bot|just a moment|checking your browser/i.test(`${title}\n${text}`);
+}
 function evidenceFromFetch(fetched, fallbackTitle) {
     const content = fetched.content;
     if (fetched.status !== 'ok' || !content)
         return null;
+    if (isBotCheckContent({ title: content.title, text: content.text }))
+        return null;
     const sourceKind = classifySource(fetched.url);
     if (sourceKind === 'package-page') {
         return null;
@@ -26,6 +31,13 @@ function evidenceFromFetch(fetched, fallbackTitle) {
 function lowValueOutcomeFromFetch(fetched) {
     if (fetched.status !== 'ok' || !fetched.content)
         return null;
+    if (isBotCheckContent({ title: fetched.content.title, text: fetched.content.text })) {
+        return {
+            kind: 'bot-check',
+            url: fetched.url,
+            message: 'Fetched page showed a bot-check or security verification page.'
+        };
+    }
     if (classifySource(fetched.url) !== 'package-page')
         return null;
     return {

package/dist/orchestration/stop-decider.d.ts CHANGED

@@ -1,4 +1,5 @@
 import type { ResearchEvidence } from './research-types.js';
+import type { EvidenceQualityReport } from './evidence-quality.js';
 export type ResearchStepDecision = {
     action: 'answer';
 } | {
@@ -9,11 +10,12 @@ export type ResearchStepDecision = {
     action: 'headless';
     url: string;
 };
-export declare function decideNextResearchStep({ evidence, suggestedHeadlessUrls, passIndex, maxPasses, headlessAttempts, maxHeadlessAttempts }: {
+export declare function decideNextResearchStep({ evidence, suggestedHeadlessUrls, passIndex, maxPasses, headlessAttempts, maxHeadlessAttempts, quality }: {
     evidence: ResearchEvidence[];
     suggestedHeadlessUrls: string[];
     passIndex: number;
     maxPasses: number;
     headlessAttempts: number;
     maxHeadlessAttempts: number;
+    quality?: EvidenceQualityReport;
 }): ResearchStepDecision;

package/dist/orchestration/stop-decider.js CHANGED

@@ -1,7 +1,35 @@
 import { hasOfficialEvidence, strongEvidenceCount } from './evidence-ranker.js';
-export function decideNextResearchStep({ evidence, suggestedHeadlessUrls, passIndex, maxPasses, headlessAttempts, maxHeadlessAttempts }) {
-    if (strongEvidenceCount(evidence) >= 2 && hasOfficialEvidence(evidence)) {
-        return { action: 'answer' };
+function activeCaveatReasons(evidence, quality) {
+    const reasons = quality?.caveatReasons ?? [];
+    if (!hasOfficialDocsAndApi(evidence))
+        return reasons;
+    return reasons.filter((reason) => reason !== 'low-diversity');
+}
+function hasQualityConcern(evidence, quality) {
+    return activeCaveatReasons(evidence, quality).length > 0;
+}
+function hasOfficialDocsAndApi(evidence) {
+    return evidence.some((item) => item.sourceKind === 'official-docs') &&
+        evidence.some((item) => item.sourceKind === 'official-api');
+}
+function shouldSearchForBetterQuality({ evidence, quality, passIndex, maxPasses }) {
+    if (!quality)
+        return false;
+    if (passIndex + 1 >= maxPasses)
+        return false;
+    if (quality.flags.hasOnlyCommunityEvidence)
+        return true;
+    if (quality.flags.hasLowDiversity && !hasOfficialDocsAndApi(evidence))
+        return true;
+    return false;
+}
+export function decideNextResearchStep({ evidence, suggestedHeadlessUrls, passIndex, maxPasses, headlessAttempts, maxHeadlessAttempts, quality }) {
+    const strongEnough = strongEvidenceCount(evidence) >= 2 && hasOfficialEvidence(evidence);
+    if (strongEnough && shouldSearchForBetterQuality({ evidence, quality, passIndex, maxPasses })) {
+        return { action: 'search-again' };
+    }
+    if (strongEnough) {
+        return hasQualityConcern(evidence, quality) ? { action: 'answer-with-caveat' } : { action: 'answer' };
     }
     const headlessUrl = suggestedHeadlessUrls.find((url) => !url.includes('npmjs.com/package/'));
     if (headlessUrl && headlessAttempts < maxHeadlessAttempts) {

package/dist/tools/web-explore.d.ts CHANGED

@@ -39,6 +39,7 @@ export declare function createWebExploreTool({ explore }?: {
         fetchedPages: number;
         headlessAttempts: number;
         exhaustedBudget: boolean;
+        caveatReasons?: string[];
     };
     error?: import("../types.js").ToolError;
 }>;

package/dist/tools/web-explore.js CHANGED

@@ -25,7 +25,8 @@ export function createWebExploreTool({ explore = createResearchWorkflow() } = {}
         }));
         const synthesized = synthesizeAnswer({
             evidence: result.evidence,
-            partial: result.decision.action !== 'answer'
+            partial: result.decision.action !== 'answer',
+            caveatReasons: result.metadata?.caveatReasons
         });
         const shaped = {
             status: 'ok',

package/dist/types.d.ts CHANGED

@@ -68,6 +68,7 @@ export type WebExploreResponse = {
         fetchedPages: number;
         headlessAttempts: number;
         exhaustedBudget: boolean;
+        caveatReasons?: string[];
     };
     presentation?: PresentationEnvelope;
     error?: ToolError;

package/package.json CHANGED

@@ -1,6 +1,6 @@
 {
   "name": "@demigodmode/pi-web-agent",
-  "version": "1.3.0",
+  "version": "1.4.0",
   "description": "Pi package for reliable web access with explicit search, fetch, and headless boundaries.",
   "type": "module",
   "main": "./dist/extension.js",