webpeel 0.7.0 → 0.7.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (72)
  1. package/README.md +140 -500
  2. package/dist/cli-auth.d.ts +2 -0
  3. package/dist/cli-auth.d.ts.map +1 -1
  4. package/dist/cli-auth.js +16 -3
  5. package/dist/cli-auth.js.map +1 -1
  6. package/dist/cli.js +475 -77
  7. package/dist/cli.js.map +1 -1
  8. package/dist/core/actions.d.ts +19 -10
  9. package/dist/core/actions.d.ts.map +1 -1
  10. package/dist/core/actions.js +214 -43
  11. package/dist/core/actions.js.map +1 -1
  12. package/dist/core/agent.d.ts +60 -3
  13. package/dist/core/agent.d.ts.map +1 -1
  14. package/dist/core/agent.js +375 -86
  15. package/dist/core/agent.js.map +1 -1
  16. package/dist/core/answer.d.ts +43 -0
  17. package/dist/core/answer.d.ts.map +1 -0
  18. package/dist/core/answer.js +378 -0
  19. package/dist/core/answer.js.map +1 -0
  20. package/dist/core/cache.d.ts +14 -0
  21. package/dist/core/cache.d.ts.map +1 -0
  22. package/dist/core/cache.js +122 -0
  23. package/dist/core/cache.js.map +1 -0
  24. package/dist/core/dns-cache.d.ts +21 -0
  25. package/dist/core/dns-cache.d.ts.map +1 -0
  26. package/dist/core/dns-cache.js +184 -0
  27. package/dist/core/dns-cache.js.map +1 -0
  28. package/dist/core/documents.d.ts +24 -0
  29. package/dist/core/documents.d.ts.map +1 -0
  30. package/dist/core/documents.js +124 -0
  31. package/dist/core/documents.js.map +1 -0
  32. package/dist/core/extract-inline.d.ts +39 -0
  33. package/dist/core/extract-inline.d.ts.map +1 -0
  34. package/dist/core/extract-inline.js +214 -0
  35. package/dist/core/extract-inline.js.map +1 -0
  36. package/dist/core/fetcher.d.ts +33 -7
  37. package/dist/core/fetcher.d.ts.map +1 -1
  38. package/dist/core/fetcher.js +608 -41
  39. package/dist/core/fetcher.js.map +1 -1
  40. package/dist/core/jobs.d.ts +66 -0
  41. package/dist/core/jobs.d.ts.map +1 -0
  42. package/dist/core/jobs.js +513 -0
  43. package/dist/core/jobs.js.map +1 -0
  44. package/dist/core/markdown.d.ts.map +1 -1
  45. package/dist/core/markdown.js +141 -31
  46. package/dist/core/markdown.js.map +1 -1
  47. package/dist/core/pdf.d.ts.map +1 -1
  48. package/dist/core/pdf.js +3 -1
  49. package/dist/core/pdf.js.map +1 -1
  50. package/dist/core/screenshot.d.ts +33 -0
  51. package/dist/core/screenshot.d.ts.map +1 -0
  52. package/dist/core/screenshot.js +30 -0
  53. package/dist/core/screenshot.js.map +1 -0
  54. package/dist/core/search-provider.d.ts +46 -0
  55. package/dist/core/search-provider.d.ts.map +1 -0
  56. package/dist/core/search-provider.js +281 -0
  57. package/dist/core/search-provider.js.map +1 -0
  58. package/dist/core/strategies.d.ts +7 -10
  59. package/dist/core/strategies.d.ts.map +1 -1
  60. package/dist/core/strategies.js +370 -63
  61. package/dist/core/strategies.js.map +1 -1
  62. package/dist/index.d.ts +9 -3
  63. package/dist/index.d.ts.map +1 -1
  64. package/dist/index.js +61 -32
  65. package/dist/index.js.map +1 -1
  66. package/dist/mcp/server.js +335 -70
  67. package/dist/mcp/server.js.map +1 -1
  68. package/dist/types.d.ts +43 -1
  69. package/dist/types.d.ts.map +1 -1
  70. package/dist/types.js.map +1 -1
  71. package/llms.txt +85 -47
  72. package/package.json +11 -5
@@ -1,9 +1,19 @@
1
1
  /**
2
2
  * Autonomous web research agent
3
3
  * Searches the web, fetches pages, and extracts structured data based on natural language prompts
4
+ *
5
+ * Supports:
6
+ * - depth: "basic" (1 search, top 3) vs "thorough" (multi-step, up to 3 searches, top 10)
7
+ * - maxSources: control how many sources to include (default 5, max 20)
8
+ * - topic: "general" | "news" | "technical" | "academic" — adjusts queries & prioritization
9
+ * - outputSchema: JSON Schema for structured output with validation
10
+ * - streaming callbacks for SSE support
4
11
  */
5
12
  import { load } from 'cheerio';
6
13
  import { peel } from '../index.js';
14
+ // ---------------------------------------------------------------------------
15
+ // Helpers
16
+ // ---------------------------------------------------------------------------
7
17
  /**
8
18
  * Search DuckDuckGo HTML and parse results
9
19
  */
@@ -23,22 +33,17 @@ async function searchWeb(query, limit = 10) {
23
33
  $('.result').each((_, el) => {
24
34
  const link = $(el).find('.result__a');
25
35
  const snippet = $(el).find('.result__snippet');
26
- const url = link.attr('href');
36
+ const rawUrl = link.attr('href');
27
37
  const title = link.text().trim();
28
38
  const desc = snippet.text().trim();
29
- if (url && title) {
30
- // DuckDuckGo uses redirect URLs, extract the actual URL
39
+ if (rawUrl && title) {
31
40
  try {
32
- const actualUrl = url.startsWith('//')
33
- ? `https:${url}`
34
- : url.includes('uddg=')
35
- ? decodeURIComponent(url.split('uddg=')[1].split('&')[0])
36
- : url;
37
- results.push({
38
- url: actualUrl,
39
- title,
40
- snippet: desc,
41
- });
41
+ const actualUrl = rawUrl.startsWith('//')
42
+ ? `https:${rawUrl}`
43
+ : rawUrl.includes('uddg=')
44
+ ? decodeURIComponent(rawUrl.split('uddg=')[1].split('&')[0])
45
+ : rawUrl;
46
+ results.push({ url: actualUrl, title, snippet: desc });
42
47
  }
43
48
  catch {
44
49
  // Skip malformed URLs
@@ -53,25 +58,73 @@ async function searchWeb(query, limit = 10) {
53
58
  }
54
59
  }
55
60
  /**
56
- * Call OpenAI-compatible LLM API
61
+ * Prioritise search results by topic relevance (higher = better)
62
+ */
63
+ function scoreByTopic(result, topic) {
64
+ const url = result.url.toLowerCase();
65
+ const domain = (() => { try {
66
+ return new URL(url).hostname;
67
+ }
68
+ catch {
69
+ return '';
70
+ } })();
71
+ switch (topic) {
72
+ case 'academic':
73
+ if (/\.edu$|arxiv\.org|scholar\.google|pubmed|ieee\.org|acm\.org|researchgate\.net/.test(domain))
74
+ return 10;
75
+ if (/\.gov$/.test(domain))
76
+ return 5;
77
+ return 0;
78
+ case 'technical':
79
+ if (/github\.com|stackoverflow\.com|docs\.|developer\.|devdocs\.io|mdn\./.test(domain))
80
+ return 10;
81
+ if (/\.dev$|\.io$/.test(domain))
82
+ return 3;
83
+ return 0;
84
+ case 'news':
85
+ if (/reuters\.com|apnews\.com|bbc\.com|cnn\.com|nytimes\.com|theguardian\.com|bloomberg\.com|techcrunch\.com|theverge\.com|arstechnica\.com/.test(domain))
86
+ return 10;
87
+ if (/news|press|blog/.test(domain))
88
+ return 3;
89
+ return 0;
90
+ default:
91
+ return 0;
92
+ }
93
+ }
94
+ /**
95
+ * Add topic-specific modifiers to search queries
96
+ */
97
+ function enhanceQueryForTopic(query, topic) {
98
+ switch (topic) {
99
+ case 'news':
100
+ return `${query} latest news 2026`;
101
+ case 'academic':
102
+ return `${query} research paper study`;
103
+ case 'technical':
104
+ return `${query} documentation tutorial`;
105
+ default:
106
+ return query;
107
+ }
108
+ }
109
+ /**
110
+ * Call OpenAI-compatible LLM API (non-streaming)
57
111
  */
58
112
  async function callLLM(messages, options) {
59
- const { apiKey, model = 'gpt-4o-mini', baseUrl = 'https://api.openai.com/v1', schema } = options;
113
+ const { apiKey, model = 'gpt-4o-mini', baseUrl = 'https://api.openai.com/v1', jsonMode } = options;
60
114
  const { fetch: undiciFetch } = await import('undici');
61
115
  const body = {
62
116
  model,
63
117
  messages,
64
118
  temperature: 0,
65
119
  };
66
- // Force JSON mode if schema is provided
67
- if (schema) {
120
+ if (jsonMode) {
68
121
  body.response_format = { type: 'json_object' };
69
122
  }
70
123
  const response = await undiciFetch(`${baseUrl}/chat/completions`, {
71
124
  method: 'POST',
72
125
  headers: {
73
126
  'Content-Type': 'application/json',
74
- 'Authorization': `Bearer ${apiKey}`,
127
+ Authorization: `Bearer ${apiKey}`,
75
128
  },
76
129
  body: JSON.stringify(body),
77
130
  });
@@ -79,12 +132,116 @@ async function callLLM(messages, options) {
79
132
  const errorText = await response.text();
80
133
  throw new Error(`LLM API error ${response.status}: ${errorText}`);
81
134
  }
82
- const result = await response.json();
135
+ const result = (await response.json());
83
136
  const content = result.choices?.[0]?.message?.content;
84
137
  if (!content) {
85
138
  throw new Error('LLM returned empty response');
86
139
  }
87
- return content;
140
+ const usage = result.usage
141
+ ? { input: result.usage.prompt_tokens ?? 0, output: result.usage.completion_tokens ?? 0 }
142
+ : { input: 0, output: 0 };
143
+ return { content, usage };
144
+ }
145
+ /**
146
+ * Call OpenAI-compatible LLM API with streaming.
147
+ * Invokes `onChunk` for each text delta, returns full content when done.
148
+ */
149
+ async function callLLMStreaming(messages, options, onChunk) {
150
+ if (!onChunk)
151
+ return callLLM(messages, options);
152
+ const { apiKey, model = 'gpt-4o-mini', baseUrl = 'https://api.openai.com/v1', jsonMode } = options;
153
+ const { fetch: undiciFetch } = await import('undici');
154
+ const body = {
155
+ model,
156
+ messages,
157
+ temperature: 0,
158
+ stream: true,
159
+ stream_options: { include_usage: true },
160
+ };
161
+ if (jsonMode) {
162
+ body.response_format = { type: 'json_object' };
163
+ }
164
+ const response = await undiciFetch(`${baseUrl}/chat/completions`, {
165
+ method: 'POST',
166
+ headers: {
167
+ 'Content-Type': 'application/json',
168
+ Authorization: `Bearer ${apiKey}`,
169
+ },
170
+ body: JSON.stringify(body),
171
+ });
172
+ if (!response.ok) {
173
+ const errorText = await response.text();
174
+ throw new Error(`LLM API error ${response.status}: ${errorText}`);
175
+ }
176
+ let fullContent = '';
177
+ let usage = { input: 0, output: 0 };
178
+ // Read the SSE stream
179
+ const reader = response.body?.getReader?.();
180
+ if (!reader) {
181
+ // Fallback: consume entire body
182
+ const text = await response.text();
183
+ return { content: text, usage };
184
+ }
185
+ const decoder = new TextDecoder();
186
+ let buffer = '';
187
+ while (true) {
188
+ const { done, value } = await reader.read();
189
+ if (done)
190
+ break;
191
+ buffer += decoder.decode(value, { stream: true });
192
+ const lines = buffer.split('\n');
193
+ buffer = lines.pop() || '';
194
+ for (const line of lines) {
195
+ const trimmed = line.trim();
196
+ if (!trimmed || !trimmed.startsWith('data: '))
197
+ continue;
198
+ const data = trimmed.slice(6);
199
+ if (data === '[DONE]')
200
+ continue;
201
+ try {
202
+ const parsed = JSON.parse(data);
203
+ const delta = parsed.choices?.[0]?.delta?.content;
204
+ if (delta) {
205
+ fullContent += delta;
206
+ onChunk(delta);
207
+ }
208
+ // Final chunk may include usage
209
+ if (parsed.usage) {
210
+ usage = {
211
+ input: parsed.usage.prompt_tokens ?? 0,
212
+ output: parsed.usage.completion_tokens ?? 0,
213
+ };
214
+ }
215
+ }
216
+ catch {
217
+ // Skip unparseable lines
218
+ }
219
+ }
220
+ }
221
+ return { content: fullContent, usage };
222
+ }
223
+ /**
224
+ * Validate JSON data against a JSON Schema (best-effort, no extra deps)
225
+ */
226
+ function validateJsonSchema(data, schema) {
227
+ // Lightweight validation: check required fields and top-level types
228
+ if (schema.type === 'object' && schema.properties) {
229
+ if (typeof data !== 'object' || data === null || Array.isArray(data)) {
230
+ return { valid: false, errors: 'Expected an object' };
231
+ }
232
+ if (schema.required && Array.isArray(schema.required)) {
233
+ const missing = schema.required.filter((k) => !(k in data));
234
+ if (missing.length > 0) {
235
+ return { valid: false, errors: `Missing required fields: ${missing.join(', ')}` };
236
+ }
237
+ }
238
+ }
239
+ else if (schema.type === 'array') {
240
+ if (!Array.isArray(data)) {
241
+ return { valid: false, errors: 'Expected an array' };
242
+ }
243
+ }
244
+ return { valid: true };
88
245
  }
89
246
  /**
90
247
  * Truncate content to approximately N tokens (rough estimate: 1 token ≈ 4 chars)
@@ -95,114 +252,199 @@ function truncateContent(content, maxTokens = 3000) {
95
252
  return content;
96
253
  return content.slice(0, maxChars) + '\n\n[Content truncated...]';
97
254
  }
255
+ // ---------------------------------------------------------------------------
256
+ // Main agent
257
+ // ---------------------------------------------------------------------------
98
258
  /**
99
259
  * Run autonomous web research agent
100
260
  */
101
261
  export async function runAgent(options) {
102
- const { prompt, urls: startUrls = [], schema, llmApiKey, llmApiBase = 'https://api.openai.com/v1', llmModel = 'gpt-4o-mini', maxPages = 10, maxCredits, onProgress, } = options;
103
- if (!llmApiKey) {
262
+ const { prompt, urls: startUrls = [], schema: legacySchema, outputSchema, llmApiKey, llmApiBase = 'https://api.openai.com/v1', llmModel = 'gpt-4o-mini', maxPages, maxSources: rawMaxSources, depth = 'basic', topic = 'general', maxCredits, onProgress, onEvent, } = options;
263
+ if (!llmApiKey)
104
264
  throw new Error('llmApiKey is required');
105
- }
106
- if (!prompt) {
265
+ if (!prompt)
107
266
  throw new Error('prompt is required');
108
- }
109
- const maxIterations = Math.min(maxPages, 10);
267
+ // Effective schema = outputSchema || legacy schema
268
+ const effectiveSchema = outputSchema || legacySchema;
269
+ // Determine effective maxSources:
270
+ // new param > legacy maxPages > depth-based default
271
+ const depthDefaults = depth === 'thorough'
272
+ ? { maxSources: 10, maxQueries: 3, resultsPerQuery: 10 }
273
+ : { maxSources: 3, maxQueries: 1, resultsPerQuery: 5 };
274
+ const maxSourcesLimit = Math.min(rawMaxSources ?? maxPages ?? depthDefaults.maxSources, 20);
275
+ const maxQueries = depth === 'thorough' ? depthDefaults.maxQueries : depthDefaults.maxQueries;
110
276
  const visitedUrls = new Set();
111
277
  const sources = [];
278
+ const sourcesDetailed = [];
112
279
  let pagesVisited = 0;
113
280
  let creditsUsed = 0;
114
- // Collected data from all pages
281
+ let totalUsage = { input: 0, output: 0 };
115
282
  const collectedData = [];
283
+ // Emit both legacy progress and new event
116
284
  const reportProgress = (status, message, currentUrl) => {
117
285
  if (onProgress) {
118
- onProgress({
119
- status,
120
- currentUrl,
121
- pagesVisited,
122
- message,
123
- });
286
+ onProgress({ status, currentUrl, pagesVisited, message });
124
287
  }
125
288
  };
289
+ const emit = (event) => {
290
+ if (onEvent)
291
+ onEvent(event);
292
+ };
293
+ const accUsage = (u) => {
294
+ totalUsage.input += u.input;
295
+ totalUsage.output += u.output;
296
+ };
126
297
  try {
127
- // Step 1: Determine initial search strategy
128
- reportProgress('searching', 'Planning research strategy...');
298
+ // -----------------------------------------------------------------------
299
+ // Step 1: Determine search strategy & collect URLs
300
+ // -----------------------------------------------------------------------
129
301
  let urlsToVisit = [...startUrls];
130
- // If no starting URLs, ask LLM to generate search queries
131
302
  if (urlsToVisit.length === 0) {
303
+ reportProgress('searching', 'Planning research strategy...');
304
+ const queryCount = depth === 'thorough' ? '3-5' : '2-3';
305
+ const topicHint = topic !== 'general'
306
+ ? `\nFocus queries on ${topic} sources.`
307
+ : '';
132
308
  const planningMessages = [
133
309
  {
134
310
  role: 'system',
135
- content: 'You are a web research assistant. Generate 2-3 specific search queries to find information for the user\'s request. Return JSON only: {"queries": ["query1", "query2", "query3"]}',
136
- },
137
- {
138
- role: 'user',
139
- content: `Research request: ${prompt}`,
311
+ content: `You are a web research assistant. Generate ${queryCount} specific search queries to find information for the user's request.${topicHint}\nReturn JSON only: {"queries": ["query1", "query2", ...]}`,
140
312
  },
313
+ { role: 'user', content: `Research request: ${prompt}` },
141
314
  ];
142
315
  const planResponse = await callLLM(planningMessages, {
143
316
  apiKey: llmApiKey,
144
317
  model: llmModel,
145
318
  baseUrl: llmApiBase,
146
- schema: { queries: ['string'] },
319
+ jsonMode: true,
147
320
  });
148
321
  creditsUsed++;
322
+ accUsage(planResponse.usage);
149
323
  let queries = [];
150
324
  try {
151
- const parsed = JSON.parse(planResponse);
325
+ const parsed = JSON.parse(planResponse.content);
152
326
  queries = parsed.queries || [];
153
327
  }
154
328
  catch {
155
- // Fallback: use the prompt as the query
156
329
  queries = [prompt];
157
330
  }
158
- // Search for URLs
159
- reportProgress('searching', `Searching: ${queries.join(', ')}`);
160
- for (const query of queries.slice(0, 2)) { // Limit to 2 queries
161
- const results = await searchWeb(query, 5);
331
+ // Limit queries to maxQueries
332
+ const effectiveQueries = queries.slice(0, maxQueries);
333
+ for (const rawQuery of effectiveQueries) {
334
+ const query = topic !== 'general' ? enhanceQueryForTopic(rawQuery, topic) : rawQuery;
335
+ reportProgress('searching', `Searching: ${query}`);
336
+ emit({ type: 'step', action: 'searching', query });
337
+ const results = await searchWeb(query, depthDefaults.resultsPerQuery);
338
+ // Sort by topic relevance
339
+ if (topic !== 'general') {
340
+ results.sort((a, b) => scoreByTopic(b, topic) - scoreByTopic(a, topic));
341
+ }
162
342
  urlsToVisit.push(...results.map(r => r.url));
163
- // Stop if we have enough URLs
164
- if (urlsToVisit.length >= maxPages)
165
- break;
343
+ if (urlsToVisit.length >= maxSourcesLimit * 2)
344
+ break; // fetch a bit more than needed to account for failures
166
345
  }
167
- // Deduplicate
168
- urlsToVisit = [...new Set(urlsToVisit)];
346
+ // Deduplicate by hostname+pathname
347
+ const seen = new Set();
348
+ urlsToVisit = urlsToVisit.filter(u => {
349
+ try {
350
+ const key = new URL(u).hostname + new URL(u).pathname;
351
+ if (seen.has(key))
352
+ return false;
353
+ seen.add(key);
354
+ return true;
355
+ }
356
+ catch {
357
+ return false;
358
+ }
359
+ });
169
360
  }
361
+ // -----------------------------------------------------------------------
170
362
  // Step 2: Visit pages and collect data
171
- for (const url of urlsToVisit.slice(0, maxIterations)) {
172
- // Check credit limit
363
+ // -----------------------------------------------------------------------
364
+ const maxToFetch = Math.min(urlsToVisit.length, maxSourcesLimit);
365
+ for (const url of urlsToVisit.slice(0, maxToFetch + 5)) {
366
+ // Enough data collected?
367
+ if (collectedData.length >= maxSourcesLimit)
368
+ break;
173
369
  if (maxCredits && creditsUsed >= maxCredits) {
174
370
  reportProgress('done', 'Credit limit reached');
175
371
  break;
176
372
  }
177
- // Skip already visited URLs
178
373
  if (visitedUrls.has(url))
179
374
  continue;
180
375
  visitedUrls.add(url);
181
376
  reportProgress('visiting', `Fetching: ${url}`, url);
377
+ emit({ type: 'step', action: 'fetching', url });
182
378
  try {
183
- // Fetch the page
184
- const result = await peel(url, {
185
- format: 'markdown',
186
- timeout: 15000,
187
- });
379
+ const result = await peel(url, { format: 'markdown', timeout: 15000 });
188
380
  pagesVisited++;
189
- creditsUsed++; // Count each page fetch as 1 credit
190
- // Truncate content to avoid token overflow
191
- const truncated = truncateContent(result.content, 3000);
192
- collectedData.push({
193
- url: result.url,
194
- title: result.title,
195
- content: truncated,
196
- });
381
+ creditsUsed++;
382
+ const truncated = truncateContent(result.content, depth === 'thorough' ? 4000 : 3000);
383
+ collectedData.push({ url: result.url, title: result.title, content: truncated });
197
384
  sources.push(result.url);
385
+ sourcesDetailed.push({ url: result.url, title: result.title });
198
386
  reportProgress('visiting', `Fetched: ${result.title}`, url);
199
387
  }
200
388
  catch (error) {
201
389
  console.error(`Failed to fetch ${url}:`, error.message);
202
- // Continue with other URLs
203
390
  }
204
391
  }
205
- // Step 3: Extract and compile final data
392
+ // -----------------------------------------------------------------------
393
+ // Step 2b (thorough only): Cross-reference — ask LLM if more info needed
394
+ // -----------------------------------------------------------------------
395
+ if (depth === 'thorough' && collectedData.length > 0 && collectedData.length < maxSourcesLimit) {
396
+ reportProgress('searching', 'Cross-referencing — checking for gaps...');
397
+ emit({ type: 'step', action: 'analyzing', summary: 'Cross-referencing collected data for gaps...' });
398
+ const gapMessages = [
399
+ {
400
+ role: 'system',
401
+ content: 'You are a web research assistant. Given the user\'s research request and summaries of pages already visited, identify any gaps. If more searches would help, return JSON: {"queries":["q1"]}. If no gaps, return {"queries":[]}.',
402
+ },
403
+ {
404
+ role: 'user',
405
+ content: `Research request: ${prompt}\n\nPages visited:\n${collectedData.map(d => `- ${d.title} (${d.url})`).join('\n')}`,
406
+ },
407
+ ];
408
+ try {
409
+ const gapResponse = await callLLM(gapMessages, {
410
+ apiKey: llmApiKey, model: llmModel, baseUrl: llmApiBase, jsonMode: true,
411
+ });
412
+ creditsUsed++;
413
+ accUsage(gapResponse.usage);
414
+ const gapParsed = JSON.parse(gapResponse.content);
415
+ const gapQueries = (gapParsed.queries || []).slice(0, 2);
416
+ for (const q of gapQueries) {
417
+ emit({ type: 'step', action: 'searching', query: q });
418
+ const results = await searchWeb(q, 5);
419
+ for (const r of results) {
420
+ if (collectedData.length >= maxSourcesLimit)
421
+ break;
422
+ if (visitedUrls.has(r.url))
423
+ continue;
424
+ visitedUrls.add(r.url);
425
+ emit({ type: 'step', action: 'fetching', url: r.url });
426
+ try {
427
+ const result = await peel(r.url, { format: 'markdown', timeout: 15000 });
428
+ pagesVisited++;
429
+ creditsUsed++;
430
+ const truncated = truncateContent(result.content, 4000);
431
+ collectedData.push({ url: result.url, title: result.title, content: truncated });
432
+ sources.push(result.url);
433
+ sourcesDetailed.push({ url: result.url, title: result.title });
434
+ }
435
+ catch {
436
+ // skip
437
+ }
438
+ }
439
+ }
440
+ }
441
+ catch {
442
+ // Non-critical — continue with what we have
443
+ }
444
+ }
445
+ // -----------------------------------------------------------------------
446
+ // Step 3: Extract / synthesise final answer
447
+ // -----------------------------------------------------------------------
206
448
  if (collectedData.length === 0) {
207
449
  return {
208
450
  success: false,
@@ -210,18 +452,30 @@ export async function runAgent(options) {
210
452
  sources: [],
211
453
  pagesVisited,
212
454
  creditsUsed,
455
+ tokensUsed: totalUsage,
213
456
  };
214
457
  }
215
458
  reportProgress('extracting', 'Analyzing collected data...');
216
- // Build context from all collected pages
459
+ emit({ type: 'step', action: 'analyzing', summary: `Synthesizing answer from ${collectedData.length} sources...` });
217
460
  const context = collectedData
218
461
  .map(d => `Source: ${d.url}\nTitle: ${d.title}\n\n${d.content}`)
219
462
  .join('\n\n---\n\n');
220
- const truncatedContext = truncateContent(context, 8000); // Larger budget for final analysis
221
- // Build system prompt
222
- const systemPrompt = schema
223
- ? `You are a web research assistant. Extract structured data from the provided web content based on the user's request. Return a JSON object matching this schema:\n${JSON.stringify(schema, null, 2)}\n\nReturn ONLY valid JSON, no explanation.`
224
- : `You are a web research assistant. Extract and compile information from the provided web content based on the user's request. Return a JSON object with your findings. Be comprehensive but concise. Return ONLY valid JSON, no explanation.`;
463
+ const truncatedContext = truncateContent(context, depth === 'thorough' ? 12000 : 8000);
464
+ // Build system prompt based on schema or free-form
465
+ let systemPrompt;
466
+ if (effectiveSchema) {
467
+ systemPrompt =
468
+ 'You are a web research assistant. Extract structured data from the provided web content based on the user\'s request. ' +
469
+ `Return a JSON object matching this schema:\n${JSON.stringify(effectiveSchema, null, 2)}\n\nReturn ONLY valid JSON, no explanation.`;
470
+ }
471
+ else {
472
+ systemPrompt =
473
+ 'You are a web research assistant. Based on the provided web content, answer the user\'s research question. ' +
474
+ 'Provide a comprehensive, well-structured answer. Return a JSON object with:\n' +
475
+ '- "answer": your detailed answer as a string (use markdown formatting)\n' +
476
+ '- "keyFindings": array of key facts/findings\n' +
477
+ 'Return ONLY valid JSON, no explanation.';
478
+ }
225
479
  const extractMessages = [
226
480
  { role: 'system', content: systemPrompt },
227
481
  {
@@ -229,29 +483,62 @@ export async function runAgent(options) {
229
483
  content: `Research request: ${prompt}\n\nCollected data from ${collectedData.length} web pages:\n\n${truncatedContext}`,
230
484
  },
231
485
  ];
232
- const extractResponse = await callLLM(extractMessages, {
233
- apiKey: llmApiKey,
234
- model: llmModel,
235
- baseUrl: llmApiBase,
236
- schema: schema || {},
237
- });
486
+ // Use streaming LLM call when onEvent is present
487
+ const hasStreaming = !!onEvent;
488
+ const extractResponse = await callLLMStreaming(extractMessages, { apiKey: llmApiKey, model: llmModel, baseUrl: llmApiBase, jsonMode: true }, hasStreaming ? (text) => emit({ type: 'chunk', text }) : undefined);
238
489
  creditsUsed++;
490
+ accUsage(extractResponse.usage);
239
491
  // Parse final result
240
492
  let finalData;
241
493
  try {
242
- finalData = JSON.parse(extractResponse);
494
+ finalData = JSON.parse(extractResponse.content);
243
495
  }
244
496
  catch {
245
- // If JSON parsing fails, return the raw response wrapped in an object
246
- finalData = { result: extractResponse };
497
+ finalData = { result: extractResponse.content };
247
498
  }
499
+ // Validate against outputSchema if provided
500
+ if (outputSchema) {
501
+ const validation = validateJsonSchema(finalData, outputSchema);
502
+ if (!validation.valid) {
503
+ // Try once more: ask LLM to fix
504
+ try {
505
+ const fixMessages = [
506
+ {
507
+ role: 'system',
508
+ content: `The previous response did not match the required JSON schema. Fix it.\nSchema: ${JSON.stringify(outputSchema)}\nErrors: ${validation.errors}\nReturn ONLY valid JSON.`,
509
+ },
510
+ { role: 'user', content: extractResponse.content },
511
+ ];
512
+ const fixResponse = await callLLM(fixMessages, {
513
+ apiKey: llmApiKey, model: llmModel, baseUrl: llmApiBase, jsonMode: true,
514
+ });
515
+ creditsUsed++;
516
+ accUsage(fixResponse.usage);
517
+ finalData = JSON.parse(fixResponse.content);
518
+ }
519
+ catch {
520
+ // Return what we have with a warning
521
+ finalData._validationWarning = `Output did not match schema: ${validation.errors}`;
522
+ }
523
+ }
524
+ }
525
+ const answerText = typeof finalData?.answer === 'string' ? finalData.answer : undefined;
248
526
  reportProgress('done', `Completed: ${pagesVisited} pages visited`);
527
+ emit({
528
+ type: 'done',
529
+ answer: answerText || JSON.stringify(finalData),
530
+ sources: sourcesDetailed,
531
+ tokensUsed: totalUsage,
532
+ });
249
533
  return {
250
534
  success: true,
251
535
  data: finalData,
536
+ answer: answerText,
252
537
  sources,
538
+ sourcesDetailed,
253
539
  pagesVisited,
254
540
  creditsUsed,
541
+ tokensUsed: totalUsage,
255
542
  };
256
543
  }
257
544
  catch (error) {
@@ -260,8 +547,10 @@ export async function runAgent(options) {
260
547
  success: false,
261
548
  data: { error: error.message || 'Unknown error occurred' },
262
549
  sources,
550
+ sourcesDetailed,
263
551
  pagesVisited,
264
552
  creditsUsed,
553
+ tokensUsed: totalUsage,
265
554
  };
266
555
  }
267
556
  }