npm - brave-real-browser-mcp-server - Versions diffs - 2.15.5 → 2.15.6 - Mend

brave-real-browser-mcp-server 2.15.5 → 2.15.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (10) hide show

package/dist/handlers/multi-element-handlers.js +0 -67
package/dist/handlers/navigation-handlers.js +59 -0
package/dist/handlers/search-filter-handlers.js +0 -121
package/dist/index.js +5 -17
package/dist/tool-definitions.js +1 -58
package/package.json +2 -2
package/scripts/full-verification.ts +98 -0
package/scripts/live-verification.ts +61 -0
package/dist/handlers/data-processing-handlers.js +0 -49
package/dist/handlers/pagination-handlers.js +0 -115

package/dist/handlers/multi-element-handlers.js CHANGED Viewed

@@ -67,73 +67,6 @@ export async function handleBatchElementScraper(args) {
         };
     }, 'Failed to batch scrape elements');
 }
-/**
- * Parent-child relationships maintain करते हुए data निकालता है
- */
-export async function handleNestedDataExtraction(args) {
-    return await withErrorHandling(async () => {
-        validateWorkflow('nested_data_extraction', {
-            requireBrowser: true,
-            requirePage: true,
-        });
-        const page = getCurrentPage();
-        const parentSelector = args.parentSelector;
-        const childSelector = args.childSelector;
-        const maxParents = args.maxParents || 50;
-        const nestedData = await page.evaluate(({ parentSelector, childSelector, maxParents }) => {
-            const parents = document.querySelectorAll(parentSelector);
-            const results = [];
-            let count = 0;
-            parents.forEach((parent) => {
-                if (count >= maxParents)
-                    return;
-                const parentData = {
-                    selector: parentSelector,
-                    text: Array.from(parent.childNodes)
-                        .filter((node) => node.nodeType === Node.TEXT_NODE)
-                        .map((node) => node.textContent?.trim())
-                        .filter((text) => text)
-                        .join(' '),
-                    attributes: {},
-                };
-                // Get parent attributes
-                Array.from(parent.attributes).forEach((attr) => {
-                    parentData.attributes[attr.name] = attr.value;
-                });
-                // Get children
-                const children = parent.querySelectorAll(childSelector);
-                const childrenData = [];
-                children.forEach((child) => {
-                    const childData = {
-                        selector: childSelector,
-                        text: child.textContent?.trim() || '',
-                        attributes: {},
-                    };
-                    Array.from(child.attributes).forEach((attr) => {
-                        childData.attributes[attr.name] = attr.value;
-                    });
-                    childrenData.push(childData);
-                });
-                if (childrenData.length > 0) {
-                    results.push({
-                        parent: parentData,
-                        children: childrenData,
-                    });
-                    count++;
-                }
-            });
-            return results;
-        }, { parentSelector, childSelector, maxParents });
-        return {
-            content: [
-                {
-                    type: 'text',
-                    text: `✅ Extracted ${nestedData.length} parent-child relationships\n\n${JSON.stringify(nestedData, null, 2)}`,
-                },
-            ],
-        };
-    }, 'Failed to extract nested data');
-}
 /**
  * सभी elements के attributes (href, src, data-*) collect करता है
  */

package/dist/handlers/navigation-handlers.js CHANGED Viewed

@@ -143,3 +143,62 @@ async function withWorkflowValidation(toolName, args, operation) {
         throw error;
     }
 }
+/**
+ * Collects breadcrumb trails (text, href and position of each link) from the current page; it reports the links and does not navigate to them.
+ */
+export async function handleBreadcrumbNavigator(args) {
+    return await withWorkflowValidation('breadcrumb_navigator', args, async () => {
+        return await withErrorHandling(async () => {
+            const page = getPageInstance();
+            if (!page) {
+                throw new Error('Browser not initialized. Call browser_init first.');
+            }
+            const breadcrumbSelector = args.breadcrumbSelector || '.breadcrumb, nav[aria-label="breadcrumb"], .breadcrumbs'; // optional arg; falls back to this default selector list
+            const followLinks = args.followLinks || false; // optional arg; only decides whether the URL hint further down is appended
+            const breadcrumbData = await page.evaluate((selector) => { // callback is handed to page.evaluate and receives breadcrumbSelector as its argument
+                const breadcrumbs = document.querySelectorAll(selector);
+                const results = [];
+                breadcrumbs.forEach((breadcrumb) => {
+                    const links = breadcrumb.querySelectorAll('a');
+                    const items = [];
+                    links.forEach((link, index) => {
+                        items.push({
+                            text: link.textContent?.trim() || '',
+                            href: link.href,
+                            level: index, // zero-based position of the anchor inside this breadcrumb container
+                        });
+                    });
+                    if (items.length > 0) { // containers with no anchors are left out of the results
+                        results.push({
+                            path: items.map((i) => i.text).join(' > '),
+                            links: items,
+                        });
+                    }
+                });
+                return results;
+            }, breadcrumbSelector);
+            if (breadcrumbData.length === 0) {
+                return { // returned as a plain text result; no isError flag is set for the nothing-found case
+                    content: [
+                        {
+                            type: 'text',
+                            text: '❌ No breadcrumbs found on page',
+                        },
+                    ],
+                };
+            }
+            let additionalData = '';
+            if (followLinks && breadcrumbData[0]?.links) { // hint is built from the first trail only
+                additionalData = `\n\n📌 To scrape breadcrumb pages, use multi_page_scraper with URLs: ${JSON.stringify(breadcrumbData[0].links.map((l) => l.href))}`; // NOTE(review): multi_page_scraper is removed from TOOLS and TOOL_NAMES in this same release, so this hint looks stale; confirm
+            }
+            return { // success result: a single text item holding the trail count, the JSON dump and the optional hint
+                content: [
+                    {
+                        type: 'text',
+                        text: `✅ Found ${breadcrumbData.length} breadcrumb trail(s)\n\n${JSON.stringify(breadcrumbData, null, 2)}${additionalData}`,
+                    },
+                ],
+            };
+        }, 'Failed to navigate breadcrumbs');
+    });
+}

package/dist/handlers/search-filter-handlers.js CHANGED Viewed

@@ -262,124 +262,3 @@ export async function handleAdvancedCSSSelectors(args) {
         return { content: [{ type: 'text', text: `❌ CSS selector query failed: ${error.message}` }], isError: true };
     }
 }
-/**
- * Visual Element Finder - Find elements by visual properties
- */
-export async function handleVisualElementFinder(args) {
-    const { url, criteria } = args;
-    try {
-        const page = getPageInstance();
-        if (!page) {
-            throw new Error('Browser not initialized. Call browser_init first.');
-        }
-        if (url && page.url() !== url) {
-            await page.goto(url, { waitUntil: 'networkidle2', timeout: 30000 });
-        }
-        const results = await page.evaluate((crit) => {
-            const allElements = Array.from(document.querySelectorAll('*'));
-            const matches = [];
-            allElements.forEach(element => {
-                const computed = window.getComputedStyle(element);
-                const rect = element.getBoundingClientRect();
-                let matchScore = 0;
-                const reasons = [];
-                // Check visibility
-                if (crit.visible !== undefined) {
-                    const isVisible = computed.display !== 'none' &&
-                        computed.visibility !== 'hidden' &&
-                        rect.width > 0 &&
-                        rect.height > 0;
-                    if (isVisible === crit.visible) {
-                        matchScore += 10;
-                        reasons.push('visibility');
-                    }
-                }
-                // Check color
-                if (crit.color) {
-                    if (computed.color.includes(crit.color) || computed.backgroundColor.includes(crit.color)) {
-                        matchScore += 5;
-                        reasons.push('color');
-                    }
-                }
-                // Check size
-                if (crit.minWidth && rect.width >= crit.minWidth) {
-                    matchScore += 3;
-                    reasons.push('minWidth');
-                }
-                if (crit.maxWidth && rect.width <= crit.maxWidth) {
-                    matchScore += 3;
-                    reasons.push('maxWidth');
-                }
-                if (crit.minHeight && rect.height >= crit.minHeight) {
-                    matchScore += 3;
-                    reasons.push('minHeight');
-                }
-                if (crit.maxHeight && rect.height <= crit.maxHeight) {
-                    matchScore += 3;
-                    reasons.push('maxHeight');
-                }
-                // Check position
-                if (crit.position) {
-                    if (computed.position === crit.position) {
-                        matchScore += 5;
-                        reasons.push('position');
-                    }
-                }
-                // Check text content
-                if (crit.hasText !== undefined) {
-                    const hasText = (element.textContent?.trim().length || 0) > 0;
-                    if (hasText === crit.hasText) {
-                        matchScore += 5;
-                        reasons.push('hasText');
-                    }
-                }
-                // Check if element is in viewport
-                if (crit.inViewport !== undefined) {
-                    const inViewport = rect.top >= 0 &&
-                        rect.left >= 0 &&
-                        rect.bottom <= window.innerHeight &&
-                        rect.right <= window.innerWidth;
-                    if (inViewport === crit.inViewport) {
-                        matchScore += 5;
-                        reasons.push('inViewport');
-                    }
-                }
-                if (matchScore > 0) {
-                    matches.push({
-                        element: {
-                            tagName: element.tagName.toLowerCase(),
-                            id: element.id,
-                            className: element.className,
-                            text: element.textContent?.substring(0, 100)
-                        },
-                        score: matchScore,
-                        matchedCriteria: reasons,
-                        visualProperties: {
-                            display: computed.display,
-                            visibility: computed.visibility,
-                            position: computed.position,
-                            color: computed.color,
-                            backgroundColor: computed.backgroundColor,
-                            width: rect.width,
-                            height: rect.height,
-                            top: rect.top,
-                            left: rect.left
-                        }
-                    });
-                }
-            });
-            matches.sort((a, b) => b.score - a.score);
-            return {
-                totalMatches: matches.length,
-                topMatches: matches.slice(0, 20)
-            };
-        }, criteria);
-        const resultText = `✅ Visual Element Finder Results\n\nCriteria: ${JSON.stringify(criteria, null, 2)}\nTotal Matches: ${results.totalMatches}\n\nTop Matches:\n${JSON.stringify(results.topMatches, null, 2)}`;
-        return {
-            content: [{ type: 'text', text: resultText }],
-        };
-    }
-    catch (error) {
-        return { content: [{ type: 'text', text: `❌ Visual element finder failed: ${error.message}` }], isError: true };
-    }
-}

package/dist/index.js CHANGED Viewed

@@ -28,15 +28,13 @@ import { handleSaveContentAsMarkdown } from "./handlers/file-handlers.js";
 // Import new data extraction handlers
 import { handleExtractJSON, handleScrapeMetaTags, handleExtractSchema, } from "./handlers/data-extraction-handlers.js";
 // Import multi-element handlers
-import { handleBatchElementScraper, handleNestedDataExtraction, handleAttributeHarvester, handleLinkHarvester, handleMediaExtractor, } from "./handlers/multi-element-handlers.js";
+import { handleBatchElementScraper, handleAttributeHarvester, handleLinkHarvester, handleMediaExtractor, } from "./handlers/multi-element-handlers.js";
 // Import pagination handlers
-import { handleMultiPageScraper, handleBreadcrumbNavigator, } from "./handlers/pagination-handlers.js";
-// Import data processing handlers
-import { handleHTMLToText, } from "./handlers/data-processing-handlers.js";
+import { handleBreadcrumbNavigator, } from "./handlers/navigation-handlers.js";
 // Import AI-powered handlers
 import { handleSmartSelectorGenerator, handleContentClassification, } from "./handlers/ai-powered-handlers.js";
 // Import search & filter handlers
-import { handleKeywordSearch, handleRegexPatternMatcher, handleXPathSupport, handleAdvancedCSSSelectors, handleVisualElementFinder, } from "./handlers/search-filter-handlers.js";
+import { handleKeywordSearch, handleRegexPatternMatcher, handleXPathSupport, handleAdvancedCSSSelectors, } from "./handlers/search-filter-handlers.js";
 // Import data quality handlers
 import { handleDataTypeValidator, } from "./handlers/data-quality-handlers.js";
 // Import captcha handlers
@@ -152,9 +150,6 @@ export async function executeToolByName(name, args) {
             case TOOL_NAMES.BATCH_ELEMENT_SCRAPER:
                 result = await handleBatchElementScraper(args);
                 break;
-            case TOOL_NAMES.NESTED_DATA_EXTRACTION:
-                result = await handleNestedDataExtraction(args);
-                break;
             case TOOL_NAMES.ATTRIBUTE_HARVESTER:
                 result = await handleAttributeHarvester(args);
                 break;
@@ -167,16 +162,12 @@ export async function executeToolByName(name, args) {
                 break;
             // Pagination Tools
             // Pagination Tools
-            case TOOL_NAMES.MULTI_PAGE_SCRAPER:
-                result = await handleMultiPageScraper(args);
-                break;
+            // Pagination Tools
             case TOOL_NAMES.BREADCRUMB_NAVIGATOR:
                 result = await handleBreadcrumbNavigator(args || {});
                 break;
             // Data Processing Tools
-            case TOOL_NAMES.HTML_TO_TEXT:
-                result = await handleHTMLToText(args);
-                break;
+            // Data Processing Tools
             // AI-Powered Features
             case TOOL_NAMES.SMART_SELECTOR_GENERATOR:
                 result = await handleSmartSelectorGenerator(args);
@@ -197,9 +188,6 @@ export async function executeToolByName(name, args) {
             case TOOL_NAMES.ADVANCED_CSS_SELECTORS:
                 result = await handleAdvancedCSSSelectors(args);
                 break;
-            case TOOL_NAMES.VISUAL_ELEMENT_FINDER:
-                result = await handleVisualElementFinder(args);
-                break;
             // Data Quality & Validation
             case TOOL_NAMES.DATA_TYPE_VALIDATOR:
                 result = await handleDataTypeValidator(args);

package/dist/tool-definitions.js CHANGED Viewed

@@ -381,19 +381,6 @@ export const TOOLS = [
             required: ['selector'],
         },
     },
-    {
-        name: 'nested_data_extraction',
-        description: 'Extract data maintaining parent-child relationships',
-        inputSchema: {
-            type: 'object',
-            properties: {
-                parentSelector: { type: 'string' },
-                childSelector: { type: 'string' },
-                maxParents: { type: 'number', default: 50 },
-            },
-            required: ['parentSelector', 'childSelector'],
-        },
-    },
     {
         name: 'attribute_harvester',
         description: 'Collect attributes (href, src, data-*) from elements',
@@ -432,19 +419,6 @@ export const TOOLS = [
         },
     },
     // Pagination Tools
-    {
-        name: 'multi_page_scraper',
-        description: 'Collect and merge data from multiple pages',
-        inputSchema: {
-            type: 'object',
-            properties: {
-                urls: { type: 'array', items: { type: 'string' } },
-                dataSelector: { type: 'string' },
-                waitBetweenPages: { type: 'number', default: 1000 },
-            },
-            required: ['urls', 'dataSelector'],
-        },
-    },
     {
         name: 'breadcrumb_navigator',
         description: 'Extract navigation path by following site structure',
@@ -457,19 +431,7 @@ export const TOOLS = [
         },
     },
     // Data Processing Tools
-    {
-        name: 'html_to_text',
-        description: 'Convert HTML content to clean text',
-        inputSchema: {
-            type: 'object',
-            properties: {
-                html: { type: 'string' },
-                preserveLinks: { type: 'boolean', default: false },
-                preserveFormatting: { type: 'boolean', default: false },
-            },
-            required: ['html'],
-        },
-    },
+    // Data Validation Tools
     // Data Validation Tools
     // AI-Powered Features (5 tools)
     {
@@ -553,21 +515,6 @@ export const TOOLS = [
             required: ['selector'],
         },
     },
-    {
-        name: 'visual_element_finder',
-        description: 'Find elements by visual properties',
-        inputSchema: {
-            type: 'object',
-            properties: {
-                url: { type: 'string' },
-                criteria: {
-                    type: 'object',
-                    description: 'Visual criteria (color, size, position, etc.)'
-                },
-            },
-            required: ['criteria'],
-        },
-    },
     // Data Quality & Validation (5 tools)
     {
         name: 'data_type_validator',
@@ -1001,7 +948,6 @@ export const TOOL_NAMES = {
     EXTRACT_SCHEMA: 'extract_schema',
     // Multi-Element Extractors
     BATCH_ELEMENT_SCRAPER: 'batch_element_scraper',
-    NESTED_DATA_EXTRACTION: 'nested_data_extraction',
     ATTRIBUTE_HARVESTER: 'attribute_harvester',
     // Content Type Specific
     LINK_HARVESTER: 'link_harvester',
@@ -1020,10 +966,8 @@ export const TOOL_NAMES = {
     NETWORK_RECORDER: 'network_recorder',
     API_FINDER: 'api_finder',
     // Pagination Tools
-    MULTI_PAGE_SCRAPER: 'multi_page_scraper',
     BREADCRUMB_NAVIGATOR: 'breadcrumb_navigator',
     // Data Processing
-    HTML_TO_TEXT: 'html_to_text',
     // AI-Powered Features
     SMART_SELECTOR_GENERATOR: 'smart_selector_generator',
     CONTENT_CLASSIFICATION: 'content_classification',
@@ -1036,7 +980,6 @@ export const TOOL_NAMES = {
     REGEX_PATTERN_MATCHER: 'regex_pattern_matcher',
     XPATH_SUPPORT: 'xpath_support',
     ADVANCED_CSS_SELECTORS: 'advanced_css_selectors',
-    VISUAL_ELEMENT_FINDER: 'visual_element_finder',
     // Data Quality & Validation
     DATA_TYPE_VALIDATOR: 'data_type_validator',
     // Advanced Captcha Handling

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "brave-real-browser-mcp-server",
-  "version": "2.15.5",
+  "version": "2.15.6",
   "description": "Universal AI IDE MCP Server - Auto-detects and supports all AI IDEs (Claude Desktop, Cursor, Windsurf, Cline, Zed, VSCode, Qoder AI, etc.) with Brave browser automation",
   "type": "module",
   "main": "dist/index.js",
@@ -34,7 +34,7 @@
     "test:brave:cleanup": "taskkill /F /IM brave.exe || pkill -f brave || true"
   },
   "dependencies": {
-    "@modelcontextprotocol/sdk": "^1.25.0",
+    "@modelcontextprotocol/sdk": "^1.25.1",
     "@types/turndown": "^5.0.6",
     "ajv": "^8.12.0",
     "axios": "^1.6.5",

package/scripts/full-verification.ts ADDED Viewed

@@ -0,0 +1,98 @@
+import { handleBrowserInit, handleBrowserClose } from '../src/handlers/browser-handlers.js';
+import { handleNavigate, handleWait } from '../src/handlers/navigation-handlers.js';
+import { handleGetContent, handleFindSelector } from '../src/handlers/content-handlers.js';
+import { handleBreadcrumbNavigator } from '../src/handlers/navigation-handlers.js';
+import {
+    handleBatchElementScraper,
+    handleAttributeHarvester,
+    handleLinkHarvester,
+    handleMediaExtractor
+} from '../src/handlers/multi-element-handlers.js';
+import {
+    handleKeywordSearch,
+    handleRegexPatternMatcher,
+    handleXPathSupport,
+    handleAdvancedCSSSelectors
+} from '../src/handlers/search-filter-handlers.js';
+import { handleRandomScroll } from '../src/handlers/interaction-handlers.js';
+import { handleScrapeMetaTags, handleExtractSchema } from '../src/handlers/data-extraction-handlers.js';
+async function runFullVerification() { // Runs twelve handler checks in sequence against one live site and logs truncated results
+    console.log('🚀 Starting Comprehensive Tool Verification...');
+    try {
+        await handleBrowserInit({ headless: true });
+        // Only this one site is exercised by this script
+        const url = 'https://moviesdrive.forum/';
+        console.log(`\n--------------------------------------------------`);
+        console.log(`🔍 Targeting: ${url}`);
+        console.log(`--------------------------------------------------`);
+        // --- Navigation & Basic ---
+        console.log(`\n[1/12] 🟢 Testing Navigation & Wait...`);
+        await handleNavigate({ url });
+        await handleWait({ type: 'timeout', value: '2000' }); // value is passed as a string; presumably milliseconds, confirm against handleWait
+        console.log('   ✅ Navigation complete.');
+        // --- Interaction ---
+        console.log(`\n[2/12] 🟢 Testing Random Scroll...`);
+        await handleRandomScroll({});
+        console.log('   ✅ Scroll complete.');
+        // --- Content Handlers ---
+        console.log(`\n[3/12] 🟢 Testing Find Selector (Text search)...`);
+        const findRes = await handleFindSelector({ text: 'Movie' }); // Assuming "Movie" exists
+        console.log(`   Result: Found ${findRes.content[0].text.length > 50 ? 'matches' : 'no matches'} (Length: ${findRes.content[0].text.length})`); // the matches label is decided only by the response text being longer than 50 characters
+        // --- Multi-Element Handlers (The file we kept) ---
+        console.log(`\n[4/12] 🟢 Testing Batch Element Scraper...`);
+        const batchRes = await handleBatchElementScraper({ selector: 'a', maxElements: 3 });
+        console.log(`   Result: ${batchRes.content[0].text.substring(0, 100)}...`); // from here on each step logs only the first 100 characters of the first content item
+        console.log(`\n[5/12] 🟢 Testing Attribute Harvester...`);
+        const attrRes = await handleAttributeHarvester({ selector: 'img', attributes: ['src'], maxElements: 3 });
+        console.log(`   Result: ${attrRes.content[0].text.substring(0, 100)}...`);
+        console.log(`\n[6/12] 🟢 Testing Media Extractor...`); // Might be empty on home page but runs logic
+        const mediaRes = await handleMediaExtractor({ types: ['video', 'iframe'] });
+        console.log(`   Result: ${mediaRes.content[0].text.substring(0, 100)}...`);
+        // --- Search & Filter Handlers (The file we kept) ---
+        console.log(`\n[7/12] 🟢 Testing Keyword Search...`);
+        const keyRes = await handleKeywordSearch({ keywords: ['Bollywood', 'Hollywood'] });
+        console.log(`   Result: ${keyRes.content[0].text.substring(0, 100)}...`);
+        console.log(`\n[8/12] 🟢 Testing Regex Pattern Matcher...`);
+        const regexRes = await handleRegexPatternMatcher({ pattern: 'https?://[^\\s"\']+' });
+        console.log(`   Result: ${regexRes.content[0].text.substring(0, 100)}...`);
+        console.log(`\n[9/12] 🟢 Testing XPath Support...`);
+        const xpathRes = await handleXPathSupport({ xpath: '//body//div' });
+        console.log(`   Result: ${xpathRes.content[0].text.substring(0, 100)}...`);
+        console.log(`\n[10/12] 🟢 Testing Advanced CSS Selectors...`);
+        const cssRes = await handleAdvancedCSSSelectors({ selector: 'div > a', operation: 'query' });
+        console.log(`   Result: ${cssRes.content[0].text.substring(0, 100)}...`);
+        // --- Data Extraction ---
+        console.log(`\n[11/12] 🟢 Testing Schema Extraction...`);
+        const schemaRes = await handleExtractSchema({});
+        console.log(`   Result: ${schemaRes.content[0].text.substring(0, 100)}...`);
+        // --- Pagination (Refactored) ---
+        console.log(`\n[12/12] 🟢 Testing Breadcrumb Navigator...`);
+        const breadRes = await handleBreadcrumbNavigator({});
+        console.log(`   Result: ${breadRes.content[0].text.substring(0, 100)}...`);
+        console.log('\n✅ All primary handler categories verified successfully.'); // reached when no step threw; result contents are logged, not asserted
+    } catch (error) { // a failure is only logged here; nothing is rethrown and no exit code is set
+        console.error('\n❌ Verification Failed:', error);
+    } finally { // runs on both paths; a rejection from handleBrowserClose is not caught inside this function
+        await handleBrowserClose({});
+    }
+}
+runFullVerification(); // the returned promise is neither awaited nor given a catch handler

package/scripts/live-verification.ts ADDED Viewed

@@ -0,0 +1,61 @@
+import { handleBrowserInit, handleBrowserClose } from '../src/handlers/browser-handlers.js';
+import { handleNavigate } from '../src/handlers/navigation-handlers.js';
+import { handleGetContent } from '../src/handlers/content-handlers.js';
+import { handleBreadcrumbNavigator } from '../src/handlers/navigation-handlers.js';
+import { handleLinkHarvester } from '../src/handlers/multi-element-handlers.js';
+import { handleScrapeMetaTags } from '../src/handlers/data-extraction-handlers.js';
+async function runVerification() { // Visits each listed live site in turn and logs truncated output from four handlers
+    console.log('🚀 Starting Verification on Live Sites...');
+    try {
+        // 1. Initialize Browser
+        console.log('\n🔵 Initializing Browser...');
+        await handleBrowserInit({ headless: true });
+        const sites = [
+            'https://moviesdrive.forum/',
+            'https://multimovies.golf/'
+        ];
+        for (const url of sites) { // sites are processed one after another after the single handleBrowserInit call above
+            console.log(`\n--------------------------------------------------`);
+            console.log(`🔍 Testing Site: ${url}`);
+            console.log(`--------------------------------------------------`);
+            // 2. Navigate
+            console.log(`\n➡️ Navigating to ${url}...`);
+            await handleNavigate({ url });
+            // 3. Get Content (requested with type 'text'; first 100 characters logged)
+            console.log(`\n📄 Fetching Content (Preview)...`);
+            const contentRes = await handleGetContent({ type: 'text' });
+            console.log(`   Result: ${contentRes.content[0].text.substring(0, 100)}...`);
+            // 4. Test Breadcrumb Navigator (imported from navigation-handlers)
+            console.log(`\nnav Testing Breadcrumb Navigator...`);
+            const breadcrumbRes = await handleBreadcrumbNavigator({});
+            console.log(`   Result: ${breadcrumbRes.content[0].text.substring(0, 200)}...`);
+            // 5. Test Link Harvester (Existing tool)
+            console.log(`\n🔗 Testing Link Harvester (First 5 links)...`);
+            const linksRes = await handleLinkHarvester({ maxElements: 5 });
+            console.log(`   Result: ${linksRes.content[0].text.substring(0, 200)}...`);
+            // 6. Test Meta Tags (Data extraction)
+            console.log(`\n🏷️ Testing Meta Tag Scraper...`);
+            const metaRes = await handleScrapeMetaTags({});
+            console.log(`   Result: ${metaRes.content[0].text.substring(0, 200)}...`);
+        }
+    } catch (error) { // the try wraps the whole loop, so one throw skips the remaining sites; the error is only logged
+        console.error('\n❌ Verification Failed:', error);
+    } finally {
+        // 7. Cleanup (runs on both paths; a rejection from handleBrowserClose is not caught inside this function)
+        console.log('\n🔴 Closing Browser...');
+        await handleBrowserClose({});
+    }
+}
+runVerification(); // the returned promise is neither awaited nor given a catch handler

package/dist/handlers/data-processing-handlers.js DELETED Viewed

@@ -1,49 +0,0 @@
-// Data Processing & Transformation Handlers
-// Text cleaning, validation, formatting utilities
-// @ts-nocheck
-import { withErrorHandling } from '../system-utils.js';
-/**
- * HTML tags intelligently remove करता है
- */
-export async function handleHTMLToText(args) {
-    return await withErrorHandling(async () => {
-        const html = args.html;
-        const preserveLinks = args.preserveLinks || false;
-        const preserveFormatting = args.preserveFormatting || false;
-        // Simple HTML to text conversion (can be enhanced with turndown)
-        let text = html;
-        // Preserve links if requested
-        if (preserveLinks) {
-            text = text.replace(/<a[^>]*href="([^"]*)"[^>]*>(.*?)<\/a>/gi, '$2 ($1)');
-        }
-        // Preserve basic formatting
-        if (preserveFormatting) {
-            text = text.replace(/<br\s*\/?>/gi, '\n');
-            text = text.replace(/<\/p>/gi, '\n\n');
-            text = text.replace(/<li>/gi, '• ');
-            text = text.replace(/<\/li>/gi, '\n');
-        }
-        // Remove all other HTML tags
-        text = text.replace(/<[^>]*>/g, '');
-        // Decode HTML entities
-        text = text
-            .replace(/&nbsp;/g, ' ')
-            .replace(/&amp;/g, '&')
-            .replace(/&lt;/g, '<')
-            .replace(/&gt;/g, '>')
-            .replace(/&quot;/g, '"')
-            .replace(/&#39;/g, "'");
-        // Clean up whitespace
-        text = text.replace(/\n\s*\n/g, '\n\n');
-        text = text.trim();
-        return {
-            content: [
-                {
-                    type: 'text',
-                    text: `✅ HTML converted to text\n\n${text}`,
-                },
-            ],
-        };
-    }, 'Failed to convert HTML to text');
-}
-// Duplicate Remover Arguments

package/dist/handlers/pagination-handlers.js DELETED Viewed

@@ -1,115 +0,0 @@
-// Pagination & Navigation Tools
-// Auto pagination, infinite scroll, multi-page scraping, sitemap parser
-// @ts-nocheck
-import { getCurrentPage } from '../browser-manager.js';
-import { validateWorkflow } from '../workflow-validation.js';
-import { withErrorHandling, sleep } from '../system-utils.js';
-/**
- * Multiple pages से data collect और merge करता है
- */
-export async function handleMultiPageScraper(args) {
-    return await withErrorHandling(async () => {
-        validateWorkflow('multi_page_scraper', {
-            requireBrowser: true,
-            requirePage: true,
-        });
-        const page = getCurrentPage();
-        const urls = args.urls;
-        const dataSelector = args.dataSelector;
-        const waitBetweenPages = args.waitBetweenPages || 1000;
-        const allData = [];
-        for (let i = 0; i < urls.length; i++) {
-            const url = urls[i];
-            try {
-                await page.goto(url, { waitUntil: 'domcontentloaded' });
-                await sleep(waitBetweenPages);
-                const pageData = await page.evaluate((selector) => {
-                    const elements = document.querySelectorAll(selector);
-                    return Array.from(elements).map((el) => ({
-                        text: el.textContent?.trim() || '',
-                        html: el.innerHTML,
-                    }));
-                }, dataSelector);
-                allData.push({
-                    url,
-                    pageIndex: i,
-                    itemCount: pageData.length,
-                    data: pageData,
-                });
-            }
-            catch (error) {
-                allData.push({
-                    url,
-                    pageIndex: i,
-                    error: error instanceof Error ? error.message : String(error),
-                });
-            }
-        }
-        return {
-            content: [
-                {
-                    type: 'text',
-                    text: `✅ Scraped ${urls.length} pages\n\n${JSON.stringify(allData, null, 2)}`,
-                },
-            ],
-        };
-    }, 'Failed to scrape multiple pages');
-}
-/**
- * Site structure follow करके pages scrape करता है
- */
-export async function handleBreadcrumbNavigator(args) {
-    return await withErrorHandling(async () => {
-        validateWorkflow('breadcrumb_navigator', {
-            requireBrowser: true,
-            requirePage: true,
-        });
-        const page = getCurrentPage();
-        const breadcrumbSelector = args.breadcrumbSelector || '.breadcrumb, nav[aria-label="breadcrumb"], .breadcrumbs';
-        const followLinks = args.followLinks || false;
-        const breadcrumbData = await page.evaluate((selector) => {
-            const breadcrumbs = document.querySelectorAll(selector);
-            const results = [];
-            breadcrumbs.forEach((breadcrumb) => {
-                const links = breadcrumb.querySelectorAll('a');
-                const items = [];
-                links.forEach((link, index) => {
-                    items.push({
-                        text: link.textContent?.trim() || '',
-                        href: link.href,
-                        level: index,
-                    });
-                });
-                if (items.length > 0) {
-                    results.push({
-                        path: items.map((i) => i.text).join(' > '),
-                        links: items,
-                    });
-                }
-            });
-            return results;
-        }, breadcrumbSelector);
-        if (breadcrumbData.length === 0) {
-            return {
-                content: [
-                    {
-                        type: 'text',
-                        text: '❌ No breadcrumbs found on page',
-                    },
-                ],
-            };
-        }
-        let additionalData = '';
-        if (followLinks && breadcrumbData[0]?.links) {
-            additionalData = `\n\n📌 To scrape breadcrumb pages, use multi_page_scraper with URLs: ${JSON.stringify(breadcrumbData[0].links.map((l) => l.href))}`;
-        }
-        return {
-            content: [
-                {
-                    type: 'text',
-                    text: `✅ Found ${breadcrumbData.length} breadcrumb trail(s)\n\n${JSON.stringify(breadcrumbData, null, 2)}${additionalData}`,
-                },
-            ],
-        };
-    }, 'Failed to navigate breadcrumbs');
-}