PyPI - iflow-mcp_janspoerer-mcp_browser_use - Versions diffs - 0.1.0__py3-none-any.whl - Mend

iflow-mcp_janspoerer-mcp_browser_use 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (50) hide show

iflow_mcp_janspoerer_mcp_browser_use-0.1.0.dist-info/METADATA +26 -0
iflow_mcp_janspoerer_mcp_browser_use-0.1.0.dist-info/RECORD +50 -0
iflow_mcp_janspoerer_mcp_browser_use-0.1.0.dist-info/WHEEL +5 -0
iflow_mcp_janspoerer_mcp_browser_use-0.1.0.dist-info/entry_points.txt +2 -0
iflow_mcp_janspoerer_mcp_browser_use-0.1.0.dist-info/licenses/LICENSE +201 -0
iflow_mcp_janspoerer_mcp_browser_use-0.1.0.dist-info/top_level.txt +1 -0
mcp_browser_use/__init__.py +2 -0
mcp_browser_use/__main__.py +1347 -0
mcp_browser_use/actions/__init__.py +1 -0
mcp_browser_use/actions/elements.py +173 -0
mcp_browser_use/actions/extraction.py +864 -0
mcp_browser_use/actions/keyboard.py +43 -0
mcp_browser_use/actions/navigation.py +73 -0
mcp_browser_use/actions/screenshots.py +85 -0
mcp_browser_use/browser/__init__.py +1 -0
mcp_browser_use/browser/chrome.py +150 -0
mcp_browser_use/browser/chrome_executable.py +204 -0
mcp_browser_use/browser/chrome_launcher.py +330 -0
mcp_browser_use/browser/chrome_process.py +104 -0
mcp_browser_use/browser/devtools.py +230 -0
mcp_browser_use/browser/driver.py +322 -0
mcp_browser_use/browser/process.py +133 -0
mcp_browser_use/cleaners.py +530 -0
mcp_browser_use/config/__init__.py +30 -0
mcp_browser_use/config/environment.py +155 -0
mcp_browser_use/config/paths.py +97 -0
mcp_browser_use/constants.py +68 -0
mcp_browser_use/context.py +150 -0
mcp_browser_use/context_pack.py +85 -0
mcp_browser_use/decorators/__init__.py +13 -0
mcp_browser_use/decorators/ensure.py +84 -0
mcp_browser_use/decorators/envelope.py +83 -0
mcp_browser_use/decorators/locking.py +172 -0
mcp_browser_use/helpers.py +173 -0
mcp_browser_use/helpers_context.py +261 -0
mcp_browser_use/locking/__init__.py +1 -0
mcp_browser_use/locking/action_lock.py +190 -0
mcp_browser_use/locking/file_mutex.py +139 -0
mcp_browser_use/locking/window_registry.py +178 -0
mcp_browser_use/tools/__init__.py +59 -0
mcp_browser_use/tools/browser_management.py +260 -0
mcp_browser_use/tools/debugging.py +195 -0
mcp_browser_use/tools/extraction.py +58 -0
mcp_browser_use/tools/interaction.py +323 -0
mcp_browser_use/tools/navigation.py +84 -0
mcp_browser_use/tools/screenshots.py +116 -0
mcp_browser_use/utils/__init__.py +1 -0
mcp_browser_use/utils/diagnostics.py +85 -0
mcp_browser_use/utils/html_utils.py +118 -0
mcp_browser_use/utils/retry.py +57 -0

mcp_browser_use/browser/driver.py ADDED Viewed

@@ -0,0 +1,322 @@
+"""WebDriver creation and window management."""
+import os
+import time
+import shutil
+import subprocess
+from typing import Optional
+from selenium import webdriver
+from selenium.common.exceptions import (
+    NoSuchWindowException,
+    WebDriverException,
+)
+import logging
+logger = logging.getLogger(__name__)
+# Import context for state management
+from ..context import get_context
+from .devtools import _ensure_debugger_ready, _handle_for_target
+from .process import make_process_tag, ensure_process_tag, chromedriver_log_path
+from ..locking.window_registry import (
+    cleanup_orphaned_windows,
+    _register_window,
+    _unregister_window,
+)
+def _ensure_driver() -> None:
+    """Lazily attach a Selenium driver to the debuggable Chrome instance.
+    Does nothing when the context already holds a driver. Otherwise the
+    debugger readiness check runs first, and a driver is created only if the
+    context then has both a debugger host and a debugger port; if either is
+    missing, ``ctx.driver`` is left as ``None``.
+    """
+    ctx = get_context()
+    if ctx.driver is None:
+        _ensure_debugger_ready(ctx.config)
+        host = ctx.debugger_host
+        port = ctx.debugger_port
+        if host and port:
+            ctx.driver = create_webdriver(host, port, ctx.config)
+def _validate_window_context(driver: webdriver.Chrome, expected_target_id: str) -> bool:
+    """
+    Check whether the driver is currently focused on the expected target.
+    The check passes when the current window handle ends with
+    ``expected_target_id`` or, failing that, when the target id reported by
+    the ``Target.getTargetInfo`` CDP command equals it.
+    Returns False for an empty ``expected_target_id`` and whenever any lookup
+    raises (for example when the window no longer exists).
+    """
+    if not expected_target_id:
+        return False
+    try:
+        handle = driver.current_window_handle
+        if handle and handle.endswith(expected_target_id):
+            return True
+        # Handle did not match: ask CDP which target is attached instead.
+        reply = driver.execute_cdp_cmd("Target.getTargetInfo", {}) or {}
+        nested = reply.get("targetInfo") or {}
+        active_target = nested.get("targetId") or reply.get("targetId")
+        return active_target == expected_target_id
+    except Exception:
+        # Any window or CDP failure counts as "not validated".
+        return False
+def _ensure_singleton_window(driver: webdriver.Chrome):
+    """
+    Ensure this process has one usable browser window and that Selenium is
+    switched to it.
+    Steps:
+      0. If the context already records a target, validate it; on failure try
+         switching to its handle, and if that also fails reset the window state.
+      1. If no target is recorded, clean up orphaned windows (best effort) and
+         create a window through CDP, storing the ids on the context.
+      2. Resolve the target id to a Selenium window handle (polling briefly),
+         switch to it, validate, and register the window for this process.
+    Raises:
+        RuntimeError: if the last-resort ``Target.createTarget`` returns an
+            unexpected payload, if no window handle can be found for the
+            target, or if the window context cannot be validated after
+            switching. Exceptions raised by the last-resort CDP call itself
+            are not caught here.
+    """
+    ctx = get_context()
+    # 0) If we already have a target, validate context
+    if ctx.target_id:
+        if _validate_window_context(driver, ctx.target_id):
+            return
+        # Context validation failed - attempt recovery by switching to the
+        # Selenium handle that corresponds to the recorded target
+        h = _handle_for_target(driver, ctx.target_id)
+        if h:
+            try:
+                driver.switch_to.window(h)
+                if _validate_window_context(driver, ctx.target_id):
+                    return
+            except Exception:
+                # Switching failed; fall through to the reset below
+                pass
+        # Recovery failed - clear target and recreate
+        # (presumably reset_window_state() clears ctx.target_id so that step 1 runs - verify in context.py)
+        ctx.reset_window_state()
+    # 1) Create new window if we don't have a target
+    if not ctx.target_id:
+        # Cleanup orphaned windows; a failure here is only logged
+        try:
+            cleanup_orphaned_windows(driver)
+        except Exception as e:
+            logger.debug(f"Window cleanup failed (non-critical): {e}")
+        try:
+            # First choice: ask CDP for a new window and read both ids from the reply
+            win = driver.execute_cdp_cmd("Browser.createWindow", {"state": "normal"})
+            if not isinstance(win, dict):
+                raise RuntimeError(f"Browser.createWindow returned {win!r}")
+            ctx.window_id = win.get("windowId")
+            ctx.target_id = win.get("targetId")
+            if not ctx.target_id:
+                # Fallback: the reply carried no targetId, so create a target explicitly
+                t = driver.execute_cdp_cmd("Target.createTarget", {"url": "about:blank", "newWindow": True})
+                if not isinstance(t, dict) or "targetId" not in t:
+                    raise RuntimeError(f"Target.createTarget returned {t!r}")
+                ctx.target_id = t["targetId"]
+                if not ctx.window_id:
+                    # Look up the window id for the new target; None if that fails
+                    try:
+                        w = driver.execute_cdp_cmd("Browser.getWindowForTarget", {"targetId": ctx.target_id}) or {}
+                        ctx.window_id = w.get("windowId")
+                    except Exception:
+                        ctx.window_id = None
+        except Exception:
+            # Last resort: any failure above (including the RuntimeErrors raised
+            # inside this try) lands here and Target.createTarget is attempted
+            # once more; errors from this attempt propagate to the caller
+            t = driver.execute_cdp_cmd("Target.createTarget", {"url": "about:blank", "newWindow": True})
+            if not isinstance(t, dict) or "targetId" not in t:
+                raise RuntimeError(f"Target.createTarget returned {t!r}")
+            ctx.target_id = t["targetId"]
+            try:
+                w = driver.execute_cdp_cmd("Browser.getWindowForTarget", {"targetId": ctx.target_id}) or {}
+                ctx.window_id = w.get("windowId")
+            except Exception:
+                ctx.window_id = None
+    # 2) Map targetId -> Selenium handle
+    h = _handle_for_target(driver, ctx.target_id)
+    if not h:
+        # Poll up to 20 more times, 50 ms apart (about one second in total)
+        for _ in range(20):
+            time.sleep(0.05)
+            h = _handle_for_target(driver, ctx.target_id)
+            if h:
+                break
+    if h:
+        driver.switch_to.window(h)
+        if not _validate_window_context(driver, ctx.target_id):
+            raise RuntimeError(f"Failed to establish correct window context for target {ctx.target_id}")
+        # Register window under this process's tag; a failure here is only logged
+        try:
+            owner = ensure_process_tag()
+            _register_window(owner, ctx.target_id, ctx.window_id)
+        except Exception as e:
+            logger.debug(f"Window registration failed (non-critical): {e}")
+    else:
+        raise RuntimeError(f"Failed to find window handle for target {ctx.target_id}")
+def _ensure_driver_and_window() -> None:
+    """Make sure a driver exists and, if it does, that its singleton window is ready.
+    When no driver could be attached, the window step is skipped.
+    """
+    _ensure_driver()
+    active_driver = get_context().driver
+    if active_driver is not None:
+        _ensure_singleton_window(active_driver)
+def _close_extra_blank_windows_safe(driver, exclude_handles=None) -> int:
+    """
+    Close extra blank windows, only within our own OS window.
+    A handle is closed only if it is not in ``exclude_handles``, is not the
+    handle that was current on entry, resolves (via CDP) to the same
+    ``windowId`` as ``ctx.window_id``, and shows a blank page.
+    Args:
+        driver: Selenium driver whose window handles are inspected.
+        exclude_handles: optional iterable of handles that must never be closed.
+    Returns:
+        The number of windows closed; 0 when the context has no window id.
+    """
+    exclude = set(exclude_handles or ())
+    ctx = get_context()
+    own_window_id = ctx.window_id
+    if own_window_id is None:
+        # Without a known window id we cannot tell which tabs are ours
+        return 0
+    try:
+        keep = driver.current_window_handle
+    except Exception:
+        keep = None
+    closed = 0
+    # Iterate over a snapshot of the handle list, since closing changes it
+    for h in list(getattr(driver, "window_handles", [])):
+        if h in exclude or (keep and h == keep):
+            continue
+        try:
+            driver.switch_to.window(h)
+            # Map this handle -> targetId -> windowId
+            info = driver.execute_cdp_cmd("Target.getTargetInfo", {}) or {}
+            tid = (info.get("targetInfo") or {}).get("targetId") or info.get("targetId")
+            if not tid:
+                continue
+            w = driver.execute_cdp_cmd("Browser.getWindowForTarget", {"targetId": tid}) or {}
+            if w.get("windowId") != own_window_id:
+                # Belongs to another agent's OS window; do not touch
+                continue
+            url = (driver.current_url or "").lower()
+            title = (driver.title or "").strip()
+            # Blank means: a known blank URL, or no URL and no title at all
+            if url in ("about:blank", "chrome://newtab/") or (not url and not title):
+                driver.close()
+                closed += 1
+        except Exception:
+            # Any failure on one handle just skips that handle
+            continue
+    # Restore our original window if it still exists
+    # NOTE(review): when `keep` is None the driver stays on whichever handle was visited last - confirm callers tolerate that
+    if keep and keep in getattr(driver, "window_handles", []):
+        try:
+            driver.switch_to.window(keep)
+        except Exception:
+            pass
+    return closed
+def close_singleton_window() -> bool:
+    """Close this process's singleton window while leaving Chrome running.
+    The target is closed through the ``Target.closeTarget`` CDP command; if
+    that raises, the matching Selenium handle is switched to and closed
+    instead. On success the window is unregistered for this process (best
+    effort). The context's window state is reset whether or not closing worked.
+    Returns:
+        True if the window was closed, False otherwise (including when there
+        is no driver or no recorded target).
+    """
+    ctx = get_context()
+    drv = ctx.driver
+    target = ctx.target_id
+    if drv is None or not target:
+        return False
+    try:
+        drv.execute_cdp_cmd("Target.closeTarget", {"targetId": target})
+        closed = True
+    except Exception:
+        closed = False
+        # CDP close failed: fall back to closing through the Selenium handle.
+        try:
+            handle = _handle_for_target(drv, target)
+            if handle:
+                drv.switch_to.window(handle)
+                drv.close()
+                closed = True
+        except Exception:
+            pass
+    if closed:
+        # Registry bookkeeping is non-critical; failures are only logged.
+        try:
+            _unregister_window(ensure_process_tag())
+        except Exception as e:
+            logger.debug(f"Window unregistration failed (non-critical): {e}")
+    ctx.reset_window_state()
+    return closed
+def create_webdriver(debugger_host: str, debugger_port: int, config: dict) -> webdriver.Chrome:
+    """Create a Chrome WebDriver attached to an existing DevTools endpoint.
+    Args:
+        debugger_host: host part of the ``debuggerAddress`` option.
+        debugger_port: port part of the ``debuggerAddress`` option.
+        config: settings dict; ``chrome_path`` (if set) becomes the browser
+            binary location, and the dict is also used to derive the
+            chromedriver log path.
+    Returns:
+        The connected ``webdriver.Chrome`` instance.
+    """
+    from selenium.webdriver.chrome.options import Options
+    from selenium.webdriver.chrome.service import Service as ChromeService
+    chrome_options = Options()
+    binary = config.get("chrome_path")
+    if binary:
+        chrome_options.binary_location = binary
+    chrome_options.add_experimental_option(
+        "debuggerAddress",
+        f"{debugger_host}:{debugger_port}",
+    )
+    log_target = chromedriver_log_path(config)
+    # Newer Selenium takes log_output; older releases only know log_path and
+    # reject the unknown keyword with TypeError.
+    try:
+        chrome_service = ChromeService(log_output=log_target)
+    except TypeError:
+        chrome_service = ChromeService(log_path=log_target)
+    return webdriver.Chrome(service=chrome_service, options=chrome_options)
+def _cleanup_own_blank_tabs(driver):
+    """Best-effort removal of blank tabs in our own window; never raises.
+    The handle that is current on entry is passed as an excluded handle so it
+    is not closed. Failures at any step are logged at debug level and ignored.
+    Args:
+        driver: Selenium driver to clean up.
+    """
+    # Read the handle inside a try: getattr(..., None) would only cover a
+    # missing attribute, while Selenium raises its own exceptions (e.g. when
+    # the current window is already gone) from this property.
+    try:
+        handle = driver.current_window_handle
+    except Exception as e:
+        logger.debug(f"Current window handle unavailable (non-critical): {e}")
+        handle = None
+    try:
+        _close_extra_blank_windows_safe(
+            driver,
+            exclude_handles={handle} if handle else None,
+        )
+    except Exception as e:
+        logger.debug(f"Blank tab cleanup failed (non-critical): {e}")
+def get_chromedriver_capability_version(driver: Optional[webdriver.Chrome] = None) -> Optional[str]:
+    """
+    Best effort Chromedriver version string.
+    - If a driver is provided, prefer the version from its capabilities:
+      ``capabilities['chrome']['chromedriverVersion']`` (where ChromeDriver
+      reports it), then a top-level ``chromedriverVersion`` key. Only the
+      leading version token is returned, e.g. "114.0.5735.90".
+    - Else, fall back to `chromedriver --version` if available in PATH; in
+      that case the command's full stripped output is returned.
+    Returns:
+        The version string, or None when it cannot be determined.
+    """
+    try:
+        if driver is not None:
+            caps = driver.capabilities or {}
+            chrome_caps = caps.get("chrome")
+            v = chrome_caps.get("chromedriverVersion") if isinstance(chrome_caps, dict) else None
+            if not v:
+                # Keep honouring a top-level key for drivers that expose one
+                v = caps.get("chromedriverVersion")
+            if isinstance(v, str) and v:
+                # Typically like "114.0.5735.90 (some hash)"
+                return v.split(" ")[0]
+        path = shutil.which("chromedriver")
+        if path:
+            # Bounded wait so a stuck binary cannot hang the caller
+            out = subprocess.check_output(
+                [path, "--version"],
+                stderr=subprocess.STDOUT,
+                timeout=10,
+            ).decode().strip()
+            return out
+    except Exception as e:
+        # Version lookup is informational only; never let it fail the caller
+        logger.debug(f"Chromedriver version lookup failed (non-critical): {e}")
+    return None
+# Names exported by `from ... import *`. The underscore-prefixed helpers are
+# listed explicitly, and `ensure_process_tag` (imported from .process above) is
+# re-exported from this module.
+__all__ = [
+    'create_webdriver',
+    '_ensure_driver',
+    '_ensure_driver_and_window',
+    '_ensure_singleton_window',
+    'close_singleton_window',
+    '_cleanup_own_blank_tabs',
+    '_close_extra_blank_windows_safe',
+    'get_chromedriver_capability_version',
+    '_validate_window_context',
+    'ensure_process_tag',
+]

mcp_browser_use/browser/process.py ADDED Viewed

@@ -0,0 +1,133 @@
+"""Process and port management."""
+import os
+import json
+import time
+import socket
+import tempfile
+import psutil
+from typing import Optional, Tuple
+from ..constants import RENDEZVOUS_TTL_SEC
+from ..config.environment import profile_key
+def _is_port_open(host: str, port: int, timeout: float = 0.25) -> bool:
+    """Return True if a TCP connection to ``host:port`` succeeds within ``timeout`` seconds.
+    Any error while connecting (or while closing the probe socket) yields False.
+    """
+    try:
+        probe = socket.create_connection((host, port), timeout=timeout)
+        probe.close()
+    except Exception:
+        return False
+    else:
+        return True
+def get_free_port() -> int:
+    """Return a port number the OS handed out for a bind to 127.0.0.1 port 0.
+    The probe socket is closed before returning, so the port is only free at
+    the moment of the call.
+    """
+    probe = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
+    try:
+        probe.bind(("127.0.0.1", 0))
+        _, assigned_port = probe.getsockname()
+        return assigned_port
+    finally:
+        probe.close()
+def make_process_tag() -> str:
+    """Return a fresh tag of the form ``agent:<32 hex chars>`` built from a random UUID."""
+    from uuid import uuid4
+    return "agent:" + uuid4().hex
+def ensure_process_tag() -> str:
+    """
+    Return the process tag stored on the context, creating it on first use.
+    The tag is generated with ``make_process_tag()`` only while
+    ``ctx.process_tag`` is None; later calls return the stored value.
+    Returns:
+        The process tag string
+    """
+    from ..context import get_context
+    ctx = get_context()
+    if ctx.process_tag is not None:
+        return ctx.process_tag
+    ctx.process_tag = make_process_tag()
+    return ctx.process_tag
+def _read_json(path: str) -> Optional[dict]:
+    """Parse the JSON file at ``path``; return None if it cannot be opened or decoded."""
+    try:
+        with open(path, "r") as fh:
+            raw = fh.read()
+        return json.loads(raw)
+    except Exception:
+        return None
+def rendezvous_path(config: dict) -> str:
+    """Return the rendezvous file path in the system temp dir, named after ``profile_key(config)``."""
+    tmp_dir = tempfile.gettempdir()
+    filename = f"mcp_chrome_rendezvous_{profile_key(config)}.json"
+    return os.path.join(tmp_dir, filename)
+def chromedriver_log_path(config: dict) -> str:
+    """Return the chromedriver log path in the system temp dir.
+    The file name combines ``profile_key(config)`` with the current process id.
+    """
+    tmp_dir = tempfile.gettempdir()
+    filename = f"chromedriver_shared_{profile_key(config)}_{os.getpid()}.log"
+    return os.path.join(tmp_dir, filename)
+def read_rendezvous(config: dict) -> Tuple[Optional[int], Optional[int]]:
+    """
+    Look up an existing Chrome debug port and PID from the rendezvous file.
+    The entry is used only if the file exists, was modified within
+    RENDEZVOUS_TTL_SEC, holds a non-zero port and pid, the pid exists, and a
+    debugger is listening on 127.0.0.1 at that port.
+    Returns:
+        Tuple of (port, pid) or (None, None) if not found/invalid
+    """
+    from .devtools import is_debugger_listening
+    path = rendezvous_path(config)
+    nothing = (None, None)
+    try:
+        if not os.path.exists(path):
+            return nothing
+        age = time.time() - os.path.getmtime(path)
+        if age > RENDEZVOUS_TTL_SEC:
+            return nothing
+        record = _read_json(path) or {}
+        port = int(record.get("port", 0)) or None
+        pid = int(record.get("pid", 0)) or None
+        # Checks run in order: values present, process alive, debugger reachable.
+        alive = (
+            bool(port and pid)
+            and psutil.pid_exists(pid)
+            and is_debugger_listening("127.0.0.1", port)
+        )
+        return (port, pid) if alive else nothing
+    except Exception:
+        return nothing
+def write_rendezvous(config: dict, port: int, pid: int) -> None:
+    """
+    Write the rendezvous file with Chrome debug port and PID (best effort).
+    The payload is ``{"port", "pid", "ts"}`` with ``ts`` set to the current
+    time. It is written to a staging file and moved over the final path with
+    ``os.replace``. Failures are swallowed; the staging file is removed so
+    nothing is left behind.
+    Args:
+        config: settings dict used to derive the rendezvous path.
+        port: Chrome debug port to record.
+        pid: Chrome process id to record.
+    """
+    path = rendezvous_path(config)
+    # Per-process staging name so concurrent writers for the same profile do
+    # not overwrite each other's half-written file
+    tmp = f"{path}.{os.getpid()}.tmp"
+    data = {"port": port, "pid": pid, "ts": time.time()}
+    try:
+        with open(tmp, "w") as f:
+            json.dump(data, f)
+        os.replace(tmp, path)
+    except Exception:
+        # Writing is optional; just make sure the staging file does not linger
+        try:
+            os.remove(tmp)
+        except OSError:
+            pass
+def clear_rendezvous(config: dict) -> None:
+    """Delete the rendezvous file for this profile, ignoring any error (e.g. file absent)."""
+    try:
+        stale = rendezvous_path(config)
+        os.remove(stale)
+    except Exception:
+        pass
+# Names exported by `from ... import *`. `ensure_process_tag` is a public
+# function defined in this module, so it is listed alongside the others.
+__all__ = [
+    '_is_port_open',
+    'get_free_port',
+    'make_process_tag',
+    'ensure_process_tag',
+    '_read_json',
+    'read_rendezvous',
+    'write_rendezvous',
+    'clear_rendezvous',
+    'rendezvous_path',
+    'chromedriver_log_path',
+]