PyPI - sentienceapi - Versions diffs - 0.95.0__py3-none-any.whl - Mend

sentienceapi 0.95.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of sentienceapi might be problematic. Click here for more details.

Files changed (82)

sentience/__init__.py +253 -0
sentience/_extension_loader.py +195 -0
sentience/action_executor.py +215 -0
sentience/actions.py +1020 -0
sentience/agent.py +1181 -0
sentience/agent_config.py +46 -0
sentience/agent_runtime.py +424 -0
sentience/asserts/__init__.py +70 -0
sentience/asserts/expect.py +621 -0
sentience/asserts/query.py +383 -0
sentience/async_api.py +108 -0
sentience/backends/__init__.py +137 -0
sentience/backends/actions.py +343 -0
sentience/backends/browser_use_adapter.py +241 -0
sentience/backends/cdp_backend.py +393 -0
sentience/backends/exceptions.py +211 -0
sentience/backends/playwright_backend.py +194 -0
sentience/backends/protocol.py +216 -0
sentience/backends/sentience_context.py +469 -0
sentience/backends/snapshot.py +427 -0
sentience/base_agent.py +196 -0
sentience/browser.py +1215 -0
sentience/browser_evaluator.py +299 -0
sentience/canonicalization.py +207 -0
sentience/cli.py +130 -0
sentience/cloud_tracing.py +807 -0
sentience/constants.py +6 -0
sentience/conversational_agent.py +543 -0
sentience/element_filter.py +136 -0
sentience/expect.py +188 -0
sentience/extension/background.js +104 -0
sentience/extension/content.js +161 -0
sentience/extension/injected_api.js +914 -0
sentience/extension/manifest.json +36 -0
sentience/extension/pkg/sentience_core.d.ts +51 -0
sentience/extension/pkg/sentience_core.js +323 -0
sentience/extension/pkg/sentience_core_bg.wasm +0 -0
sentience/extension/pkg/sentience_core_bg.wasm.d.ts +10 -0
sentience/extension/release.json +115 -0
sentience/formatting.py +15 -0
sentience/generator.py +202 -0
sentience/inspector.py +367 -0
sentience/llm_interaction_handler.py +191 -0
sentience/llm_provider.py +875 -0
sentience/llm_provider_utils.py +120 -0
sentience/llm_response_builder.py +153 -0
sentience/models.py +846 -0
sentience/ordinal.py +280 -0
sentience/overlay.py +222 -0
sentience/protocols.py +228 -0
sentience/query.py +303 -0
sentience/read.py +188 -0
sentience/recorder.py +589 -0
sentience/schemas/trace_v1.json +335 -0
sentience/screenshot.py +100 -0
sentience/sentience_methods.py +86 -0
sentience/snapshot.py +706 -0
sentience/snapshot_diff.py +126 -0
sentience/text_search.py +262 -0
sentience/trace_event_builder.py +148 -0
sentience/trace_file_manager.py +197 -0
sentience/trace_indexing/__init__.py +27 -0
sentience/trace_indexing/index_schema.py +199 -0
sentience/trace_indexing/indexer.py +414 -0
sentience/tracer_factory.py +322 -0
sentience/tracing.py +449 -0
sentience/utils/__init__.py +40 -0
sentience/utils/browser.py +46 -0
sentience/utils/element.py +257 -0
sentience/utils/formatting.py +59 -0
sentience/utils.py +296 -0
sentience/verification.py +380 -0
sentience/visual_agent.py +2058 -0
sentience/wait.py +139 -0
sentienceapi-0.95.0.dist-info/METADATA +984 -0
sentienceapi-0.95.0.dist-info/RECORD +82 -0
sentienceapi-0.95.0.dist-info/WHEEL +5 -0
sentienceapi-0.95.0.dist-info/entry_points.txt +2 -0
sentienceapi-0.95.0.dist-info/licenses/LICENSE +24 -0
sentienceapi-0.95.0.dist-info/licenses/LICENSE-APACHE +201 -0
sentienceapi-0.95.0.dist-info/licenses/LICENSE-MIT +21 -0
sentienceapi-0.95.0.dist-info/top_level.txt +1 -0

sentience/backends/actions.py ADDED Viewed

@@ -0,0 +1,343 @@
+"""
+Backend-agnostic actions for browser-use integration.
+These actions work with any BrowserBackend implementation,
+enabling Sentience grounding with browser-use or other frameworks.
+Usage with browser-use:
+    from sentience.backends import BrowserUseAdapter
+    from sentience.backends.actions import click, type_text, scroll
+    adapter = BrowserUseAdapter(session)
+    backend = await adapter.create_backend()
+    # Take snapshot and click element
+    snap = await snapshot_from_backend(backend)
+    element = find(snap, 'role=button[name="Submit"]')
+    await click(backend, element.bbox)
+"""
+import asyncio
+import time
+from typing import TYPE_CHECKING, Any, Literal
+from ..models import ActionResult, BBox, Snapshot
+if TYPE_CHECKING:
+    from .protocol import BrowserBackend
+async def click(
+    backend: "BrowserBackend",
+    target: BBox | dict[str, float] | tuple[float, float],
+    button: Literal["left", "right", "middle"] = "left",
+    click_count: int = 1,
+    move_first: bool = True,
+) -> ActionResult:
+    """
+    Click at coordinates using the backend.
+    Args:
+        backend: BrowserBackend implementation
+        target: Click target - BBox (clicks center), dict with x/y, or (x, y) tuple
+        button: Mouse button to click
+        click_count: Number of clicks (1=single, 2=double)
+        move_first: Whether to move mouse to position before clicking
+    Returns:
+        ActionResult with success status
+    Example:
+        # Click at coordinates
+        await click(backend, (100, 200))
+        # Click element bbox center
+        await click(backend, element.bbox)
+        # Double-click
+        await click(backend, element.bbox, click_count=2)
+    """
+    start_time = time.time()
+    # Resolve coordinates
+    x, y = _resolve_coordinates(target)
+    try:
+        # Optional mouse move for hover effects
+        if move_first:
+            await backend.mouse_move(x, y)
+            await asyncio.sleep(0.02)  # Brief pause for hover
+        # Perform click
+        await backend.mouse_click(x, y, button=button, click_count=click_count)
+        duration_ms = int((time.time() - start_time) * 1000)
+        return ActionResult(
+            success=True,
+            duration_ms=duration_ms,
+            outcome="dom_updated",
+        )
+    except Exception as e:
+        duration_ms = int((time.time() - start_time) * 1000)
+        return ActionResult(
+            success=False,
+            duration_ms=duration_ms,
+            outcome="error",
+            error={"code": "click_failed", "reason": str(e)},
+        )
+async def type_text(
+    backend: "BrowserBackend",
+    text: str,
+    target: BBox | dict[str, float] | tuple[float, float] | None = None,
+    clear_first: bool = False,
+) -> ActionResult:
+    """
+    Type text, optionally clicking a target first.
+    Args:
+        backend: BrowserBackend implementation
+        text: Text to type
+        target: Optional click target before typing (BBox, dict, or tuple)
+        clear_first: If True, select all and delete before typing
+    Returns:
+        ActionResult with success status
+    Example:
+        # Type into focused element
+        await type_text(backend, "Hello World")
+        # Click input then type
+        await type_text(backend, "search query", target=search_box.bbox)
+        # Clear and type
+        await type_text(backend, "new value", target=input.bbox, clear_first=True)
+    """
+    start_time = time.time()
+    try:
+        # Click target if provided
+        if target is not None:
+            x, y = _resolve_coordinates(target)
+            await backend.mouse_click(x, y)
+            await asyncio.sleep(0.05)  # Wait for focus
+        # Clear existing content if requested
+        if clear_first:
+            # Select all (Ctrl+A / Cmd+A) and delete
+            await backend.eval("document.execCommand('selectAll')")
+            await asyncio.sleep(0.02)
+        # Type the text
+        await backend.type_text(text)
+        duration_ms = int((time.time() - start_time) * 1000)
+        return ActionResult(
+            success=True,
+            duration_ms=duration_ms,
+            outcome="dom_updated",
+        )
+    except Exception as e:
+        duration_ms = int((time.time() - start_time) * 1000)
+        return ActionResult(
+            success=False,
+            duration_ms=duration_ms,
+            outcome="error",
+            error={"code": "type_failed", "reason": str(e)},
+        )
+async def scroll(
+    backend: "BrowserBackend",
+    delta_y: float = 300,
+    target: BBox | dict[str, float] | tuple[float, float] | None = None,
+) -> ActionResult:
+    """
+    Scroll the page or element.
+    Args:
+        backend: BrowserBackend implementation
+        delta_y: Scroll amount (positive=down, negative=up)
+        target: Optional position for scroll (defaults to viewport center)
+    Returns:
+        ActionResult with success status
+    Example:
+        # Scroll down 300px
+        await scroll(backend, 300)
+        # Scroll up 500px
+        await scroll(backend, -500)
+        # Scroll at specific position
+        await scroll(backend, 200, target=(500, 300))
+    """
+    start_time = time.time()
+    try:
+        x: float | None = None
+        y: float | None = None
+        if target is not None:
+            x, y = _resolve_coordinates(target)
+        await backend.wheel(delta_y=delta_y, x=x, y=y)
+        # Wait for scroll to settle
+        await asyncio.sleep(0.1)
+        duration_ms = int((time.time() - start_time) * 1000)
+        return ActionResult(
+            success=True,
+            duration_ms=duration_ms,
+            outcome="dom_updated",
+        )
+    except Exception as e:
+        duration_ms = int((time.time() - start_time) * 1000)
+        return ActionResult(
+            success=False,
+            duration_ms=duration_ms,
+            outcome="error",
+            error={"code": "scroll_failed", "reason": str(e)},
+        )
+async def scroll_to_element(
+    backend: "BrowserBackend",
+    element_id: int,
+    behavior: Literal["smooth", "instant", "auto"] = "instant",
+    block: Literal["start", "center", "end", "nearest"] = "center",
+) -> ActionResult:
+    """
+    Scroll element into view using JavaScript scrollIntoView.
+    Args:
+        backend: BrowserBackend implementation
+        element_id: Element ID from snapshot (requires sentience_registry)
+        behavior: Scroll behavior
+        block: Vertical alignment
+    Returns:
+        ActionResult with success status
+    """
+    start_time = time.time()
+    try:
+        scrolled = await backend.eval(
+            f"""
+            (() => {{
+                const el = window.sentience_registry && window.sentience_registry[{element_id}];
+                if (el && el.scrollIntoView) {{
+                    el.scrollIntoView({{
+                        behavior: '{behavior}',
+                        block: '{block}',
+                        inline: 'nearest'
+                    }});
+                    return true;
+                }}
+                return false;
+            }})()
+        """
+        )
+        # Wait for scroll animation
+        wait_time = 0.3 if behavior == "smooth" else 0.05
+        await asyncio.sleep(wait_time)
+        duration_ms = int((time.time() - start_time) * 1000)
+        if scrolled:
+            return ActionResult(
+                success=True,
+                duration_ms=duration_ms,
+                outcome="dom_updated",
+            )
+        else:
+            return ActionResult(
+                success=False,
+                duration_ms=duration_ms,
+                outcome="error",
+                error={"code": "scroll_failed", "reason": "Element not found in registry"},
+            )
+    except Exception as e:
+        duration_ms = int((time.time() - start_time) * 1000)
+        return ActionResult(
+            success=False,
+            duration_ms=duration_ms,
+            outcome="error",
+            error={"code": "scroll_failed", "reason": str(e)},
+        )
+async def wait_for_stable(
+    backend: "BrowserBackend",
+    state: Literal["interactive", "complete"] = "complete",
+    timeout_ms: int = 10000,
+) -> ActionResult:
+    """
+    Wait for page to reach stable state.
+    Args:
+        backend: BrowserBackend implementation
+        state: Target document.readyState
+        timeout_ms: Maximum wait time
+    Returns:
+        ActionResult with success status
+    """
+    start_time = time.time()
+    try:
+        await backend.wait_ready_state(state=state, timeout_ms=timeout_ms)
+        duration_ms = int((time.time() - start_time) * 1000)
+        return ActionResult(
+            success=True,
+            duration_ms=duration_ms,
+            outcome="dom_updated",
+        )
+    except TimeoutError as e:
+        duration_ms = int((time.time() - start_time) * 1000)
+        return ActionResult(
+            success=False,
+            duration_ms=duration_ms,
+            outcome="error",
+            error={"code": "timeout", "reason": str(e)},
+        )
+    except Exception as e:
+        duration_ms = int((time.time() - start_time) * 1000)
+        return ActionResult(
+            success=False,
+            duration_ms=duration_ms,
+            outcome="error",
+            error={"code": "wait_failed", "reason": str(e)},
+        )
+def _resolve_coordinates(
+    target: BBox | dict[str, float] | tuple[float, float],
+) -> tuple[float, float]:
+    """
+    Resolve target to (x, y) coordinates.
+    - BBox: Returns center point
+    - dict: Returns x, y keys (or center if width/height present)
+    - tuple: Returns as-is
+    """
+    if isinstance(target, BBox):
+        return (target.x + target.width / 2, target.y + target.height / 2)
+    elif isinstance(target, tuple):
+        return target
+    elif isinstance(target, dict):
+        # If has width/height, compute center
+        if "width" in target and "height" in target:
+            x = target.get("x", 0) + target["width"] / 2
+            y = target.get("y", 0) + target["height"] / 2
+            return (x, y)
+        # Otherwise use x/y directly
+        return (target.get("x", 0), target.get("y", 0))
+    else:
+        raise ValueError(f"Invalid target type: {type(target)}")

sentience/backends/browser_use_adapter.py ADDED Viewed

@@ -0,0 +1,241 @@
+"""
+Browser-use adapter for Sentience SDK.
+This module provides BrowserUseAdapter which wraps browser-use's BrowserSession
+and provides a CDPBackendV0 for Sentience operations.
+Usage:
+    from browser_use import BrowserSession, BrowserProfile
+    from sentience import get_extension_dir
+    from sentience.backends import BrowserUseAdapter
+    # Create browser-use session with Sentience extension
+    profile = BrowserProfile(args=[f"--load-extension={get_extension_dir()}"])
+    session = BrowserSession(browser_profile=profile)
+    await session.start()
+    # Create Sentience adapter
+    adapter = BrowserUseAdapter(session)
+    backend = await adapter.create_backend()
+    # Use backend for Sentience operations
+    viewport = await backend.refresh_page_info()
+    await backend.mouse_click(100, 200)
+"""
+from typing import TYPE_CHECKING, Any
+from .cdp_backend import CDPBackendV0, CDPTransport
+if TYPE_CHECKING:
+    # Import browser-use types only for type checking
+    # This avoids requiring browser-use as a hard dependency
+    pass
+class BrowserUseCDPTransport(CDPTransport):
+    """
+    CDP transport implementation for browser-use.
+    Wraps browser-use's CDP client to provide the CDPTransport interface.
+    Uses cdp-use library pattern: cdp_client.send.Domain.method(params={}, session_id=)
+    """
+    def __init__(self, cdp_client: Any, session_id: str) -> None:
+        """
+        Initialize transport with browser-use CDP client.
+        Args:
+            cdp_client: browser-use's CDP client (from cdp_session.cdp_client)
+            session_id: CDP session ID (from cdp_session.session_id)
+        """
+        self._client = cdp_client
+        self._session_id = session_id
+    async def send(self, method: str, params: dict | None = None) -> dict:
+        """
+        Send CDP command using browser-use's cdp-use client.
+        Translates method name like "Runtime.evaluate" to
+        cdp_client.send.Runtime.evaluate(params={...}, session_id=...).
+        Args:
+            method: CDP method name, e.g., "Runtime.evaluate"
+            params: Method parameters
+        Returns:
+            CDP response dict
+        """
+        # Split method into domain and method name
+        # e.g., "Runtime.evaluate" -> ("Runtime", "evaluate")
+        parts = method.split(".", 1)
+        if len(parts) != 2:
+            raise ValueError(f"Invalid CDP method format: {method}")
+        domain_name, method_name = parts
+        # Get the domain object from cdp_client.send
+        domain = getattr(self._client.send, domain_name, None)
+        if domain is None:
+            raise ValueError(f"Unknown CDP domain: {domain_name}")
+        # Get the method from the domain
+        method_func = getattr(domain, method_name, None)
+        if method_func is None:
+            raise ValueError(f"Unknown CDP method: {method}")
+        # Call the method with params and session_id
+        result = await method_func(
+            params=params or {},
+            session_id=self._session_id,
+        )
+        # cdp-use returns the result directly or None
+        return result if result is not None else {}
+class BrowserUseAdapter:
+    """
+    Adapter to use Sentience with browser-use's BrowserSession.
+    This adapter:
+    1. Wraps browser-use's CDP client with BrowserUseCDPTransport
+    2. Creates CDPBackendV0 for Sentience operations
+    3. Provides access to the underlying page for extension calls
+    Example:
+        from browser_use import BrowserSession, BrowserProfile
+        from sentience import get_extension_dir, snapshot_async, SnapshotOptions
+        from sentience.backends import BrowserUseAdapter
+        # Setup browser-use with Sentience extension
+        profile = BrowserProfile(args=[f"--load-extension={get_extension_dir()}"])
+        session = BrowserSession(browser_profile=profile)
+        await session.start()
+        # Create adapter and backend
+        adapter = BrowserUseAdapter(session)
+        backend = await adapter.create_backend()
+        # Navigate (using browser-use)
+        page = await session.get_current_page()
+        await page.goto("https://example.com")
+        # Take Sentience snapshot (uses extension)
+        snap = await snapshot_async(adapter, SnapshotOptions())
+        # Use backend for precise clicking
+        await backend.mouse_click(snap.elements[0].bbox.x, snap.elements[0].bbox.y)
+    """
+    def __init__(self, session: Any) -> None:
+        """
+        Initialize adapter with browser-use BrowserSession.
+        Args:
+            session: browser-use BrowserSession instance
+        """
+        self._session = session
+        self._backend: CDPBackendV0 | None = None
+        self._transport: BrowserUseCDPTransport | None = None
+    @property
+    def page(self) -> Any:
+        """
+        Get the current Playwright page from browser-use.
+        This is needed for Sentience snapshot() which calls window.sentience.snapshot().
+        Returns:
+            Playwright Page object
+        """
+        # browser-use stores page in session
+        # Access pattern may vary by browser-use version
+        if hasattr(self._session, "page"):
+            return self._session.page
+        if hasattr(self._session, "_page"):
+            return self._session._page
+        if hasattr(self._session, "get_current_page"):
+            # This is async, but we need sync access for property
+            # Caller should use get_page_async() instead
+            raise RuntimeError("Use await adapter.get_page_async() to get the page")
+        raise RuntimeError("Could not find page in browser-use session")
+    async def get_page_async(self) -> Any:
+        """
+        Get the current Playwright page (async).
+        Returns:
+            Playwright Page object
+        """
+        if hasattr(self._session, "get_current_page"):
+            return await self._session.get_current_page()
+        return self.page
+    @property
+    def api_key(self) -> str | None:
+        """
+        API key for Sentience API (for snapshot compatibility).
+        Returns None since browser-use users pass api_key via SnapshotOptions.
+        """
+        return None
+    @property
+    def api_url(self) -> str | None:
+        """
+        API URL for Sentience API (for snapshot compatibility).
+        Returns None to use default.
+        """
+        return None
+    async def create_backend(self) -> CDPBackendV0:
+        """
+        Create CDP backend for Sentience operations.
+        This method:
+        1. Gets or creates a CDP session from browser-use
+        2. Creates BrowserUseCDPTransport to wrap the CDP client
+        3. Creates CDPBackendV0 with the transport
+        Returns:
+            CDPBackendV0 instance ready for use
+        Raises:
+            RuntimeError: If CDP session cannot be created
+        """
+        if self._backend is not None:
+            return self._backend
+        # Get CDP session from browser-use
+        # browser-use uses: cdp_session = await session.get_or_create_cdp_session()
+        if not hasattr(self._session, "get_or_create_cdp_session"):
+            raise RuntimeError(
+                "browser-use session does not have get_or_create_cdp_session method. "
+                "Make sure you're using a compatible version of browser-use."
+            )
+        cdp_session = await self._session.get_or_create_cdp_session()
+        # Extract CDP client and session ID
+        cdp_client = cdp_session.cdp_client
+        session_id = cdp_session.session_id
+        # Create transport and backend
+        self._transport = BrowserUseCDPTransport(cdp_client, session_id)
+        self._backend = CDPBackendV0(self._transport)
+        return self._backend
+    async def get_transport(self) -> BrowserUseCDPTransport:
+        """
+        Get the CDP transport (creates backend if needed).
+        Returns:
+            BrowserUseCDPTransport instance
+        """
+        if self._transport is None:
+            await self.create_backend()
+        assert self._transport is not None
+        return self._transport