PyPI - sentienceapi - Versions diffs - 0.92.2__py3-none-any.whl → 0.98.0__py3-none-any.whl - Mend

sentienceapi 0.92.2__py3-none-any.whl → 0.98.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of sentienceapi might be problematic. Click here for more details.

Files changed (64) hide show

sentience/__init__.py +107 -2
sentience/_extension_loader.py +156 -1
sentience/action_executor.py +2 -0
sentience/actions.py +354 -9
sentience/agent.py +4 -0
sentience/agent_runtime.py +840 -0
sentience/asserts/__init__.py +70 -0
sentience/asserts/expect.py +621 -0
sentience/asserts/query.py +383 -0
sentience/async_api.py +8 -1
sentience/backends/__init__.py +137 -0
sentience/backends/actions.py +372 -0
sentience/backends/browser_use_adapter.py +241 -0
sentience/backends/cdp_backend.py +393 -0
sentience/backends/exceptions.py +211 -0
sentience/backends/playwright_backend.py +194 -0
sentience/backends/protocol.py +216 -0
sentience/backends/sentience_context.py +469 -0
sentience/backends/snapshot.py +483 -0
sentience/browser.py +230 -74
sentience/canonicalization.py +207 -0
sentience/cloud_tracing.py +65 -24
sentience/constants.py +6 -0
sentience/cursor_policy.py +142 -0
sentience/extension/content.js +35 -0
sentience/extension/injected_api.js +310 -15
sentience/extension/manifest.json +1 -1
sentience/extension/pkg/sentience_core.d.ts +22 -22
sentience/extension/pkg/sentience_core.js +192 -144
sentience/extension/pkg/sentience_core_bg.wasm +0 -0
sentience/extension/release.json +29 -29
sentience/failure_artifacts.py +241 -0
sentience/integrations/__init__.py +6 -0
sentience/integrations/langchain/__init__.py +12 -0
sentience/integrations/langchain/context.py +18 -0
sentience/integrations/langchain/core.py +326 -0
sentience/integrations/langchain/tools.py +180 -0
sentience/integrations/models.py +46 -0
sentience/integrations/pydanticai/__init__.py +15 -0
sentience/integrations/pydanticai/deps.py +20 -0
sentience/integrations/pydanticai/toolset.py +468 -0
sentience/llm_provider.py +695 -18
sentience/models.py +536 -3
sentience/ordinal.py +280 -0
sentience/query.py +66 -4
sentience/schemas/trace_v1.json +27 -1
sentience/snapshot.py +384 -93
sentience/snapshot_diff.py +39 -54
sentience/text_search.py +1 -0
sentience/trace_event_builder.py +20 -1
sentience/trace_indexing/indexer.py +3 -49
sentience/tracer_factory.py +1 -3
sentience/verification.py +618 -0
sentience/visual_agent.py +3 -1
{sentienceapi-0.92.2.dist-info → sentienceapi-0.98.0.dist-info}/METADATA +198 -40
sentienceapi-0.98.0.dist-info/RECORD +92 -0
sentience/utils.py +0 -296
sentienceapi-0.92.2.dist-info/RECORD +0 -65
{sentienceapi-0.92.2.dist-info → sentienceapi-0.98.0.dist-info}/WHEEL +0 -0
{sentienceapi-0.92.2.dist-info → sentienceapi-0.98.0.dist-info}/entry_points.txt +0 -0
{sentienceapi-0.92.2.dist-info → sentienceapi-0.98.0.dist-info}/licenses/LICENSE +0 -0
{sentienceapi-0.92.2.dist-info → sentienceapi-0.98.0.dist-info}/licenses/LICENSE-APACHE +0 -0
{sentienceapi-0.92.2.dist-info → sentienceapi-0.98.0.dist-info}/licenses/LICENSE-MIT +0 -0
{sentienceapi-0.92.2.dist-info → sentienceapi-0.98.0.dist-info}/top_level.txt +0 -0

sentience/backends/cdp_backend.py ADDED Viewed

@@ -0,0 +1,393 @@
+"""
+CDP Backend implementation for browser-use integration.
+This module provides CDPBackendV0, which implements BrowserBackend protocol
+using Chrome DevTools Protocol (CDP) commands.
+Usage with browser-use:
+    from browser_use import BrowserSession
+    from sentience.backends import CDPBackendV0
+    from sentience.backends.browser_use_adapter import BrowserUseAdapter
+    session = BrowserSession(...)
+    await session.start()
+    adapter = BrowserUseAdapter(session)
+    backend = await adapter.create_backend()
+    # Now use backend for Sentience operations
+    viewport = await backend.refresh_page_info()
+    await backend.mouse_click(100, 200)
+"""
+import asyncio
+import base64
+import time
+from typing import Any, Literal, Protocol, runtime_checkable
+from .protocol import BrowserBackend, LayoutMetrics, ViewportInfo
+@runtime_checkable
+class CDPTransport(Protocol):
+    """
+    Structural interface for whatever carries CDP commands to the browser.
+    Any object exposing a compatible ``send`` coroutine satisfies it, so the
+    backend can sit on top of different CDP clients (browser-use,
+    Playwright CDP, raw WebSocket).
+    """
+    async def send(self, method: str, params: dict | None = None) -> dict:
+        """
+        Issue one CDP command and hand back its result.
+        Args:
+            method: Name of the CDP method, e.g., "Runtime.evaluate"
+            params: Parameters for the method, if it takes any
+        Returns:
+            The CDP response as a dict
+        """
+        ...
+class CDPBackendV0:
+    """
+    CDP-based implementation of BrowserBackend.
+    Each operation is issued as one or more commands through the supplied
+    transport's ``send(method, params)`` coroutine, which keeps the backend
+    compatible with browser-use's CDP client.
+    """
+    # Argument types forwarded unchanged to the page by call(); None is also
+    # forwarded unchanged, and any other type is sent as its str() form.
+    _PASSTHROUGH_TYPES = (bool, int, float, str, dict, list)
+    def __init__(self, transport: CDPTransport) -> None:
+        """
+        Initialize CDP backend.
+        Args:
+            transport: CDP transport for sending commands
+        """
+        self._transport = transport
+        # Filled in by refresh_page_info(); wheel() reads it for a default position.
+        self._cached_viewport: ViewportInfo | None = None
+        # Filled in lazily by _get_execution_context().
+        self._execution_context_id: int | None = None
+    @classmethod
+    def _coerce_argument(cls, arg: Any) -> Any:
+        """Return arg unchanged if it is None or a passthrough type, else str(arg)."""
+        if arg is None or isinstance(arg, cls._PASSTHROUGH_TYPES):
+            return arg
+        return str(arg)
+    @staticmethod
+    def _unwrap_remote_result(response: dict, failure_prefix: str) -> Any:
+        """
+        Turn a Runtime.evaluate / Runtime.callFunctionOn response into a value.
+        Args:
+            response: Raw CDP response dict
+            failure_prefix: Leading text of the RuntimeError message
+        Returns:
+            The "value" of the returned remote object, or None when the response
+            has no "result" entry or the remote object's type is "undefined"
+        Raises:
+            RuntimeError: If the response carries "exceptionDetails"
+        """
+        if "exceptionDetails" in response:
+            details = response["exceptionDetails"]
+            text = details.get("text", "Unknown error")
+            # The "text" field alone is often generic; when CDP also reports the
+            # thrown object, its description carries the actual message.
+            description = (details.get("exception") or {}).get("description")
+            if description:
+                text = f"{text}: {description}"
+            raise RuntimeError(f"{failure_prefix}: {text}")
+        remote = response.get("result")
+        if remote is None or remote.get("type") == "undefined":
+            return None
+        return remote.get("value")
+    async def _dispatch_mouse(self, event_type: str, x: float, y: float, **extra: Any) -> None:
+        """Send one Input.dispatchMouseEvent of the given type at (x, y)."""
+        await self._transport.send(
+            "Input.dispatchMouseEvent",
+            {"type": event_type, "x": x, "y": y, **extra},
+        )
+    async def _get_execution_context(self) -> int:
+        """
+        Return the cached execution context ID, resolving it on first use.
+        Returns:
+            The "executionContextId" found in a Runtime.evaluate response, or 1
+            when the response has no such key
+        """
+        if self._execution_context_id is not None:
+            return self._execution_context_id
+        # Best effort: enabling the Runtime domain may fail if it is already
+        # enabled, and that must not prevent the lookup below.
+        try:
+            await self._transport.send("Runtime.enable")
+        except Exception:
+            pass
+        result = await self._transport.send(
+            "Runtime.evaluate",
+            {
+                "expression": "1",
+                "returnByValue": True,
+            },
+        )
+        # Fall back to context ID 1 when the response does not name a context.
+        self._execution_context_id = result.get("executionContextId", 1)
+        return self._execution_context_id
+    async def refresh_page_info(self) -> ViewportInfo:
+        """
+        Read viewport size, scroll offsets and content size from the page.
+        Returns:
+            The freshly built ViewportInfo, which is also cached on the backend
+        """
+        result = await self.eval(
+            """(() => ({
+                width: window.innerWidth,
+                height: window.innerHeight,
+                scroll_x: window.scrollX,
+                scroll_y: window.scrollY,
+                content_width: document.documentElement.scrollWidth,
+                content_height: document.documentElement.scrollHeight
+            }))()"""
+        )
+        self._cached_viewport = ViewportInfo(
+            width=result.get("width", 0),
+            height=result.get("height", 0),
+            scroll_x=result.get("scroll_x", 0),
+            scroll_y=result.get("scroll_y", 0),
+            content_width=result.get("content_width"),
+            content_height=result.get("content_height"),
+        )
+        return self._cached_viewport
+    async def eval(self, expression: str) -> Any:
+        """
+        Evaluate a JavaScript expression using Runtime.evaluate.
+        Args:
+            expression: JavaScript source to evaluate; promises are awaited
+        Returns:
+            The expression's value, or None if it is undefined
+        Raises:
+            RuntimeError: If the evaluation throws in the page
+        """
+        response = await self._transport.send(
+            "Runtime.evaluate",
+            {
+                "expression": expression,
+                "returnByValue": True,
+                "awaitPromise": True,
+            },
+        )
+        return self._unwrap_remote_result(response, "JavaScript evaluation failed")
+    async def call(
+        self,
+        function_declaration: str,
+        args: list[Any] | None = None,
+    ) -> Any:
+        """
+        Call a JavaScript function using Runtime.callFunctionOn.
+        The function is invoked with globalThis as its target object. If no
+        object ID for globalThis can be obtained, the call is rendered as a
+        single expression and evaluated through eval() instead.
+        Args:
+            function_declaration: JavaScript source of the function to call
+            args: Positional arguments; None and bool/int/float/str/dict/list
+                values are sent as-is, anything else as its str() form
+        Returns:
+            The function's return value, or None if it is undefined
+        Raises:
+            RuntimeError: If the call throws in the page
+        """
+        import json
+        values = [self._coerce_argument(arg) for arg in args or []]
+        # Runtime.callFunctionOn needs a target object; use globalThis (window).
+        global_result = await self._transport.send(
+            "Runtime.evaluate",
+            {
+                "expression": "globalThis",
+                "returnByValue": False,
+            },
+        )
+        object_id = global_result.get("result", {}).get("objectId")
+        if not object_id:
+            # Fallback: evaluate the call as an expression. Arguments are
+            # rendered with json.dumps so that None/True/False become
+            # null/true/false and strings are escaped as JavaScript literals;
+            # Python repr()/str() would emit source such as "None" or "True".
+            rendered = ", ".join(json.dumps(value, default=str) for value in values)
+            return await self.eval(f"({function_declaration})({rendered})")
+        response = await self._transport.send(
+            "Runtime.callFunctionOn",
+            {
+                "functionDeclaration": function_declaration,
+                "objectId": object_id,
+                "arguments": [{"value": value} for value in values],
+                "returnByValue": True,
+                "awaitPromise": True,
+            },
+        )
+        return self._unwrap_remote_result(response, "JavaScript call failed")
+    async def get_layout_metrics(self) -> LayoutMetrics:
+        """
+        Get page layout metrics using Page.getLayoutMetrics.
+        Returns:
+            LayoutMetrics built from the response's visualViewport,
+            layoutViewport and contentSize entries; missing values default to 0
+            (1.0 for the scale factor)
+        """
+        result = await self._transport.send("Page.getLayoutMetrics")
+        layout_viewport = result.get("layoutViewport", {})
+        content_size = result.get("contentSize", {})
+        visual_viewport = result.get("visualViewport", {})
+        return LayoutMetrics(
+            viewport_x=visual_viewport.get("pageX", 0),
+            viewport_y=visual_viewport.get("pageY", 0),
+            # Prefer the visual viewport's size, then the layout viewport's.
+            viewport_width=visual_viewport.get(
+                "clientWidth", layout_viewport.get("clientWidth", 0)
+            ),
+            viewport_height=visual_viewport.get(
+                "clientHeight", layout_viewport.get("clientHeight", 0)
+            ),
+            content_width=content_size.get("width", 0),
+            content_height=content_size.get("height", 0),
+            device_scale_factor=visual_viewport.get("scale", 1.0),
+        )
+    async def screenshot_png(self) -> bytes:
+        """
+        Capture viewport screenshot as PNG bytes.
+        Returns:
+            The base64-decoded "data" field of the Page.captureScreenshot
+            response (empty bytes if the field is absent)
+        """
+        result = await self._transport.send(
+            "Page.captureScreenshot",
+            {
+                "format": "png",
+                "captureBeyondViewport": False,
+            },
+        )
+        return base64.b64decode(result.get("data", ""))
+    async def mouse_move(self, x: float, y: float) -> None:
+        """Move mouse to viewport coordinates."""
+        await self._dispatch_mouse("mouseMoved", x, y)
+    async def mouse_click(
+        self,
+        x: float,
+        y: float,
+        button: Literal["left", "right", "middle"] = "left",
+        click_count: int = 1,
+    ) -> None:
+        """
+        Click at viewport coordinates.
+        Args:
+            x: Horizontal position of the click
+            y: Vertical position of the click
+            button: Mouse button to press and release
+            click_count: Value sent as "clickCount" on both events
+        """
+        await self._dispatch_mouse(
+            "mousePressed", x, y, button=button, clickCount=click_count
+        )
+        # Small delay between press and release
+        await asyncio.sleep(0.05)
+        await self._dispatch_mouse(
+            "mouseReleased", x, y, button=button, clickCount=click_count
+        )
+    async def wheel(
+        self,
+        delta_y: float,
+        x: float | None = None,
+        y: float | None = None,
+    ) -> None:
+        """
+        Scroll using mouse wheel.
+        Args:
+            delta_y: Vertical wheel delta; the horizontal delta is always 0
+            x: Horizontal position of the event; defaults to the viewport centre
+            y: Vertical position of the event; defaults to the viewport centre
+        """
+        if x is None or y is None:
+            # Missing coordinates default to the centre of the cached viewport,
+            # which is fetched first if nothing has been cached yet.
+            if self._cached_viewport is None:
+                await self.refresh_page_info()
+            assert self._cached_viewport is not None
+            x = x if x is not None else self._cached_viewport.width / 2
+            y = y if y is not None else self._cached_viewport.height / 2
+        await self._dispatch_mouse("mouseWheel", x, y, deltaX=0, deltaY=delta_y)
+    async def type_text(self, text: str) -> None:
+        """
+        Type text using keyboard input.
+        For every character a keyDown, a char and a keyUp event are dispatched,
+        each carrying the character as "text".
+        Args:
+            text: Characters to type, in order
+        """
+        # NOTE(review): a CDP "keyDown" event that carries "text" may already
+        # insert the character, in which case the extra "char" event would
+        # insert it a second time - confirm against a real text input.
+        for char in text:
+            for event_type in ("keyDown", "char", "keyUp"):
+                await self._transport.send(
+                    "Input.dispatchKeyEvent",
+                    {
+                        "type": event_type,
+                        "text": char,
+                    },
+                )
+            # Small delay between characters
+            await asyncio.sleep(0.01)
+    async def wait_ready_state(
+        self,
+        state: Literal["interactive", "complete"] = "interactive",
+        timeout_ms: int = 15000,
+    ) -> None:
+        """
+        Wait for document.readyState using polling.
+        Args:
+            state: Minimum state to wait for; "interactive" is also satisfied
+                by "complete"
+            timeout_ms: Maximum time to wait, in milliseconds
+        Raises:
+            TimeoutError: If the state is not reached within timeout_ms
+        """
+        start = time.monotonic()
+        timeout_sec = timeout_ms / 1000.0
+        acceptable_states = {"complete"} if state == "complete" else {"interactive", "complete"}
+        while True:
+            # The deadline is checked before each poll.
+            if time.monotonic() - start >= timeout_sec:
+                raise TimeoutError(
+                    f"Timed out waiting for document.readyState='{state}' after {timeout_ms}ms"
+                )
+            current_state = await self.eval("document.readyState")
+            if current_state in acceptable_states:
+                return
+            # Poll every 100ms
+            await asyncio.sleep(0.1)
+    async def get_url(self) -> str:
+        """
+        Get current page URL.
+        Returns:
+            window.location.href, or "" when the evaluation yields a falsy value
+        """
+        result = await self.eval("window.location.href")
+        return result or ""

sentience/backends/exceptions.py ADDED Viewed

@@ -0,0 +1,211 @@
+"""
+Custom exceptions for Sentience backends.
+These exceptions provide clear, actionable error messages when things go wrong
+during browser-use integration or backend operations.
+"""
+from dataclasses import dataclass
+from typing import Any
+class SentienceBackendError(Exception):
+    """Common base class for the errors raised by Sentience backends."""
+@dataclass
+class ExtensionDiagnostics:
+    """State gathered about the extension after it failed to load."""
+    # Reported as "window.sentience defined" in timeout error messages.
+    sentience_defined: bool = False
+    # Reported as "window.sentience.snapshot available" in timeout error messages.
+    sentience_snapshot: bool = False
+    # Reported as "Page URL" in timeout error messages.
+    url: str = ""
+    # Error text, if any; None when no error was recorded.
+    error: str | None = None
+    @classmethod
+    def from_dict(cls, data: dict[str, Any]) -> "ExtensionDiagnostics":
+        """Build an instance from a diagnostic dict; absent keys fall back to the field defaults."""
+        defined = data.get("sentience_defined", False)
+        has_snapshot = data.get("sentience_snapshot", False)
+        page_url = data.get("url", "")
+        failure = data.get("error")
+        return cls(defined, has_snapshot, page_url, failure)
+    def to_dict(self) -> dict[str, Any]:
+        """Return the four fields as a plain dict, keyed by field name."""
+        field_names = ("sentience_defined", "sentience_snapshot", "url", "error")
+        return {name: getattr(self, name) for name in field_names}
+class ExtensionNotLoadedError(SentienceBackendError):
+    """
+    Signals that the Sentience extension is not loaded in the browser.
+    Typical causes:
+    1. The browser was started without the --load-extension flag
+    2. The extension path is wrong
+    3. The extension failed to initialize
+    Example fix for browser-use:
+        from sentience import get_extension_dir
+        from browser_use import BrowserSession, BrowserProfile
+        profile = BrowserProfile(
+            args=[f"--load-extension={get_extension_dir()}"],
+        )
+        session = BrowserSession(browser_profile=profile)
+    Attributes:
+        timeout_ms: Timeout value supplied by the caller, if any
+        diagnostics: ExtensionDiagnostics supplied by the caller, if any
+    """
+    def __init__(
+        self,
+        message: str,
+        timeout_ms: int | None = None,
+        diagnostics: ExtensionDiagnostics | None = None,
+    ) -> None:
+        super().__init__(message)
+        self.timeout_ms = timeout_ms
+        self.diagnostics = diagnostics
+    @classmethod
+    def from_timeout(
+        cls,
+        timeout_ms: int,
+        diagnostics: ExtensionDiagnostics | None = None,
+    ) -> "ExtensionNotLoadedError":
+        """
+        Build the error for a timed-out wait on the extension.
+        Args:
+            timeout_ms: How long the wait lasted, in milliseconds
+            diagnostics: Optional diagnostics to embed in the message
+        Returns:
+            An error whose message includes the diagnostics (the recorded error
+            if there is one, otherwise the individual flags and page URL)
+            followed by launch instructions
+        """
+        if not diagnostics:
+            details = ""
+        elif diagnostics.error:
+            details = f"\n  Error: {diagnostics.error}"
+        else:
+            details = "".join(
+                [
+                    f"\n  window.sentience defined: {diagnostics.sentience_defined}",
+                    f"\n  window.sentience.snapshot available: {diagnostics.sentience_snapshot}",
+                    f"\n  Page URL: {diagnostics.url}",
+                ]
+            )
+        parts = [
+            f"Sentience extension not loaded after {timeout_ms}ms.{details}\n\n",
+            "To fix this, ensure the extension is loaded when launching the browser:\n\n",
+            "  from sentience import get_extension_dir\n",
+            "  from browser_use import BrowserSession, BrowserProfile\n\n",
+            "  profile = BrowserProfile(\n",
+            '      args=[f"--load-extension={get_extension_dir()}"],\n',
+            "  )\n",
+            "  session = BrowserSession(browser_profile=profile)\n",
+        ]
+        return cls("".join(parts), timeout_ms=timeout_ms, diagnostics=diagnostics)
+class ExtensionInjectionError(SentienceBackendError):
+    """
+    Signals that the window.sentience API is missing from the page.
+    Possible reasons:
+    1. The page finished loading before the extension could inject
+    2. A Content Security Policy on the page blocks the extension
+    3. The extension crashed or was disabled
+    Call snapshot() with a longer timeout or wait for page load.
+    Attributes:
+        url: URL of the affected page, if known
+    """
+    def __init__(
+        self,
+        message: str,
+        url: str | None = None,
+    ) -> None:
+        super().__init__(message)
+        self.url = url
+    @classmethod
+    def from_page(cls, url: str) -> "ExtensionInjectionError":
+        """Build the error for the page at url, listing likely causes and a retry hint."""
+        lines = [
+            f"window.sentience API not available on page: {url}\n\n",
+            "Possible causes:\n",
+            "  1. Page loaded before extension could inject (try increasing timeout)\n",
+            "  2. Page has Content Security Policy blocking the extension\n",
+            "  3. Extension was disabled or crashed\n\n",
+            "Try:\n",
+            "  snap = await snapshot(backend, options=SnapshotOptions(timeout_ms=10000))",
+        ]
+        return cls("".join(lines), url=url)
+class BackendEvalError(SentienceBackendError):
+    """
+    Signals that evaluating JavaScript in the browser failed.
+    Wraps the underlying CDP or Playwright error with extra context.
+    Attributes:
+        expression: The expression passed by the caller, if any
+        original_error: The underlying exception passed by the caller, if any
+    """
+    def __init__(
+        self,
+        message: str,
+        expression: str | None = None,
+        original_error: Exception | None = None,
+    ) -> None:
+        super().__init__(message)
+        self.expression, self.original_error = expression, original_error
+class SnapshotError(SentienceBackendError):
+    """
+    Signals that taking a snapshot failed.
+    Possible reasons:
+    1. The extension returned null or invalid data
+    2. The page is in an invalid state
+    3. The extension threw an error
+    Attributes:
+        url: URL of the affected page, if known
+        raw_result: The raw value passed by the caller, if any
+    """
+    def __init__(
+        self,
+        message: str,
+        url: str | None = None,
+        raw_result: Any = None,
+    ) -> None:
+        super().__init__(message)
+        self.url = url
+        self.raw_result = raw_result
+    @classmethod
+    def from_null_result(cls, url: str | None = None) -> "SnapshotError":
+        """Build the error for a snapshot call that returned null; a truthy url is appended to the message."""
+        explanation = "".join(
+            [
+                "window.sentience.snapshot() returned null.\n\n",
+                "Possible causes:\n",
+                "  1. Extension is not properly initialized\n",
+                "  2. Page DOM is in an invalid state\n",
+                "  3. Extension encountered an internal error\n\n",
+                "Try refreshing the page and taking a new snapshot.",
+            ]
+        )
+        location = f"\n  Page URL: {url}" if url else ""
+        return cls(explanation + location, url=url, raw_result=None)
+class ActionError(SentienceBackendError):
+    """
+    Signals that a browser action (click, type, scroll) failed.
+    The exception message has the form "<action> failed: <message>".
+    Attributes:
+        action: Name of the action that failed
+        coordinates: (x, y) pair passed by the caller, if any
+        original_error: The underlying exception passed by the caller, if any
+    """
+    def __init__(
+        self,
+        action: str,
+        message: str,
+        coordinates: tuple[float, float] | None = None,
+        original_error: Exception | None = None,
+    ) -> None:
+        super().__init__(f"{action} failed: {message}")
+        self.action = action
+        self.coordinates = coordinates
+        self.original_error = original_error

sentienceapi 0.92.2__py3-none-any.whl → 0.98.0__py3-none-any.whl

Potentially problematic release.

sentienceapi 0.92.2__py3-none-any.whl → 0.98.0__py3-none-any.whl