PyPI - sentienceapi - Versions diffs - 0.90.16__py3-none-any.whl → 0.98.0__py3-none-any.whl - Mend

sentienceapi 0.90.16__py3-none-any.whl → 0.98.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of sentienceapi might be problematic. Click here for more details.

Files changed (90) hide show

sentience/__init__.py +120 -6
sentience/_extension_loader.py +156 -1
sentience/action_executor.py +217 -0
sentience/actions.py +758 -30
sentience/agent.py +806 -293
sentience/agent_config.py +3 -0
sentience/agent_runtime.py +840 -0
sentience/asserts/__init__.py +70 -0
sentience/asserts/expect.py +621 -0
sentience/asserts/query.py +383 -0
sentience/async_api.py +89 -1141
sentience/backends/__init__.py +137 -0
sentience/backends/actions.py +372 -0
sentience/backends/browser_use_adapter.py +241 -0
sentience/backends/cdp_backend.py +393 -0
sentience/backends/exceptions.py +211 -0
sentience/backends/playwright_backend.py +194 -0
sentience/backends/protocol.py +216 -0
sentience/backends/sentience_context.py +469 -0
sentience/backends/snapshot.py +483 -0
sentience/base_agent.py +95 -0
sentience/browser.py +678 -39
sentience/browser_evaluator.py +299 -0
sentience/canonicalization.py +207 -0
sentience/cloud_tracing.py +507 -42
sentience/constants.py +6 -0
sentience/conversational_agent.py +77 -43
sentience/cursor_policy.py +142 -0
sentience/element_filter.py +136 -0
sentience/expect.py +98 -2
sentience/extension/background.js +56 -185
sentience/extension/content.js +150 -287
sentience/extension/injected_api.js +1088 -1368
sentience/extension/manifest.json +1 -1
sentience/extension/pkg/sentience_core.d.ts +22 -22
sentience/extension/pkg/sentience_core.js +275 -433
sentience/extension/pkg/sentience_core_bg.wasm +0 -0
sentience/extension/release.json +47 -47
sentience/failure_artifacts.py +241 -0
sentience/formatting.py +9 -53
sentience/inspector.py +183 -1
sentience/integrations/__init__.py +6 -0
sentience/integrations/langchain/__init__.py +12 -0
sentience/integrations/langchain/context.py +18 -0
sentience/integrations/langchain/core.py +326 -0
sentience/integrations/langchain/tools.py +180 -0
sentience/integrations/models.py +46 -0
sentience/integrations/pydanticai/__init__.py +15 -0
sentience/integrations/pydanticai/deps.py +20 -0
sentience/integrations/pydanticai/toolset.py +468 -0
sentience/llm_interaction_handler.py +191 -0
sentience/llm_provider.py +765 -66
sentience/llm_provider_utils.py +120 -0
sentience/llm_response_builder.py +153 -0
sentience/models.py +595 -3
sentience/ordinal.py +280 -0
sentience/overlay.py +109 -2
sentience/protocols.py +228 -0
sentience/query.py +67 -5
sentience/read.py +95 -3
sentience/recorder.py +223 -3
sentience/schemas/trace_v1.json +128 -9
sentience/screenshot.py +48 -2
sentience/sentience_methods.py +86 -0
sentience/snapshot.py +599 -55
sentience/snapshot_diff.py +126 -0
sentience/text_search.py +120 -5
sentience/trace_event_builder.py +148 -0
sentience/trace_file_manager.py +197 -0
sentience/trace_indexing/index_schema.py +95 -7
sentience/trace_indexing/indexer.py +105 -48
sentience/tracer_factory.py +120 -9
sentience/tracing.py +172 -8
sentience/utils/__init__.py +40 -0
sentience/utils/browser.py +46 -0
sentience/{utils.py → utils/element.py} +3 -42
sentience/utils/formatting.py +59 -0
sentience/verification.py +618 -0
sentience/visual_agent.py +2058 -0
sentience/wait.py +68 -2
{sentienceapi-0.90.16.dist-info → sentienceapi-0.98.0.dist-info}/METADATA +199 -40
sentienceapi-0.98.0.dist-info/RECORD +92 -0
sentience/extension/test-content.js +0 -4
sentienceapi-0.90.16.dist-info/RECORD +0 -50
{sentienceapi-0.90.16.dist-info → sentienceapi-0.98.0.dist-info}/WHEEL +0 -0
{sentienceapi-0.90.16.dist-info → sentienceapi-0.98.0.dist-info}/entry_points.txt +0 -0
{sentienceapi-0.90.16.dist-info → sentienceapi-0.98.0.dist-info}/licenses/LICENSE +0 -0
{sentienceapi-0.90.16.dist-info → sentienceapi-0.98.0.dist-info}/licenses/LICENSE-APACHE +0 -0
{sentienceapi-0.90.16.dist-info → sentienceapi-0.98.0.dist-info}/licenses/LICENSE-MIT +0 -0
{sentienceapi-0.90.16.dist-info → sentienceapi-0.98.0.dist-info}/top_level.txt +0 -0

sentience/backends/__init__.py ADDED Viewed

@@ -0,0 +1,137 @@
+"""
+Browser backend abstractions for Sentience SDK.
+This module provides backend protocols and implementations that allow
+Sentience actions (click, type, scroll) to work with different browser
+automation frameworks.
+Supported Backends
+------------------
+**PlaywrightBackend**
+    Wraps Playwright Page objects. Use this when integrating with existing
+    SentienceBrowser or Playwright-based code.
+**CDPBackendV0**
+    Low-level CDP (Chrome DevTools Protocol) backend. Use this when you have
+    direct access to a CDP client and session.
+**BrowserUseAdapter**
+    High-level adapter for browser-use framework. Automatically creates a
+    CDPBackendV0 from a BrowserSession.
+Quick Start with browser-use
+----------------------------
+.. code-block:: python
+    from browser_use import BrowserSession, BrowserProfile
+    from sentience import get_extension_dir, find
+    from sentience.backends import BrowserUseAdapter, snapshot, click, type_text
+    # Setup browser-use with Sentience extension
+    profile = BrowserProfile(args=[f"--load-extension={get_extension_dir()}"])
+    session = BrowserSession(browser_profile=profile)
+    await session.start()
+    # Create adapter and backend
+    adapter = BrowserUseAdapter(session)
+    backend = await adapter.create_backend()
+    # Take snapshot and interact with elements
+    snap = await snapshot(backend)
+    search_box = find(snap, 'role=textbox[name*="Search"]')
+    await click(backend, search_box.bbox)
+    await type_text(backend, "Sentience AI")
+Snapshot Caching
+----------------
+Use CachedSnapshot to reduce redundant snapshot calls in action loops:
+.. code-block:: python
+    from sentience.backends import CachedSnapshot
+    cache = CachedSnapshot(backend, max_age_ms=2000)
+    snap1 = await cache.get()  # Takes fresh snapshot
+    snap2 = await cache.get()  # Returns cached if < 2s old
+    await click(backend, element.bbox)
+    cache.invalidate()  # Force refresh on next get()
+Error Handling
+--------------
+The module provides specific exceptions for common failure modes:
+- ``ExtensionNotLoadedError``: Extension not loaded in browser launch args
+- ``SnapshotError``: window.sentience.snapshot() failed
+- ``ActionError``: Click/type/scroll operation failed
+All exceptions inherit from ``SentienceBackendError`` and include helpful
+fix suggestions in their error messages.
+.. code-block:: python
+    from sentience.backends import ExtensionNotLoadedError, snapshot
+    try:
+        snap = await snapshot(backend)
+    except ExtensionNotLoadedError as e:
+        print(f"Fix suggestion: {e}")
+"""
+from .actions import click, scroll, scroll_to_element, type_text, wait_for_stable
+from .browser_use_adapter import BrowserUseAdapter, BrowserUseCDPTransport
+from .cdp_backend import CDPBackendV0, CDPTransport
+from .exceptions import (
+    ActionError,
+    BackendEvalError,
+    ExtensionDiagnostics,
+    ExtensionInjectionError,
+    ExtensionNotLoadedError,
+    SentienceBackendError,
+    SnapshotError,
+)
+from .playwright_backend import PlaywrightBackend
+from .protocol import BrowserBackend, LayoutMetrics, ViewportInfo
+from .sentience_context import SentienceContext, SentienceContextState, TopElementSelector
+from .snapshot import CachedSnapshot, snapshot
+# Public names re-exported by this package; each one is imported above from a submodule.
+__all__ = [
+    # Protocol (from .protocol)
+    "BrowserBackend",
+    # Models (also from .protocol)
+    "ViewportInfo",
+    "LayoutMetrics",
+    # CDP Backend (from .cdp_backend)
+    "CDPTransport",
+    "CDPBackendV0",
+    # Playwright Backend (from .playwright_backend)
+    "PlaywrightBackend",
+    # browser-use adapter (from .browser_use_adapter)
+    "BrowserUseAdapter",
+    "BrowserUseCDPTransport",
+    # SentienceContext (Token-Slasher Context Middleware, from .sentience_context)
+    "SentienceContext",
+    "SentienceContextState",
+    "TopElementSelector",
+    # Backend-agnostic functions (snapshot helpers from .snapshot, actions from .actions)
+    "snapshot",
+    "CachedSnapshot",
+    "click",
+    "type_text",
+    "scroll",
+    "scroll_to_element",
+    "wait_for_stable",
+    # Exceptions (from .exceptions)
+    "SentienceBackendError",
+    "ExtensionNotLoadedError",
+    "ExtensionInjectionError",
+    "ExtensionDiagnostics",
+    "BackendEvalError",
+    "SnapshotError",
+    "ActionError",
+]

sentience/backends/actions.py ADDED Viewed

@@ -0,0 +1,372 @@
+"""
+Backend-agnostic actions for browser-use integration.
+These actions work with any BrowserBackend implementation,
+enabling Sentience grounding with browser-use or other frameworks.
+Usage with browser-use:
+    from sentience import find
+    from sentience.backends import BrowserUseAdapter, snapshot
+    from sentience.backends.actions import click, type_text, scroll
+    adapter = BrowserUseAdapter(session)
+    backend = await adapter.create_backend()
+    # Take snapshot and click element
+    snap = await snapshot(backend)
+    element = find(snap, 'role=button[name="Submit"]')
+    await click(backend, element.bbox)
+"""
+import asyncio
+import time
+from typing import TYPE_CHECKING, Any, Literal
+from ..cursor_policy import CursorPolicy, build_human_cursor_path
+from ..models import ActionResult, BBox, Snapshot
+if TYPE_CHECKING:
+    from .protocol import BrowserBackend
+async def click(
+    backend: "BrowserBackend",
+    target: BBox | dict[str, float] | tuple[float, float],
+    button: Literal["left", "right", "middle"] = "left",
+    click_count: int = 1,
+    move_first: bool = True,
+    cursor_policy: CursorPolicy | None = None,
+) -> ActionResult:
+    """
+    Click at coordinates using the backend.
+    Args:
+        backend: BrowserBackend implementation
+        target: Click target - BBox (clicks center), dict with x/y, or (x, y) tuple
+        button: Mouse button to click
+        click_count: Number of clicks (1=single, 2=double)
+        move_first: Whether to move mouse to position before clicking
+    Returns:
+        ActionResult with success status
+    Example:
+        # Click at coordinates
+        await click(backend, (100, 200))
+        # Click element bbox center
+        await click(backend, element.bbox)
+        # Double-click
+        await click(backend, element.bbox, click_count=2)
+    """
+    start_time = time.time()
+    # Resolve coordinates
+    x, y = _resolve_coordinates(target)
+    cursor_meta: dict | None = None
+    try:
+        # Optional mouse move for hover effects
+        if move_first:
+            if cursor_policy is not None and cursor_policy.mode == "human":
+                pos = getattr(backend, "_sentience_cursor_pos", None)
+                if not isinstance(pos, tuple) or len(pos) != 2:
+                    pos = (float(x), float(y))
+                cursor_meta = build_human_cursor_path(
+                    start=(float(pos[0]), float(pos[1])),
+                    target=(float(x), float(y)),
+                    policy=cursor_policy,
+                )
+                pts = cursor_meta.get("path", [])
+                duration_ms_move = int(cursor_meta.get("duration_ms") or 0)
+                per_step_s = (
+                    (duration_ms_move / max(1, len(pts))) / 1000.0 if duration_ms_move > 0 else 0.0
+                )
+                for p in pts:
+                    await backend.mouse_move(float(p["x"]), float(p["y"]))
+                    if per_step_s > 0:
+                        await asyncio.sleep(per_step_s)
+                pause_ms = int(cursor_meta.get("pause_before_click_ms") or 0)
+                if pause_ms > 0:
+                    await asyncio.sleep(pause_ms / 1000.0)
+            else:
+                await backend.mouse_move(x, y)
+                await asyncio.sleep(0.02)  # Brief pause for hover
+        # Perform click
+        await backend.mouse_click(x, y, button=button, click_count=click_count)
+        setattr(backend, "_sentience_cursor_pos", (float(x), float(y)))
+        duration_ms = int((time.time() - start_time) * 1000)
+        return ActionResult(
+            success=True,
+            duration_ms=duration_ms,
+            outcome="dom_updated",
+            cursor=cursor_meta,
+        )
+    except Exception as e:
+        duration_ms = int((time.time() - start_time) * 1000)
+        return ActionResult(
+            success=False,
+            duration_ms=duration_ms,
+            outcome="error",
+            error={"code": "click_failed", "reason": str(e)},
+            cursor=cursor_meta,
+        )
+async def type_text(
+    backend: "BrowserBackend",
+    text: str,
+    target: BBox | dict[str, float] | tuple[float, float] | None = None,
+    clear_first: bool = False,
+) -> ActionResult:
+    """
+    Type text, optionally clicking a target first.
+    Args:
+        backend: BrowserBackend implementation
+        text: Text to type
+        target: Optional click target before typing (BBox, dict, or tuple)
+        clear_first: If True, select all and delete before typing
+    Returns:
+        ActionResult with success status
+    Example:
+        # Type into focused element
+        await type_text(backend, "Hello World")
+        # Click input then type
+        await type_text(backend, "search query", target=search_box.bbox)
+        # Clear and type
+        await type_text(backend, "new value", target=input.bbox, clear_first=True)
+    """
+    start_time = time.time()
+    try:
+        # Click target if provided
+        if target is not None:
+            x, y = _resolve_coordinates(target)
+            await backend.mouse_click(x, y)
+            await asyncio.sleep(0.05)  # Wait for focus
+        # Clear existing content if requested
+        if clear_first:
+            # Select all (Ctrl+A / Cmd+A) and delete
+            await backend.eval("document.execCommand('selectAll')")
+            await asyncio.sleep(0.02)
+        # Type the text
+        await backend.type_text(text)
+        duration_ms = int((time.time() - start_time) * 1000)
+        return ActionResult(
+            success=True,
+            duration_ms=duration_ms,
+            outcome="dom_updated",
+        )
+    except Exception as e:
+        duration_ms = int((time.time() - start_time) * 1000)
+        return ActionResult(
+            success=False,
+            duration_ms=duration_ms,
+            outcome="error",
+            error={"code": "type_failed", "reason": str(e)},
+        )
+async def scroll(
+    backend: "BrowserBackend",
+    delta_y: float = 300,
+    target: BBox | dict[str, float] | tuple[float, float] | None = None,
+) -> ActionResult:
+    """
+    Scroll the page or element.
+    Args:
+        backend: BrowserBackend implementation
+        delta_y: Scroll amount (positive=down, negative=up)
+        target: Optional position for scroll (defaults to viewport center)
+    Returns:
+        ActionResult with success status
+    Example:
+        # Scroll down 300px
+        await scroll(backend, 300)
+        # Scroll up 500px
+        await scroll(backend, -500)
+        # Scroll at specific position
+        await scroll(backend, 200, target=(500, 300))
+    """
+    start_time = time.time()
+    try:
+        x: float | None = None
+        y: float | None = None
+        if target is not None:
+            x, y = _resolve_coordinates(target)
+        await backend.wheel(delta_y=delta_y, x=x, y=y)
+        # Wait for scroll to settle
+        await asyncio.sleep(0.1)
+        duration_ms = int((time.time() - start_time) * 1000)
+        return ActionResult(
+            success=True,
+            duration_ms=duration_ms,
+            outcome="dom_updated",
+        )
+    except Exception as e:
+        duration_ms = int((time.time() - start_time) * 1000)
+        return ActionResult(
+            success=False,
+            duration_ms=duration_ms,
+            outcome="error",
+            error={"code": "scroll_failed", "reason": str(e)},
+        )
+async def scroll_to_element(
+    backend: "BrowserBackend",
+    element_id: int,
+    behavior: Literal["smooth", "instant", "auto"] = "instant",
+    block: Literal["start", "center", "end", "nearest"] = "center",
+) -> ActionResult:
+    """
+    Scroll element into view using JavaScript scrollIntoView.
+    Args:
+        backend: BrowserBackend implementation
+        element_id: Element ID from snapshot (requires sentience_registry)
+        behavior: Scroll behavior
+        block: Vertical alignment
+    Returns:
+        ActionResult with success status
+    """
+    start_time = time.time()
+    try:
+        scrolled = await backend.eval(
+            f"""
+            (() => {{
+                const el = window.sentience_registry && window.sentience_registry[{element_id}];
+                if (el && el.scrollIntoView) {{
+                    el.scrollIntoView({{
+                        behavior: '{behavior}',
+                        block: '{block}',
+                        inline: 'nearest'
+                    }});
+                    return true;
+                }}
+                return false;
+            }})()
+        """
+        )
+        # Wait for scroll animation
+        wait_time = 0.3 if behavior == "smooth" else 0.05
+        await asyncio.sleep(wait_time)
+        duration_ms = int((time.time() - start_time) * 1000)
+        if scrolled:
+            return ActionResult(
+                success=True,
+                duration_ms=duration_ms,
+                outcome="dom_updated",
+            )
+        else:
+            return ActionResult(
+                success=False,
+                duration_ms=duration_ms,
+                outcome="error",
+                error={"code": "scroll_failed", "reason": "Element not found in registry"},
+            )
+    except Exception as e:
+        duration_ms = int((time.time() - start_time) * 1000)
+        return ActionResult(
+            success=False,
+            duration_ms=duration_ms,
+            outcome="error",
+            error={"code": "scroll_failed", "reason": str(e)},
+        )
+async def wait_for_stable(
+    backend: "BrowserBackend",
+    state: Literal["interactive", "complete"] = "complete",
+    timeout_ms: int = 10000,
+) -> ActionResult:
+    """
+    Wait for page to reach stable state.
+    Args:
+        backend: BrowserBackend implementation
+        state: Target document.readyState
+        timeout_ms: Maximum wait time
+    Returns:
+        ActionResult with success status
+    """
+    start_time = time.time()
+    try:
+        await backend.wait_ready_state(state=state, timeout_ms=timeout_ms)
+        duration_ms = int((time.time() - start_time) * 1000)
+        return ActionResult(
+            success=True,
+            duration_ms=duration_ms,
+            outcome="dom_updated",
+        )
+    except TimeoutError as e:
+        duration_ms = int((time.time() - start_time) * 1000)
+        return ActionResult(
+            success=False,
+            duration_ms=duration_ms,
+            outcome="error",
+            error={"code": "timeout", "reason": str(e)},
+        )
+    except Exception as e:
+        duration_ms = int((time.time() - start_time) * 1000)
+        return ActionResult(
+            success=False,
+            duration_ms=duration_ms,
+            outcome="error",
+            error={"code": "wait_failed", "reason": str(e)},
+        )
+def _resolve_coordinates(
+    target: BBox | dict[str, float] | tuple[float, float],
+) -> tuple[float, float]:
+    """
+    Resolve target to (x, y) coordinates.
+    - BBox: Returns center point
+    - dict: Returns x, y keys (or center if width/height present)
+    - tuple: Returns as-is
+    """
+    if isinstance(target, BBox):
+        return (target.x + target.width / 2, target.y + target.height / 2)
+    elif isinstance(target, tuple):
+        return target
+    elif isinstance(target, dict):
+        # If has width/height, compute center
+        if "width" in target and "height" in target:
+            x = target.get("x", 0) + target["width"] / 2
+            y = target.get("y", 0) + target["height"] / 2
+            return (x, y)
+        # Otherwise use x/y directly
+        return (target.get("x", 0), target.get("y", 0))
+    else:
+        raise ValueError(f"Invalid target type: {type(target)}")

sentienceapi 0.90.16__py3-none-any.whl → 0.98.0__py3-none-any.whl

Potentially problematic release.

sentienceapi 0.90.16__py3-none-any.whl → 0.98.0__py3-none-any.whl