PyPI - sentienceapi - Versions diffs - 0.90.16__py3-none-any.whl → 0.98.0__py3-none-any.whl - Mend

sentienceapi-0.90.16-py3-none-any.whl → sentienceapi-0.98.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of sentienceapi might be problematic. Click here for more details.

Files changed (90)

sentience/__init__.py +120 -6
sentience/_extension_loader.py +156 -1
sentience/action_executor.py +217 -0
sentience/actions.py +758 -30
sentience/agent.py +806 -293
sentience/agent_config.py +3 -0
sentience/agent_runtime.py +840 -0
sentience/asserts/__init__.py +70 -0
sentience/asserts/expect.py +621 -0
sentience/asserts/query.py +383 -0
sentience/async_api.py +89 -1141
sentience/backends/__init__.py +137 -0
sentience/backends/actions.py +372 -0
sentience/backends/browser_use_adapter.py +241 -0
sentience/backends/cdp_backend.py +393 -0
sentience/backends/exceptions.py +211 -0
sentience/backends/playwright_backend.py +194 -0
sentience/backends/protocol.py +216 -0
sentience/backends/sentience_context.py +469 -0
sentience/backends/snapshot.py +483 -0
sentience/base_agent.py +95 -0
sentience/browser.py +678 -39
sentience/browser_evaluator.py +299 -0
sentience/canonicalization.py +207 -0
sentience/cloud_tracing.py +507 -42
sentience/constants.py +6 -0
sentience/conversational_agent.py +77 -43
sentience/cursor_policy.py +142 -0
sentience/element_filter.py +136 -0
sentience/expect.py +98 -2
sentience/extension/background.js +56 -185
sentience/extension/content.js +150 -287
sentience/extension/injected_api.js +1088 -1368
sentience/extension/manifest.json +1 -1
sentience/extension/pkg/sentience_core.d.ts +22 -22
sentience/extension/pkg/sentience_core.js +275 -433
sentience/extension/pkg/sentience_core_bg.wasm +0 -0
sentience/extension/release.json +47 -47
sentience/failure_artifacts.py +241 -0
sentience/formatting.py +9 -53
sentience/inspector.py +183 -1
sentience/integrations/__init__.py +6 -0
sentience/integrations/langchain/__init__.py +12 -0
sentience/integrations/langchain/context.py +18 -0
sentience/integrations/langchain/core.py +326 -0
sentience/integrations/langchain/tools.py +180 -0
sentience/integrations/models.py +46 -0
sentience/integrations/pydanticai/__init__.py +15 -0
sentience/integrations/pydanticai/deps.py +20 -0
sentience/integrations/pydanticai/toolset.py +468 -0
sentience/llm_interaction_handler.py +191 -0
sentience/llm_provider.py +765 -66
sentience/llm_provider_utils.py +120 -0
sentience/llm_response_builder.py +153 -0
sentience/models.py +595 -3
sentience/ordinal.py +280 -0
sentience/overlay.py +109 -2
sentience/protocols.py +228 -0
sentience/query.py +67 -5
sentience/read.py +95 -3
sentience/recorder.py +223 -3
sentience/schemas/trace_v1.json +128 -9
sentience/screenshot.py +48 -2
sentience/sentience_methods.py +86 -0
sentience/snapshot.py +599 -55
sentience/snapshot_diff.py +126 -0
sentience/text_search.py +120 -5
sentience/trace_event_builder.py +148 -0
sentience/trace_file_manager.py +197 -0
sentience/trace_indexing/index_schema.py +95 -7
sentience/trace_indexing/indexer.py +105 -48
sentience/tracer_factory.py +120 -9
sentience/tracing.py +172 -8
sentience/utils/__init__.py +40 -0
sentience/utils/browser.py +46 -0
sentience/{utils.py → utils/element.py} +3 -42
sentience/utils/formatting.py +59 -0
sentience/verification.py +618 -0
sentience/visual_agent.py +2058 -0
sentience/wait.py +68 -2
{sentienceapi-0.90.16.dist-info → sentienceapi-0.98.0.dist-info}/METADATA +199 -40
sentienceapi-0.98.0.dist-info/RECORD +92 -0
sentience/extension/test-content.js +0 -4
sentienceapi-0.90.16.dist-info/RECORD +0 -50
{sentienceapi-0.90.16.dist-info → sentienceapi-0.98.0.dist-info}/WHEEL +0 -0
{sentienceapi-0.90.16.dist-info → sentienceapi-0.98.0.dist-info}/entry_points.txt +0 -0
{sentienceapi-0.90.16.dist-info → sentienceapi-0.98.0.dist-info}/licenses/LICENSE +0 -0
{sentienceapi-0.90.16.dist-info → sentienceapi-0.98.0.dist-info}/licenses/LICENSE-APACHE +0 -0
{sentienceapi-0.90.16.dist-info → sentienceapi-0.98.0.dist-info}/licenses/LICENSE-MIT +0 -0
{sentienceapi-0.90.16.dist-info → sentienceapi-0.98.0.dist-info}/top_level.txt +0 -0

sentience/actions.py CHANGED Viewed

@@ -1,12 +1,18 @@
+from typing import Optional
 """
 Actions v1 - click, type, press
 """
+import asyncio
 import time
-from .browser import SentienceBrowser
+from .browser import AsyncSentienceBrowser, SentienceBrowser
+from .browser_evaluator import BrowserEvaluator
+from .cursor_policy import CursorPolicy, build_human_cursor_path
 from .models import ActionResult, BBox, Snapshot
-from .snapshot import snapshot
+from .sentience_methods import SentienceMethod
+from .snapshot import snapshot, snapshot_async
 def click(  # noqa: C901
@@ -14,6 +20,7 @@ def click(  # noqa: C901
     element_id: int,
     use_mouse: bool = True,
     take_snapshot: bool = False,
+    cursor_policy: CursorPolicy | None = None,
 ) -> ActionResult:
     """
     Click an element by ID using hybrid approach (mouse simulation by default)
@@ -33,6 +40,7 @@ def click(  # noqa: C901
     start_time = time.time()
     url_before = browser.page.url
+    cursor_meta: dict | None = None
     if use_mouse:
         # Hybrid approach: Get element bbox from snapshot, calculate center, use mouse.click()
@@ -48,9 +56,49 @@ def click(  # noqa: C901
                 # Calculate center of element bbox
                 center_x = element.bbox.x + element.bbox.width / 2
                 center_y = element.bbox.y + element.bbox.height / 2
-                # Use Playwright's native mouse click for realistic simulation
+                # Optional: human-like cursor movement (opt-in)
                 try:
-                    browser.page.mouse.click(center_x, center_y)
+                    if cursor_policy is not None and cursor_policy.mode == "human":
+                        # Best-effort cursor state on browser instance
+                        pos = getattr(browser, "_sentience_cursor_pos", None)
+                        if not isinstance(pos, tuple) or len(pos) != 2:
+                            try:
+                                vp = browser.page.viewport_size or {}
+                                pos = (
+                                    float(vp.get("width", 0)) / 2.0,
+                                    float(vp.get("height", 0)) / 2.0,
+                                )
+                            except Exception:
+                                pos = (0.0, 0.0)
+                        cursor_meta = build_human_cursor_path(
+                            start=(float(pos[0]), float(pos[1])),
+                            target=(float(center_x), float(center_y)),
+                            policy=cursor_policy,
+                        )
+                        pts = cursor_meta.get("path", [])
+                        steps = int(cursor_meta.get("steps") or max(1, len(pts)))
+                        duration_ms = int(cursor_meta.get("duration_ms") or 0)
+                        per_step_s = (
+                            (duration_ms / max(1, len(pts))) / 1000.0 if duration_ms > 0 else 0.0
+                        )
+                        for p in pts:
+                            browser.page.mouse.move(float(p["x"]), float(p["y"]))
+                            if per_step_s > 0:
+                                time.sleep(per_step_s)
+                        pause_ms = int(cursor_meta.get("pause_before_click_ms") or 0)
+                        if pause_ms > 0:
+                            time.sleep(pause_ms / 1000.0)
+                        browser.page.mouse.click(center_x, center_y)
+                        setattr(
+                            browser, "_sentience_cursor_pos", (float(center_x), float(center_y))
+                        )
+                    else:
+                        # Default behavior (no regression)
+                        browser.page.mouse.click(center_x, center_y)
+                        setattr(
+                            browser, "_sentience_cursor_pos", (float(center_x), float(center_y))
+                        )
                     success = True
                 except Exception:
                     # If navigation happens, mouse.click might fail, but that's OK
@@ -59,13 +107,8 @@ def click(  # noqa: C901
             else:
                 # Fallback to JS click if element not found in snapshot
                 try:
-                    success = browser.page.evaluate(
-                        """
-                        (id) => {
-                            return window.sentience.click(id);
-                        }
-                        """,
-                        element_id,
+                    success = BrowserEvaluator.invoke(
+                        browser.page, SentienceMethod.CLICK, element_id
                     )
                 except Exception:
                     # Navigation might have destroyed context, assume success if URL changed
@@ -73,27 +116,13 @@ def click(  # noqa: C901
         except Exception:
             # Fallback to JS click on error
             try:
-                success = browser.page.evaluate(
-                    """
-                    (id) => {
-                        return window.sentience.click(id);
-                    }
-                    """,
-                    element_id,
-                )
+                success = BrowserEvaluator.invoke(browser.page, SentienceMethod.CLICK, element_id)
             except Exception:
                 # Navigation might have destroyed context, assume success if URL changed
                 success = True
     else:
         # Legacy JS-based click
-        success = browser.page.evaluate(
-            """
-            (id) => {
-                return window.sentience.click(id);
-            }
-            """,
-            element_id,
-        )
+        success = BrowserEvaluator.invoke(browser.page, SentienceMethod.CLICK, element_id)
     # Wait a bit for navigation/DOM updates
     try:
@@ -137,6 +166,7 @@ def click(  # noqa: C901
         outcome=outcome,
         url_changed=url_changed,
         snapshot_after=snapshot_after,
+        cursor=cursor_meta,
         error=(
             None
             if success
@@ -149,7 +179,11 @@ def click(  # noqa: C901
 def type_text(
-    browser: SentienceBrowser, element_id: int, text: str, take_snapshot: bool = False
+    browser: SentienceBrowser,
+    element_id: int,
+    text: str,
+    take_snapshot: bool = False,
+    delay_ms: float = 0,
 ) -> ActionResult:
     """
     Type text into an element (focus then input)
@@ -159,9 +193,16 @@ def type_text(
         element_id: Element ID from snapshot
         text: Text to type
         take_snapshot: Whether to take snapshot after action
+        delay_ms: Delay between keystrokes in milliseconds for human-like typing (default: 0)
     Returns:
         ActionResult
+    Example:
+        >>> # Type instantly (default behavior)
+        >>> type_text(browser, element_id, "Hello World")
+        >>> # Type with human-like delay (~10ms between keystrokes)
+        >>> type_text(browser, element_id, "Hello World", delay_ms=10)
     """
     if not browser.page:
         raise RuntimeError("Browser not started. Call browser.start() first.")
@@ -192,8 +233,8 @@ def type_text(
             error={"code": "focus_failed", "reason": "Element not found"},
         )
-    # Type using Playwright keyboard
-    browser.page.keyboard.type(text)
+    # Type using Playwright keyboard with optional delay between keystrokes
+    browser.page.keyboard.type(text, delay=delay_ms)
     duration_ms = int((time.time() - start_time) * 1000)
     url_after = browser.page.url
@@ -257,6 +298,94 @@ def press(browser: SentienceBrowser, key: str, take_snapshot: bool = False) -> A
     )
+def scroll_to(
+    browser: SentienceBrowser,
+    element_id: int,
+    behavior: str = "smooth",
+    block: str = "center",
+    take_snapshot: bool = False,
+) -> ActionResult:
+    """
+    Scroll an element into view
+    Scrolls the page so that the specified element is visible in the viewport.
+    Uses the element registry to find the element and scrollIntoView() to scroll it.
+    Args:
+        browser: SentienceBrowser instance
+        element_id: Element ID from snapshot to scroll into view
+        behavior: Scroll behavior - 'smooth', 'instant', or 'auto' (default: 'smooth')
+        block: Vertical alignment - 'start', 'center', 'end', or 'nearest' (default: 'center')
+        take_snapshot: Whether to take snapshot after action
+    Returns:
+        ActionResult
+    Example:
+        >>> snap = snapshot(browser)
+        >>> button = find(snap, 'role=button[name="Submit"]')
+        >>> if button:
+        >>>     # Scroll element into view with smooth animation
+        >>>     scroll_to(browser, button.id)
+        >>>     # Scroll instantly to top of viewport
+        >>>     scroll_to(browser, button.id, behavior='instant', block='start')
+    """
+    if not browser.page:
+        raise RuntimeError("Browser not started. Call browser.start() first.")
+    start_time = time.time()
+    url_before = browser.page.url
+    # Scroll element into view using the element registry
+    scrolled = browser.page.evaluate(
+        """
+        (args) => {
+            const el = window.sentience_registry[args.id];
+            if (el && el.scrollIntoView) {
+                el.scrollIntoView({
+                    behavior: args.behavior,
+                    block: args.block,
+                    inline: 'nearest'
+                });
+                return true;
+            }
+            return false;
+        }
+        """,
+        {"id": element_id, "behavior": behavior, "block": block},
+    )
+    if not scrolled:
+        return ActionResult(
+            success=False,
+            duration_ms=int((time.time() - start_time) * 1000),
+            outcome="error",
+            error={"code": "scroll_failed", "reason": "Element not found or not scrollable"},
+        )
+    # Wait a bit for scroll to complete (especially for smooth scrolling)
+    wait_time = 500 if behavior == "smooth" else 100
+    browser.page.wait_for_timeout(wait_time)
+    duration_ms = int((time.time() - start_time) * 1000)
+    url_after = browser.page.url
+    url_changed = url_before != url_after
+    outcome = "navigated" if url_changed else "dom_updated"
+    snapshot_after: Snapshot | None = None
+    if take_snapshot:
+        snapshot_after = snapshot(browser)
+    return ActionResult(
+        success=True,
+        duration_ms=duration_ms,
+        outcome=outcome,
+        url_changed=url_changed,
+        snapshot_after=snapshot_after,
+    )
 def _highlight_rect(
     browser: SentienceBrowser, rect: dict[str, float], duration_sec: float = 2.0
 ) -> None:
@@ -330,6 +459,7 @@ def click_rect(
     highlight: bool = True,
     highlight_duration: float = 2.0,
     take_snapshot: bool = False,
+    cursor_policy: CursorPolicy | None = None,
 ) -> ActionResult:
     """
     Click at the center of a rectangle using Playwright's native mouse simulation.
@@ -385,6 +515,7 @@ def click_rect(
     # Calculate center of rectangle
     center_x = x + w / 2
     center_y = y + h / 2
+    cursor_meta: dict | None = None
     # Show highlight before clicking (if enabled)
     if highlight:
@@ -395,7 +526,35 @@ def click_rect(
     # Use Playwright's native mouse click for realistic simulation
     # This triggers hover, focus, mousedown, mouseup sequences
     try:
+        if cursor_policy is not None and cursor_policy.mode == "human":
+            pos = getattr(browser, "_sentience_cursor_pos", None)
+            if not isinstance(pos, tuple) or len(pos) != 2:
+                try:
+                    vp = browser.page.viewport_size or {}
+                    pos = (float(vp.get("width", 0)) / 2.0, float(vp.get("height", 0)) / 2.0)
+                except Exception:
+                    pos = (0.0, 0.0)
+            cursor_meta = build_human_cursor_path(
+                start=(float(pos[0]), float(pos[1])),
+                target=(float(center_x), float(center_y)),
+                policy=cursor_policy,
+            )
+            pts = cursor_meta.get("path", [])
+            duration_ms_move = int(cursor_meta.get("duration_ms") or 0)
+            per_step_s = (
+                (duration_ms_move / max(1, len(pts))) / 1000.0 if duration_ms_move > 0 else 0.0
+            )
+            for p in pts:
+                browser.page.mouse.move(float(p["x"]), float(p["y"]))
+                if per_step_s > 0:
+                    time.sleep(per_step_s)
+            pause_ms = int(cursor_meta.get("pause_before_click_ms") or 0)
+            if pause_ms > 0:
+                time.sleep(pause_ms / 1000.0)
         browser.page.mouse.click(center_x, center_y)
+        setattr(browser, "_sentience_cursor_pos", (float(center_x), float(center_y)))
         success = True
     except Exception as e:
         success = False
@@ -428,6 +587,575 @@ def click_rect(
         outcome=outcome,
         url_changed=url_changed,
         snapshot_after=snapshot_after,
+        cursor=cursor_meta,
+        error=(
+            None
+            if success
+            else {
+                "code": "click_failed",
+                "reason": error_msg if not success else "Click failed",
+            }
+        ),
+    )
+# ========== Async Action Functions ==========
+async def click_async(
+    browser: AsyncSentienceBrowser,
+    element_id: int,
+    use_mouse: bool = True,
+    take_snapshot: bool = False,
+    cursor_policy: CursorPolicy | None = None,
+) -> ActionResult:
+    """
+    Click an element by ID using hybrid approach (async)
+    Args:
+        browser: AsyncSentienceBrowser instance
+        element_id: Element ID from snapshot
+        use_mouse: If True, use Playwright's mouse.click() at element center
+        take_snapshot: Whether to take snapshot after action
+    Returns:
+        ActionResult
+    """
+    if not browser.page:
+        raise RuntimeError("Browser not started. Call await browser.start() first.")
+    start_time = time.time()
+    url_before = browser.page.url
+    cursor_meta: dict | None = None
+    if use_mouse:
+        try:
+            snap = await snapshot_async(browser)
+            element = None
+            for el in snap.elements:
+                if el.id == element_id:
+                    element = el
+                    break
+            if element:
+                center_x = element.bbox.x + element.bbox.width / 2
+                center_y = element.bbox.y + element.bbox.height / 2
+                try:
+                    if cursor_policy is not None and cursor_policy.mode == "human":
+                        pos = getattr(browser, "_sentience_cursor_pos", None)
+                        if not isinstance(pos, tuple) or len(pos) != 2:
+                            try:
+                                vp = browser.page.viewport_size or {}
+                                pos = (
+                                    float(vp.get("width", 0)) / 2.0,
+                                    float(vp.get("height", 0)) / 2.0,
+                                )
+                            except Exception:
+                                pos = (0.0, 0.0)
+                        cursor_meta = build_human_cursor_path(
+                            start=(float(pos[0]), float(pos[1])),
+                            target=(float(center_x), float(center_y)),
+                            policy=cursor_policy,
+                        )
+                        pts = cursor_meta.get("path", [])
+                        duration_ms = int(cursor_meta.get("duration_ms") or 0)
+                        per_step_s = (
+                            (duration_ms / max(1, len(pts))) / 1000.0 if duration_ms > 0 else 0.0
+                        )
+                        for p in pts:
+                            await browser.page.mouse.move(float(p["x"]), float(p["y"]))
+                            if per_step_s > 0:
+                                await asyncio.sleep(per_step_s)
+                        pause_ms = int(cursor_meta.get("pause_before_click_ms") or 0)
+                        if pause_ms > 0:
+                            await asyncio.sleep(pause_ms / 1000.0)
+                        await browser.page.mouse.click(center_x, center_y)
+                        setattr(
+                            browser, "_sentience_cursor_pos", (float(center_x), float(center_y))
+                        )
+                    else:
+                        await browser.page.mouse.click(center_x, center_y)
+                        setattr(
+                            browser, "_sentience_cursor_pos", (float(center_x), float(center_y))
+                        )
+                    success = True
+                except Exception:
+                    success = True
+            else:
+                try:
+                    success = await browser.page.evaluate(
+                        """
+                        (id) => {
+                            return window.sentience.click(id);
+                        }
+                        """,
+                        element_id,
+                    )
+                except Exception:
+                    success = True
+        except Exception:
+            try:
+                success = await browser.page.evaluate(
+                    """
+                    (id) => {
+                        return window.sentience.click(id);
+                    }
+                    """,
+                    element_id,
+                )
+            except Exception:
+                success = True
+    else:
+        success = await browser.page.evaluate(
+            """
+            (id) => {
+                return window.sentience.click(id);
+            }
+            """,
+            element_id,
+        )
+    # Wait a bit for navigation/DOM updates
+    try:
+        await browser.page.wait_for_timeout(500)
+    except Exception:
+        pass
+    duration_ms = int((time.time() - start_time) * 1000)
+    # Check if URL changed
+    try:
+        url_after = browser.page.url
+        url_changed = url_before != url_after
+    except Exception:
+        url_after = url_before
+        url_changed = True
+    # Determine outcome
+    outcome: str | None = None
+    if url_changed:
+        outcome = "navigated"
+    elif success:
+        outcome = "dom_updated"
+    else:
+        outcome = "error"
+    # Optional snapshot after
+    snapshot_after: Snapshot | None = None
+    if take_snapshot:
+        try:
+            snapshot_after = await snapshot_async(browser)
+        except Exception:
+            pass
+    return ActionResult(
+        success=success,
+        duration_ms=duration_ms,
+        outcome=outcome,
+        url_changed=url_changed,
+        snapshot_after=snapshot_after,
+        cursor=cursor_meta,
+        error=(
+            None
+            if success
+            else {
+                "code": "click_failed",
+                "reason": "Element not found or not clickable",
+            }
+        ),
+    )
+async def type_text_async(
+    browser: AsyncSentienceBrowser,
+    element_id: int,
+    text: str,
+    take_snapshot: bool = False,
+    delay_ms: float = 0,
+) -> ActionResult:
+    """
+    Type text into an element (async)
+    Args:
+        browser: AsyncSentienceBrowser instance
+        element_id: Element ID from snapshot
+        text: Text to type
+        take_snapshot: Whether to take snapshot after action
+        delay_ms: Delay between keystrokes in milliseconds for human-like typing (default: 0)
+    Returns:
+        ActionResult
+    Example:
+        >>> # Type instantly (default behavior)
+        >>> await type_text_async(browser, element_id, "Hello World")
+        >>> # Type with human-like delay (~10ms between keystrokes)
+        >>> await type_text_async(browser, element_id, "Hello World", delay_ms=10)
+    """
+    if not browser.page:
+        raise RuntimeError("Browser not started. Call await browser.start() first.")
+    start_time = time.time()
+    url_before = browser.page.url
+    # Focus element first
+    focused = await browser.page.evaluate(
+        """
+        (id) => {
+            const el = window.sentience_registry[id];
+            if (el) {
+                el.focus();
+                return true;
+            }
+            return false;
+        }
+        """,
+        element_id,
+    )
+    if not focused:
+        return ActionResult(
+            success=False,
+            duration_ms=int((time.time() - start_time) * 1000),
+            outcome="error",
+            error={"code": "focus_failed", "reason": "Element not found"},
+        )
+    # Type using Playwright keyboard with optional delay between keystrokes
+    await browser.page.keyboard.type(text, delay=delay_ms)
+    duration_ms = int((time.time() - start_time) * 1000)
+    url_after = browser.page.url
+    url_changed = url_before != url_after
+    outcome = "navigated" if url_changed else "dom_updated"
+    snapshot_after: Snapshot | None = None
+    if take_snapshot:
+        snapshot_after = await snapshot_async(browser)
+    return ActionResult(
+        success=True,
+        duration_ms=duration_ms,
+        outcome=outcome,
+        url_changed=url_changed,
+        snapshot_after=snapshot_after,
+    )
+async def press_async(
+    browser: AsyncSentienceBrowser, key: str, take_snapshot: bool = False
+) -> ActionResult:
+    """
+    Press a keyboard key (async)
+    Args:
+        browser: AsyncSentienceBrowser instance
+        key: Key to press (e.g., "Enter", "Escape", "Tab")
+        take_snapshot: Whether to take snapshot after action
+    Returns:
+        ActionResult
+    """
+    if not browser.page:
+        raise RuntimeError("Browser not started. Call await browser.start() first.")
+    start_time = time.time()
+    url_before = browser.page.url
+    # Press key using Playwright
+    await browser.page.keyboard.press(key)
+    # Wait a bit for navigation/DOM updates
+    await browser.page.wait_for_timeout(500)
+    duration_ms = int((time.time() - start_time) * 1000)
+    url_after = browser.page.url
+    url_changed = url_before != url_after
+    outcome = "navigated" if url_changed else "dom_updated"
+    snapshot_after: Snapshot | None = None
+    if take_snapshot:
+        snapshot_after = await snapshot_async(browser)
+    return ActionResult(
+        success=True,
+        duration_ms=duration_ms,
+        outcome=outcome,
+        url_changed=url_changed,
+        snapshot_after=snapshot_after,
+    )
+async def scroll_to_async(
+    browser: AsyncSentienceBrowser,
+    element_id: int,
+    behavior: str = "smooth",
+    block: str = "center",
+    take_snapshot: bool = False,
+) -> ActionResult:
+    """
+    Scroll an element into view (async)
+    Scrolls the page so that the specified element is visible in the viewport.
+    Uses the element registry to find the element and scrollIntoView() to scroll it.
+    Args:
+        browser: AsyncSentienceBrowser instance
+        element_id: Element ID from snapshot to scroll into view
+        behavior: Scroll behavior - 'smooth', 'instant', or 'auto' (default: 'smooth')
+        block: Vertical alignment - 'start', 'center', 'end', or 'nearest' (default: 'center')
+        take_snapshot: Whether to take snapshot after action
+    Returns:
+        ActionResult
+    Example:
+        >>> snap = await snapshot_async(browser)
+        >>> button = find(snap, 'role=button[name="Submit"]')
+        >>> if button:
+        >>>     # Scroll element into view with smooth animation
+        >>>     await scroll_to_async(browser, button.id)
+        >>>     # Scroll instantly to top of viewport
+        >>>     await scroll_to_async(browser, button.id, behavior='instant', block='start')
+    """
+    if not browser.page:
+        raise RuntimeError("Browser not started. Call await browser.start() first.")
+    start_time = time.time()
+    url_before = browser.page.url
+    # Scroll element into view using the element registry
+    scrolled = await browser.page.evaluate(
+        """
+        (args) => {
+            const el = window.sentience_registry[args.id];
+            if (el && el.scrollIntoView) {
+                el.scrollIntoView({
+                    behavior: args.behavior,
+                    block: args.block,
+                    inline: 'nearest'
+                });
+                return true;
+            }
+            return false;
+        }
+        """,
+        {"id": element_id, "behavior": behavior, "block": block},
+    )
+    if not scrolled:
+        return ActionResult(
+            success=False,
+            duration_ms=int((time.time() - start_time) * 1000),
+            outcome="error",
+            error={"code": "scroll_failed", "reason": "Element not found or not scrollable"},
+        )
+    # Wait a bit for scroll to complete (especially for smooth scrolling)
+    wait_time = 500 if behavior == "smooth" else 100
+    await browser.page.wait_for_timeout(wait_time)
+    duration_ms = int((time.time() - start_time) * 1000)
+    url_after = browser.page.url
+    url_changed = url_before != url_after
+    outcome = "navigated" if url_changed else "dom_updated"
+    snapshot_after: Snapshot | None = None
+    if take_snapshot:
+        snapshot_after = await snapshot_async(browser)
+    return ActionResult(
+        success=True,
+        duration_ms=duration_ms,
+        outcome=outcome,
+        url_changed=url_changed,
+        snapshot_after=snapshot_after,
+    )
+async def _highlight_rect_async(
+    browser: AsyncSentienceBrowser, rect: dict[str, float], duration_sec: float = 2.0
+) -> None:
+    """Highlight a rectangle with a red border overlay (async)"""
+    if not browser.page:
+        return
+    highlight_id = f"sentience_highlight_{int(time.time() * 1000)}"
+    args = {
+        "rect": {
+            "x": rect["x"],
+            "y": rect["y"],
+            "w": rect["w"],
+            "h": rect["h"],
+        },
+        "highlightId": highlight_id,
+        "durationSec": duration_sec,
+    }
+    await browser.page.evaluate(
+        """
+        (args) => {
+            const { rect, highlightId, durationSec } = args;
+            const overlay = document.createElement('div');
+            overlay.id = highlightId;
+            overlay.style.position = 'fixed';
+            overlay.style.left = `${rect.x}px`;
+            overlay.style.top = `${rect.y}px`;
+            overlay.style.width = `${rect.w}px`;
+            overlay.style.height = `${rect.h}px`;
+            overlay.style.border = '3px solid red';
+            overlay.style.borderRadius = '2px';
+            overlay.style.boxSizing = 'border-box';
+            overlay.style.pointerEvents = 'none';
+            overlay.style.zIndex = '999999';
+            overlay.style.backgroundColor = 'rgba(255, 0, 0, 0.1)';
+            overlay.style.transition = 'opacity 0.3s ease-out';
+            document.body.appendChild(overlay);
+            setTimeout(() => {
+                overlay.style.opacity = '0';
+                setTimeout(() => {
+                    if (overlay.parentNode) {
+                        overlay.parentNode.removeChild(overlay);
+                    }
+                }, 300);
+            }, durationSec * 1000);
+        }
+        """,
+        args,
+    )
+async def click_rect_async(
+    browser: AsyncSentienceBrowser,
+    rect: dict[str, float] | BBox,
+    highlight: bool = True,
+    highlight_duration: float = 2.0,
+    take_snapshot: bool = False,
+    cursor_policy: CursorPolicy | None = None,
+) -> ActionResult:
+    """
+    Click at the center of a rectangle (async)
+    Args:
+        browser: AsyncSentienceBrowser instance
+        rect: Dictionary with x, y, width (w), height (h) keys, or BBox object
+        highlight: Whether to show a red border highlight when clicking
+        highlight_duration: How long to show the highlight in seconds
+        take_snapshot: Whether to take snapshot after action
+    Returns:
+        ActionResult
+    """
+    if not browser.page:
+        raise RuntimeError("Browser not started. Call await browser.start() first.")
+    # Handle BBox object or dict
+    if isinstance(rect, BBox):
+        x = rect.x
+        y = rect.y
+        w = rect.width
+        h = rect.height
+    else:
+        x = rect.get("x", 0)
+        y = rect.get("y", 0)
+        w = rect.get("w") or rect.get("width", 0)
+        h = rect.get("h") or rect.get("height", 0)
+    if w <= 0 or h <= 0:
+        return ActionResult(
+            success=False,
+            duration_ms=0,
+            outcome="error",
+            error={
+                "code": "invalid_rect",
+                "reason": "Rectangle width and height must be positive",
+            },
+        )
+    start_time = time.time()
+    url_before = browser.page.url
+    # Calculate center of rectangle
+    center_x = x + w / 2
+    center_y = y + h / 2
+    cursor_meta: dict | None = None
+    # Show highlight before clicking
+    if highlight:
+        await _highlight_rect_async(browser, {"x": x, "y": y, "w": w, "h": h}, highlight_duration)
+        await browser.page.wait_for_timeout(50)
+    # Use Playwright's native mouse click
+    try:
+        if cursor_policy is not None and cursor_policy.mode == "human":
+            pos = getattr(browser, "_sentience_cursor_pos", None)
+            if not isinstance(pos, tuple) or len(pos) != 2:
+                try:
+                    vp = browser.page.viewport_size or {}
+                    pos = (float(vp.get("width", 0)) / 2.0, float(vp.get("height", 0)) / 2.0)
+                except Exception:
+                    pos = (0.0, 0.0)
+            cursor_meta = build_human_cursor_path(
+                start=(float(pos[0]), float(pos[1])),
+                target=(float(center_x), float(center_y)),
+                policy=cursor_policy,
+            )
+            pts = cursor_meta.get("path", [])
+            duration_ms_move = int(cursor_meta.get("duration_ms") or 0)
+            per_step_s = (
+                (duration_ms_move / max(1, len(pts))) / 1000.0 if duration_ms_move > 0 else 0.0
+            )
+            for p in pts:
+                await browser.page.mouse.move(float(p["x"]), float(p["y"]))
+                if per_step_s > 0:
+                    await asyncio.sleep(per_step_s)
+            pause_ms = int(cursor_meta.get("pause_before_click_ms") or 0)
+            if pause_ms > 0:
+                await asyncio.sleep(pause_ms / 1000.0)
+        await browser.page.mouse.click(center_x, center_y)
+        setattr(browser, "_sentience_cursor_pos", (float(center_x), float(center_y)))
+        success = True
+    except Exception as e:
+        success = False
+        error_msg = str(e)
+    # Wait a bit for navigation/DOM updates
+    await browser.page.wait_for_timeout(500)
+    duration_ms = int((time.time() - start_time) * 1000)
+    url_after = browser.page.url
+    url_changed = url_before != url_after
+    # Determine outcome
+    outcome: str | None = None
+    if url_changed:
+        outcome = "navigated"
+    elif success:
+        outcome = "dom_updated"
+    else:
+        outcome = "error"
+    # Optional snapshot after
+    snapshot_after: Snapshot | None = None
+    if take_snapshot:
+        snapshot_after = await snapshot_async(browser)
+    return ActionResult(
+        success=success,
+        duration_ms=duration_ms,
+        outcome=outcome,
+        url_changed=url_changed,
+        snapshot_after=snapshot_after,
+        cursor=cursor_meta,
         error=(
             None
             if success

sentienceapi 0.90.16__py3-none-any.whl → 0.98.0__py3-none-any.whl

Potentially problematic release.

sentienceapi 0.90.16__py3-none-any.whl → 0.98.0__py3-none-any.whl