PyPI - notte-sdk - Versions diffs - 0.0.dev0__py3-none-any.whl - Mend

notte-sdk 0.0.dev0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (18) hide show

notte_sdk/__init__.py +7 -0
notte_sdk/client.py +50 -0
notte_sdk/endpoints/__init__.py +0 -0
notte_sdk/endpoints/agents.py +504 -0
notte_sdk/endpoints/base.py +247 -0
notte_sdk/endpoints/page.py +215 -0
notte_sdk/endpoints/personas.py +285 -0
notte_sdk/endpoints/sessions.py +542 -0
notte_sdk/endpoints/vaults.py +83 -0
notte_sdk/errors.py +40 -0
notte_sdk/py.typed +0 -0
notte_sdk/types.py +851 -0
notte_sdk/vault.py +68 -0
notte_sdk/websockets/__init__.py +0 -0
notte_sdk/websockets/recording.py +106 -0
notte_sdk-0.0.dev0.dist-info/METADATA +8 -0
notte_sdk-0.0.dev0.dist-info/RECORD +18 -0
notte_sdk-0.0.dev0.dist-info/WHEEL +4 -0

notte_sdk/types.py ADDED Viewed

@@ -0,0 +1,851 @@
+import datetime as dt
+import json
+from base64 import b64decode, b64encode
+from collections.abc import Sequence
+from enum import StrEnum
+from pathlib import Path
+from typing import Annotated, Any, Generic, Literal, Required, TypeVar
+from notte_core.actions.base import Action, BrowserAction
+from notte_core.browser.observation import Observation, TrajectoryProgress
+from notte_core.browser.snapshot import SnapshotMetadata, TabsData
+from notte_core.controller.actions import BaseAction
+from notte_core.controller.space import BaseActionSpace
+from notte_core.credentials.base import BaseVault, CredentialField, CredentialsDict
+from notte_core.data.space import DataSpace
+from notte_core.llms.engine import LlmModel
+from notte_core.utils.pydantic_schema import create_model_from_schema
+from notte_core.utils.url import get_root_domain
+from pydantic import BaseModel, Field, field_validator, model_validator
+from typing_extensions import TypedDict, override
+# ############################################################
+# Session Management
+# ############################################################
+DEFAULT_OPERATION_SESSION_TIMEOUT_IN_MINUTES = 3
+DEFAULT_GLOBAL_SESSION_TIMEOUT_IN_MINUTES = 30
+DEFAULT_MAX_NB_ACTIONS = 100
+DEFAULT_MAX_NB_STEPS = 20
+DEFAULT_LIMIT_LIST_ITEMS = 10
+class ExecutionResponse(BaseModel):
+    success: Annotated[bool, Field(description="Whether the operation was successful")]
+    message: Annotated[str, Field(description="A message describing the operation")]
+class PlaywrightProxySettings(TypedDict, total=False):
+    server: str
+    bypass: str | None
+    username: str | None
+    password: str | None
+class BrowserType(StrEnum):
+    CHROMIUM = "chromium"
+    CHROME = "chrome"
+    FIREFOX = "firefox"
+class ProxyGeolocation(BaseModel):
+    """
+    Geolocation settings for the proxy.
+    E.g. "New York, NY, US"
+    """
+    city: str
+    state: str
+    country: str
+class ProxyType(StrEnum):
+    NOTTE = "notte"
+    EXTERNAL = "external"
+class ProxySettings(BaseModel):
+    type: ProxyType
+    server: str | None
+    bypass: str | None
+    username: str | None
+    password: str | None
+    # TODO: enable geolocation later on
+    # geolocation: ProxyGeolocation | None
+    @field_validator("server")
+    @classmethod
+    def validate_server(cls, v: str | None, info: Any) -> str | None:
+        if info.data.get("type") == ProxyType.EXTERNAL and v is None:
+            raise ValueError("Server is required for external proxy type")
+        return v
+    def to_playwright(self) -> PlaywrightProxySettings:
+        if self.server is None:
+            raise ValueError("Proxy server is required")
+        return PlaywrightProxySettings(
+            server=self.server,
+            bypass=self.bypass,
+            username=self.username,
+            password=self.password,
+        )
+class Cookie(BaseModel):
+    name: str
+    domain: str
+    path: str
+    httpOnly: bool
+    expirationDate: float | None = None
+    hostOnly: bool | None = None
+    sameSite: str | None = None
+    secure: bool | None = None
+    session: bool | None = None
+    storeId: str | None = None
+    value: str
+    expires: float | None = Field(default=None)
+    @model_validator(mode="before")
+    @classmethod
+    def validate_expiration(cls, data: dict[str, Any]) -> dict[str, Any]:
+        # Handle either expirationDate or expires being provided
+        if data.get("expirationDate") is None and data.get("expires") is not None:
+            data["expirationDate"] = float(data["expires"])
+        elif data.get("expires") is None and data.get("expirationDate") is not None:
+            data["expires"] = float(data["expirationDate"])
+        return data
+    @override
+    def model_post_init(self, __context: Any) -> None:
+        # Set expires if expirationDate is provided but expires is not
+        if self.expirationDate is not None and self.expires is None:
+            self.expires = float(self.expirationDate)
+        # Set expirationDate if expires is provided but expirationDate is not
+        elif self.expires is not None and self.expirationDate is None:
+            self.expirationDate = float(self.expires)
+        if self.sameSite is not None:
+            self.sameSite = self.sameSite.lower()
+            self.sameSite = self.sameSite[0].upper() + self.sameSite[1:]
+    @staticmethod
+    def from_json(path: str | Path) -> list["Cookie"]:
+        path = Path(path)
+        if not path.exists():
+            raise FileNotFoundError(f"Cookies file not found at {path}")
+        with open(path, "r") as f:
+            cookies_json = json.load(f)
+        cookies = [Cookie.model_validate(cookie) for cookie in cookies_json]
+        return cookies
+class UploadCookiesRequest(BaseModel):
+    cookies: list[Cookie]
+    @staticmethod
+    def from_json(path: str | Path) -> "UploadCookiesRequest":
+        cookies = Cookie.from_json(path)
+        return UploadCookiesRequest(cookies=cookies)
+class UploadCookiesResponse(BaseModel):
+    success: bool
+    message: str
+class ReplayResponse(BaseModel):
+    replay: Annotated[bytes | None, Field(description="The session replay in `.webp` format", repr=False)] = None
+    model_config = {  # type: ignore[reportUnknownMemberType]
+        "json_encoders": {
+            bytes: lambda v: b64encode(v).decode("utf-8") if v else None,
+        }
+    }
+    @field_validator("replay", mode="before")
+    @classmethod
+    def decode_replay(cls, value: str | None) -> bytes | None:
+        if value is None:
+            return None
+        if isinstance(value, bytes):
+            return value
+        if not isinstance(value, str):  # pyright: ignore[reportUnnecessaryIsInstance]
+            raise ValueError("replay must be a bytes or a base64 encoded string")  # pyright: ignore[reportUnreachable]
+        return b64decode(value.encode("utf-8"))
+    @override
+    def model_dump(self, *args: Any, **kwargs: Any) -> dict[str, Any]:
+        data = super().model_dump(*args, **kwargs)
+        if self.replay is not None:
+            data["replay"] = b64encode(self.replay).decode("utf-8")
+        return data
+class SessionStartRequestDict(TypedDict, total=False):
+    timeout_minutes: int
+    max_steps: int
+    proxies: list[ProxySettings] | bool
+    browser_type: BrowserType
+    chrome_args: list[str] | None
+class SessionRequestDict(TypedDict, total=False):
+    session_id: str | None
+class SessionStartRequest(BaseModel):
+    timeout_minutes: Annotated[
+        int,
+        Field(
+            description="Session timeout in minutes. Cannot exceed the global timeout.",
+            gt=0,
+            le=DEFAULT_GLOBAL_SESSION_TIMEOUT_IN_MINUTES,
+        ),
+    ] = DEFAULT_OPERATION_SESSION_TIMEOUT_IN_MINUTES
+    max_steps: Annotated[
+        int,
+        Field(
+            gt=0,
+            description="Maximum number of steps in the trajectory. An error will be raised if this limit is reached.",
+        ),
+    ] = DEFAULT_MAX_NB_STEPS
+    proxies: Annotated[
+        list[ProxySettings] | bool,
+        Field(
+            description="List of custom proxies to use for the session. If True, the default proxies will be used.",
+        ),
+    ] = False
+    browser_type: BrowserType = BrowserType.CHROMIUM
+    chrome_args: Annotated[list[str] | None, Field(description="Override the chrome instance arguments")] = None
+    def __post_init__(self):
+        """
+        Validate that the session timeout does not exceed the allowed global limit.
+        Raises:
+            ValueError: If the session's timeout_minutes exceeds DEFAULT_GLOBAL_SESSION_TIMEOUT_IN_MINUTES.
+        """
+        if self.timeout_minutes > DEFAULT_GLOBAL_SESSION_TIMEOUT_IN_MINUTES:
+            raise ValueError(
+                (
+                    "Session timeout cannot be greater than global timeout: "
+                    f"{self.timeout_minutes} > {DEFAULT_GLOBAL_SESSION_TIMEOUT_IN_MINUTES}"
+                )
+            )
+class SessionRequest(BaseModel):
+    session_id: Annotated[
+        str | None,
+        Field(description="The ID of the session. A new session is created when not provided."),
+    ] = None
+class SessionStatusRequest(BaseModel):
+    session_id: Annotated[
+        str | None,
+        Field(description="The ID of the session. A new session is created when not provided."),
+    ] = None
+    replay: Annotated[
+        bool,
+        Field(description="Whether to include the video replay in the response (`.webp` format)."),
+    ] = False
+class ListRequestDict(TypedDict, total=False):
+    only_active: bool
+    limit: int
+class SessionListRequest(BaseModel):
+    only_active: bool = True
+    limit: int = DEFAULT_LIMIT_LIST_ITEMS
+class SessionResponse(BaseModel):
+    session_id: Annotated[
+        str,
+        Field(
+            description=(
+                "The ID of the session (created or existing). "
+                "Use this ID to interact with the session for the next operation."
+            )
+        ),
+    ]
+    timeout_minutes: Annotated[
+        int,
+        Field(description="Session timeout in minutes. Will timeout if now() > last access time + timeout_minutes"),
+    ]
+    created_at: Annotated[dt.datetime, Field(description="Session creation time")]
+    closed_at: Annotated[dt.datetime | None, Field(description="Session closing time")] = None
+    last_accessed_at: Annotated[dt.datetime, Field(description="Last access time")]
+    duration: Annotated[dt.timedelta, Field(description="Session duration")] = Field(
+        default_factory=lambda: dt.timedelta(0)
+    )
+    status: Annotated[
+        Literal["active", "closed", "error", "timed_out"],
+        Field(description="Session status"),
+    ]
+    # TODO: discuss if this is the best way to handle errors
+    error: Annotated[str | None, Field(description="Error message if the operation failed to complete")] = None
+    proxies: Annotated[
+        bool,
+        Field(
+            description="Whether proxies were used for the session. True if any proxy was applied during session creation."
+        ),
+    ] = False
+    browser_type: BrowserType = BrowserType.CHROMIUM
+    @field_validator("closed_at", mode="before")
+    @classmethod
+    def validate_closed_at(cls, value: dt.datetime | None, info: Any) -> dt.datetime | None:
+        data = info.data
+        if data.get("status") == "closed" and value is None:
+            raise ValueError("closed_at must be provided if status is closed")
+        return value
+    @field_validator("duration", mode="before")
+    @classmethod
+    def compute_duration(cls, value: dt.timedelta | None, info: Any) -> dt.timedelta:
+        data = info.data
+        if value is not None:
+            return value
+        if data.get("status") == "closed" and data.get("closed_at") is not None:
+            return data["closed_at"] - data["created_at"]
+        return dt.datetime.now() - data["created_at"]
+class SessionStatusResponse(SessionResponse, ReplayResponse):
+    pass
+class SessionResponseDict(TypedDict, total=False):
+    session_id: str
+    timeout_minutes: int
+    created_at: dt.datetime
+    last_accessed_at: dt.datetime
+    duration: dt.timedelta
+    closed_at: dt.datetime | None
+    status: Literal["active", "closed", "error", "timed_out"]
+    error: str | None
+    proxies: bool
+    browser_type: BrowserType
+# ############################################################
+# Session debug endpoints
+# ############################################################
+class TabSessionDebugRequest(BaseModel):
+    tab_idx: int
+class TabSessionDebugResponse(BaseModel):
+    metadata: TabsData
+    debug_url: str
+    ws_url: str
+class WebSocketUrls(BaseModel):
+    cdp: Annotated[str, Field(description="WebSocket URL to connect using CDP protocol")]
+    recording: Annotated[str, Field(description="WebSocket URL for live session recording (screenshot stream)")]
+    logs: Annotated[str, Field(description="WebSocket URL for live logs (obsveration / actions events)")]
+class SessionDebugResponse(BaseModel):
+    debug_url: str
+    ws: WebSocketUrls
+    tabs: list[TabSessionDebugResponse]
+class SessionDebugRecordingEvent(BaseModel):
+    """Model for events that can be sent over the recording WebSocket"""
+    type: Literal["action", "observation", "error"]
+    data: BaseAction | Observation | str
+    timestamp: dt.datetime = Field(default_factory=dt.datetime.now)
+    @staticmethod
+    def session_closed() -> "SessionDebugRecordingEvent":
+        return SessionDebugRecordingEvent(
+            type="error",
+            data="Session closed by user. No more actions will be recorded.",
+        )
+# ############################################################
+# Persona
+# ############################################################
+class EmailsReadRequestDict(TypedDict, total=False):
+    limit: int
+    timedelta: dt.timedelta | None
+    unread_only: bool
+class EmailsReadRequest(BaseModel):
+    limit: Annotated[int, Field(description="Max number of emails to return")] = DEFAULT_LIMIT_LIST_ITEMS
+    timedelta: Annotated[
+        dt.timedelta | None, Field(description="Return only emails that are not older than <timedelta>")
+    ] = None
+    unread_only: Annotated[bool, Field(description="Return only previously unread emails")] = False
+class EmailResponse(BaseModel):
+    subject: Annotated[str, Field(description="Subject of the email")]
+    email_id: Annotated[str, Field(description="Email UUID")]
+    created_at: Annotated[dt.datetime, Field(description="Creation date")]
+    sender_email: Annotated[str | None, Field(description="Email address of the sender")]
+    sender_name: Annotated[str | None, Field(description="Name (if available) of the sender")]
+    text_content: Annotated[
+        str | None, Field(description="Raw textual body, can be uncorrelated with html content")
+    ] = None
+    html_content: Annotated[str | None, Field(description="HTML body, can be uncorrelated with raw content")] = None
+class SMSReadRequestDict(TypedDict, total=False):
+    limit: int
+    timedelta: dt.timedelta | None
+    unread_only: bool
+class SMSReadRequest(BaseModel):
+    limit: Annotated[int, Field(description="Max number of messages to return")] = DEFAULT_LIMIT_LIST_ITEMS
+    timedelta: Annotated[
+        dt.timedelta | None, Field(description="Return only messages that are not older than <timedelta>")
+    ] = None
+    unread_only: Annotated[bool, Field(description="Return only previously unread messages")] = False
+class SMSResponse(BaseModel):
+    body: Annotated[str, Field(description="SMS message body")]
+    sms_id: Annotated[str, Field(description="SMS UUID")]
+    created_at: Annotated[dt.datetime, Field(description="Creation date")]
+    sender: Annotated[str | None, Field(description="SMS sender phone number")]
+class PersonaCreateRequestDict(TypedDict, total=False):
+    pass
+class PersonaCreateRequest(BaseModel):
+    pass
+class PersonaCreateResponse(BaseModel):
+    persona_id: Annotated[str, Field(description="ID of the created persona")]
+class VirtualNumberRequestDict(TypedDict, total=False):
+    pass
+class VirtualNumberRequest(BaseModel):
+    pass
+class VirtualNumberResponse(BaseModel):
+    status: Annotated[str, Field(description="Status of the created virtual number")]
+class AddCredentialsRequestDict(CredentialsDict, total=False):
+    url: str | None
+def validate_url(value: str | None) -> str | None:
+    if value is None:
+        return None
+    domain_url = get_root_domain(value)
+    if len(domain_url) == 0:
+        raise ValueError(f"Invalid URL: {value}. Please provide a valid URL with a domain name.")
+    return domain_url
+class AddCredentialsRequest(BaseModel):
+    url: str | None
+    credentials: Annotated[list[CredentialField], Field(description="Credentials to add")]
+    @field_validator("url", mode="before")
+    @classmethod
+    def validate_url(cls, value: str | None) -> str | None:
+        return validate_url(value)
+    @staticmethod
+    def load(body: dict[str, Any]) -> "AddCredentialsRequest":
+        url = body.get("url")
+        creds = [CredentialField.from_dict(field) for field in body["credentials"]]
+        return AddCredentialsRequest(url=url, credentials=creds)
+    @classmethod
+    def from_request_dict(cls, dic: AddCredentialsRequestDict):
+        if "url" not in dic:
+            raise ValueError("Invalid credentials request dict")
+        no_url = dic.copy()
+        del no_url["url"]
+        creds = BaseVault.credentials_dict_to_field(no_url)
+        return AddCredentialsRequest(url=dic["url"], credentials=creds)
+class AddCredentialsResponse(BaseModel):
+    status: Annotated[str, Field(description="Status of the created credentials")]
+class GetCredentialsRequestDict(TypedDict, total=False):
+    url: str | None
+class GetCredentialsRequest(BaseModel):
+    url: str | None
+    @field_validator("url", mode="before")
+    @classmethod
+    def validate_url(cls, value: str | None) -> str | None:
+        return validate_url(value)
+class GetCredentialsResponse(BaseModel):
+    credentials: Annotated[list[CredentialField], Field(description="Retrieved credentials")]
+class DeleteCredentialsRequestDict(TypedDict, total=False):
+    url: str | None
+class DeleteCredentialsRequest(BaseModel):
+    url: str | None
+    @field_validator("url", mode="before")
+    @classmethod
+    def validate_url(cls, value: str | None) -> str | None:
+        return validate_url(value)
+class DeleteCredentialsResponse(BaseModel):
+    status: Annotated[str, Field(description="Status of the deletion")]
+# ############################################################
+# Environment endpoints
+# ############################################################
+class PaginationParamsDict(TypedDict, total=False):
+    min_nb_actions: int | None
+    max_nb_actions: int
+class PaginationParams(BaseModel):
+    min_nb_actions: Annotated[
+        int | None,
+        Field(
+            description=(
+                "The minimum number of actions to list before stopping. "
+                "If not provided, the listing will continue until the maximum number of actions is reached."
+            ),
+        ),
+    ] = None
+    max_nb_actions: Annotated[
+        int,
+        Field(
+            description=(
+                "The maximum number of actions to list after which the listing will stop. "
+                "Used when min_nb_actions is not provided."
+            ),
+        ),
+    ] = DEFAULT_MAX_NB_ACTIONS
+class ObserveRequest(PaginationParams):
+    url: Annotated[
+        str | None,
+        Field(description="The URL to observe. If not provided, uses the current page URL."),
+    ] = None
+class ObserveRequestDict(PaginationParamsDict, total=False):
+    url: str | None
+class ScrapeParamsDict(TypedDict, total=False):
+    scrape_links: bool
+    only_main_content: bool
+    response_format: type[BaseModel] | None
+    instructions: str | None
+    use_llm: bool | None
+class ScrapeRequestDict(ScrapeParamsDict, total=False):
+    url: str | None
+class ScrapeParams(BaseModel):
+    scrape_links: Annotated[
+        bool,
+        Field(description="Whether to scrape links from the page. Links are scraped by default."),
+    ] = True
+    only_main_content: Annotated[
+        bool,
+        Field(
+            description=(
+                "Whether to only scrape the main content of the page. If True, navbars, footers, etc. are excluded."
+            ),
+        ),
+    ] = True
+    response_format: Annotated[
+        type[BaseModel] | None,
+        Field(description="The response format to use for the scrape."),
+    ] = None
+    instructions: Annotated[str | None, Field(description="The instructions to use for the scrape.")] = None
+    use_llm: Annotated[
+        bool | None,
+        Field(
+            description=(
+                "Whether to use an LLM for the extraction process. This will result in a longer response time but a"
+                " better accuracy. If not provided, the default value is the same as the NotteSession config."
+            )
+        ),
+    ] = None
+    def requires_schema(self) -> bool:
+        return self.response_format is not None or self.instructions is not None
+    @field_validator("response_format", mode="before")
+    @classmethod
+    def convert_response_format(cls, value: dict[str, Any] | type[BaseModel] | None) -> type[BaseModel] | None:
+        """
+        Creates a Pydantic model from a given JSON Schema.
+        Args:
+            schema_name: The name of the model to be created.
+            schema_json: The JSON Schema definition.
+        Returns:
+            The dynamically created Pydantic model class.
+        """
+        if value is None:
+            return None
+        if isinstance(value, type) and issubclass(value, BaseModel):  # type: ignore[arg-type]
+            return value
+        if not isinstance(value, dict):  # type: ignore[arg-type]
+            raise ValueError(f"response_format must be a BaseModel or a dict but got: {type(value)} : {value}")  # type: ignore[unreachable]
+        if len(value.keys()) == 0:
+            return None
+        return create_model_from_schema(value)
+    @override
+    def model_dump(self, *args: Any, **kwargs: Any) -> dict[str, Any]:
+        dump = super().model_dump(*args, **kwargs)
+        if isinstance(self.response_format, type) and issubclass(self.response_format, BaseModel):  # pyright: ignore[reportUnnecessaryIsInstance]
+            dump["response_format"] = self.response_format.model_json_schema()
+        return dump
+    @override
+    def model_dump_json(self, *args: Any, **kwargs: Any) -> str:
+        dump = self.model_dump(*args, **kwargs)
+        if isinstance(self.response_format, type) and issubclass(self.response_format, BaseModel):  # pyright: ignore[reportUnnecessaryIsInstance]
+            dump["response_format"] = self.response_format.model_json_schema()
+        return json.dumps(dump)
+class ScrapeRequest(ScrapeParams):
+    url: Annotated[
+        str | None,
+        Field(description="The URL to scrape. If not provided, uses the current page URL."),
+    ] = None
+class StepRequest(PaginationParams):
+    action_id: Annotated[str, Field(description="The ID of the action to execute")]
+    value: Annotated[str | None, Field(description="The value to input for form actions")] = None
+    enter: Annotated[
+        bool | None,
+        Field(description="Whether to press enter after inputting the value"),
+    ] = None
+class StepRequestDict(PaginationParamsDict, total=False):
+    action_id: str
+    value: str | None
+    enter: bool | None
+class ActionSpaceResponse(BaseModel):
+    markdown: Annotated[str | None, Field(description="Markdown representation of the action space")] = None
+    actions: Annotated[
+        Sequence[Action],
+        Field(description="List of available actions in the current state"),
+    ]
+    browser_actions: Annotated[
+        Sequence[BrowserAction],
+        Field(description="List of special actions, i.e browser actions"),
+    ]
+    # TODO: ActionSpaceResponse should be a subclass of ActionSpace
+    description: str
+    category: str | None = None
+    @staticmethod
+    def from_space(space: BaseActionSpace) -> "ActionSpaceResponse":
+        return ActionSpaceResponse(
+            markdown=space.markdown(),
+            description=space.description,
+            category=space.category,
+            actions=space.actions(),  # type: ignore[arg-type]
+            browser_actions=space.browser_actions(),  # type: ignore[arg-type]
+        )
+class ScrapeResponse(BaseModel):
+    session: Annotated[SessionResponse, Field(description="Browser session information")]
+    data: Annotated[DataSpace, Field(description="Data extracted from the current page")]
+class ObserveResponse(BaseModel):
+    session: Annotated[SessionResponse, Field(description="Browser session information")]
+    space: Annotated[
+        ActionSpaceResponse,
+        Field(description="Available actions in the current state"),
+    ]
+    metadata: SnapshotMetadata
+    screenshot: bytes | None = Field(repr=False)
+    data: DataSpace | None
+    progress: TrajectoryProgress | None
+    model_config = {  # type: ignore[attr-defined]
+        "json_encoders": {
+            bytes: lambda v: b64encode(v).decode("utf-8") if v else None,
+        }
+    }
+    @override
+    def model_dump(self, *args: Any, **kwargs: Any) -> dict[str, Any]:
+        data = super().model_dump(*args, **kwargs)
+        if self.screenshot is not None:
+            data["screenshot"] = b64encode(self.screenshot).decode("utf-8")
+        return data
+    @staticmethod
+    def from_obs(
+        obs: Observation,
+        session: SessionResponse,
+    ) -> "ObserveResponse":
+        return ObserveResponse(
+            session=session,
+            metadata=obs.metadata,
+            screenshot=obs.screenshot,
+            data=obs.data,
+            space=ActionSpaceResponse.from_space(obs.space),
+            progress=obs.progress,
+        )
+# ############################################################
+# Agent endpoints
+# ############################################################
+class AgentStatus(StrEnum):
+    active = "active"
+    closed = "closed"
+class AgentSessionRequest(BaseModel):
+    agent_id: Annotated[str, Field(description="The ID of the agent to run")]
+class AgentCreateRequestDict(SessionRequestDict, total=False):
+    reasoning_model: LlmModel
+    use_vision: bool
+    max_steps: int
+    persona_id: str | None
+    vault_id: str | None
+class AgentRunRequestDict(TypedDict, total=False):
+    task: Required[str]
+    url: str | None
+class AgentStartRequestDict(AgentCreateRequestDict, AgentRunRequestDict, total=False):
+    pass
+class AgentCreateRequest(SessionRequest):
+    reasoning_model: Annotated[LlmModel, Field(description="The reasoning model to use")] = LlmModel.default()
+    use_vision: Annotated[
+        bool, Field(description="Whether to use vision for the agent. Not all reasoning models support vision.")
+    ] = True
+    max_steps: Annotated[int, Field(description="The maximum number of steps the agent should take")] = (
+        DEFAULT_MAX_NB_STEPS
+    )
+    persona_id: Annotated[str | None, Field(description="The persona to use for the agent")] = None
+    vault_id: Annotated[str | None, Field(description="The vault to use for the agent")] = None
+class AgentRunRequest(BaseModel):
+    task: Annotated[str, Field(description="The task that the agent should perform")]
+    url: Annotated[str | None, Field(description="The URL that the agent should start on (optional)")] = None
+class AgentStartRequest(AgentCreateRequest, AgentRunRequest):
+    pass
+class AgentStatusRequestDict(TypedDict, total=False):
+    agent_id: Required[Annotated[str, Field(description="The ID of the agent for which to get the status")]]
+    replay: bool
+class AgentStatusRequest(AgentSessionRequest):
+    replay: Annotated[bool, Field(description="Whether to include the replay in the response")] = False
+class AgentListRequest(SessionListRequest):
+    pass
+class AgentStopRequest(AgentSessionRequest, ReplayResponse):
+    success: Annotated[bool, Field(description="Whether the agent task was successful")] = False
+    answer: Annotated[str, Field(description="The answer to the agent task")] = "Agent manually stopped by user"
+class AgentResponse(BaseModel):
+    agent_id: Annotated[str, Field(description="The ID of the agent")]
+    created_at: Annotated[dt.datetime, Field(description="The creation time of the agent")]
+    session_id: Annotated[str, Field(description="The ID of the session")]
+    status: Annotated[AgentStatus, Field(description="The status of the agent (active or closed)")]
+    closed_at: Annotated[dt.datetime | None, Field(description="The closing time of the agent")] = None
+# Type variable for an agent step output; bound to BaseModel and used as the
+# generic parameter of AgentStatusResponse.
+TStepOutput = TypeVar("TStepOutput", bound=BaseModel)
+class AgentStatusResponse(AgentResponse, ReplayResponse, Generic[TStepOutput]):
+    task: Annotated[str, Field(description="The task that the agent is currently running")]
+    url: Annotated[str | None, Field(description="The URL that the agent started on")] = None
+    success: Annotated[
+        bool | None,
+        Field(description="Whether the agent task was successful. None if the agent is still running"),
+    ] = None
+    answer: Annotated[
+        str | None,
+        Field(description="The answer to the agent task. None if the agent is still running"),
+    ] = None
+    steps: Annotated[
+        list[TStepOutput],
+        Field(description="The steps that the agent has currently taken"),
+    ] = Field(default_factory=lambda: [])