PyPI - clerk-sdk - Versions diffs - 0.1.9__tar.gz → 0.2.1__tar.gz - Mend

clerk-sdk 0.1.9__tar.gz → 0.2.1__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (61)

clerk_sdk-0.2.1/MANIFEST.in ADDED Viewed

@@ -0,0 +1,3 @@
+include requirements.txt
+include clerk/gui_automation/requirements.txt
+include README.md

{clerk_sdk-0.1.9/clerk_sdk.egg-info → clerk_sdk-0.2.1}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: clerk-sdk
-Version: 0.1.9
+Version: 0.2.1
 Summary: Library for interacting with Clerk
 Home-page: https://github.com/F-ONE-Group/clerk_pypi
 Author: F-ONE Group
@@ -14,6 +14,15 @@ License-File: LICENSE
 Requires-Dist: pydantic<3.0.0,>=2.0.0
 Requires-Dist: backoff<3.0.0,>=2.0.0
 Requires-Dist: requests<3.0.0,>=2.32.3
+Provides-Extra: all
+Requires-Dist: pydantic<3.0.0,>=2.0.0; extra == "all"
+Requires-Dist: backoff<3.0.0,>=2.0.0; extra == "all"
+Requires-Dist: requests<3.0.0,>=2.32.3; extra == "all"
+Requires-Dist: networkx<4.0.0,>=3.5.0; extra == "all"
+Requires-Dist: websockets>=15.0.1; extra == "all"
+Provides-Extra: gui-automation
+Requires-Dist: networkx<4.0.0,>=3.5.0; extra == "gui-automation"
+Requires-Dist: websockets>=15.0.1; extra == "gui-automation"
 Dynamic: author
 Dynamic: author-email
 Dynamic: classifier
@@ -21,6 +30,7 @@ Dynamic: description
 Dynamic: description-content-type
 Dynamic: home-page
 Dynamic: license-file
+Dynamic: provides-extra
 Dynamic: requires-dist
 Dynamic: requires-python
 Dynamic: summary

clerk_sdk-0.1.9/clerk/client.py → clerk_sdk-0.2.1/clerk/base.py RENAMED Viewed

@@ -1,34 +1,15 @@
 import os
-# import logging
 import requests
 import backoff
-from typing import Dict, List, Optional, Self
-from xml.dom.minidom import Document
+from typing import Dict, Optional, Self
 from pydantic import BaseModel, model_validator, Field
-from .models.file import ParsedFile
 from .models.response_model import StandardResponse
-# logger = logging.getLogger(__name__)
-# logger.setLevel(logging.INFO)
-# if not logger.handlers:
-#     handler = logging.StreamHandler()
-#     formatter = logging.Formatter("[%(levelname)s] %(asctime)s - %(message)s")
-#     handler.setFormatter(formatter)
-#     logger.addHandler(handler)
-# def backoff_handler(details):
-#     logger.warning(
-#         f"Retrying {details['target'].__name__} after {details['tries']} tries..."
-#     )
 def giveup_handler(e):
     return (
         isinstance(e, requests.exceptions.HTTPError)
@@ -37,12 +18,13 @@ def giveup_handler(e):
     )
-class Clerk(BaseModel):
+class BaseClerk(BaseModel):
     api_key: Optional[str] = Field(default=None, min_length=1)
     headers: Dict[str, str] = Field(default_factory=dict)
     base_url: str = Field(
         default_factory=lambda: os.getenv("CLERK_BASE_URL", "https://api.clerk-app.com")
     )
+    root_endpoint: Optional[str] = None
     @model_validator(mode="after")
     def validate_api_key(self) -> Self:
@@ -73,6 +55,8 @@ class Clerk(BaseModel):
         merged_headers = {**self.headers, **headers}
         url = f"{self.base_url}{endpoint}"
+        if self.root_endpoint:
+            url = f"{self.base_url}{self.root_endpoint}{endpoint}"
         # logger.info(f"GET {url} | params={params}")
@@ -99,6 +83,8 @@ class Clerk(BaseModel):
         merged_headers = {**self.headers, **headers}
         url = f"{self.base_url}{endpoint}"
+        if self.root_endpoint:
+            url = f"{self.base_url}{self.root_endpoint}{endpoint}"
         # logger.info(f"POST {url} | body={json} | params={params}")
@@ -106,13 +92,3 @@ class Clerk(BaseModel):
         response.raise_for_status()
         return StandardResponse(**response.json())
-    def get_document(self, document_id: str) -> Document:
-        endpoint = f"/document/{document_id}"
-        res = self.get_request(endpoint=endpoint)
-        return Document(**res.data[0])
-    def get_files_document(self, document_id: str) -> List[ParsedFile]:
-        endpoint = f"/document/{document_id}/files"
-        res = self.get_request(endpoint=endpoint)
-        return [ParsedFile(**d) for d in res.data]

clerk_sdk-0.2.1/clerk/client.py ADDED Viewed

@@ -0,0 +1,17 @@
+from typing import List
+from xml.dom.minidom import Document
+from clerk.base import BaseClerk
+from .models.file import ParsedFile
+class Clerk(BaseClerk):
+    def get_document(self, document_id: str) -> Document:
+        endpoint = f"/document/{document_id}"
+        res = self.get_request(endpoint=endpoint)
+        return Document(**res.data[0])
+    def get_files_document(self, document_id: str) -> List[ParsedFile]:
+        endpoint = f"/document/{document_id}/files"
+        res = self.get_request(endpoint=endpoint)
+        return [ParsedFile(**d) for d in res.data]

{clerk_sdk-0.1.9 → clerk_sdk-0.2.1}/clerk/decorator/models.py RENAMED Viewed

@@ -17,3 +17,4 @@ class Document(BaseModel):
 class ClerkCodePayload(BaseModel):
     document: Document
     structured_data: Dict
+    run_id: Optional[str] = None

{clerk_sdk-0.1.9 → clerk_sdk-0.2.1}/clerk/decorator/task_decorator.py RENAMED Viewed

@@ -1,3 +1,4 @@
+import os
 import pickle
 from typing import Callable, Optional
 from functools import wraps

clerk_sdk-0.2.1/clerk/gui_automation/action_model/__init__.py ADDED Viewed

File without changes

clerk_sdk-0.2.1/clerk/gui_automation/action_model/model.py ADDED Viewed

@@ -0,0 +1,126 @@
+import base64
+import os
+from typing import List, Literal, Optional, Union
+from pydantic import BaseModel, Field, validator
+CoordsType = Union[List[float], List[int]]
+PredictionsFormat = Union[
+    Literal["xyxy"], Literal["xyxyn"], Literal["xywh"], Literal["xywhn"]
+]
+RelationsType = Union[
+    Literal["above"], Literal["below"], Literal["left"], Literal["right"], Literal[""]
+]
+class ImageB64(BaseModel):
+    """
+    A class representing an image encoded in base64 format.
+    Attributes:
+        id (Optional[str]): The ID of the image. Defaults to None.
+        value (str): The base64 encoded value of the image.
+    Methods:
+        from_path(value: Union[str, "ImageB64"]) -> "ImageB64":
+            Creates an ImageB64 instance from a file path or an existing ImageB64 instance.
+            Args:
+                value (Union[str, "ImageB64"]): The file path or an existing ImageB64 instance.
+            Returns:
+                ImageB64: The created ImageB64 instance.
+        _to_b64(path: str) -> str:
+            Encodes the image file at the given path to base64 format.
+            Args:
+                path (str): The path to the image file.
+            Returns:
+                str: The base64 encoded image.
+    """
+    id: Optional[str] = None
+    value: str = ""
+    @classmethod
+    def from_path(cls, value: Union[str, "ImageB64"]) -> "ImageB64":
+        if isinstance(value, ImageB64):
+            return value
+        return ImageB64(
+            id=os.path.basename(value),
+            value=to_b64(value),
+        )
+def to_b64(path: str) -> str:
+    with open(path, "rb") as f:
+        img_b64: str = base64.b64encode(f.read()).decode("utf-8")
+    return img_b64
+class Anchor(BaseModel):
+    """
+    A class representing an anchor for a screenshot.
+    Attributes:
+        value (Union[str, ImageB64]): The value of the anchor, which can be a string or an ImageB64 instance.
+        relation (RelationsType): The relation of the anchor to the target, which can be one of the following: "above", "below", "left", "right", or an empty string.
+    """
+    value: Union[str, ImageB64] = ""
+    relation: RelationsType = ""
+class Screenshot(BaseModel):
+    """
+    A class representing a screenshot.
+    Attributes:
+        screen_b64 (ImageB64): The base64 encoded value of the screenshot.
+        target (Union[str, ImageB64]): The target of the screenshot, which can be a string or an ImageB64 instance.
+        anchors (List[Anchor]): The list of anchors for the screenshot.
+        is_awaited (bool): A flag to signal whether the target should appear immediately or is awaited.
+        target_name (Optional[str]): A readable representation of a target which is set automatically when validating the target and is used in the AM for logging.
+    """
+    screen_b64: ImageB64
+    target: Union[str, ImageB64]
+    anchors: List[Anchor] = []
+    is_awaited: bool = False
+    target_name: Optional[str] = None
+class Coords(BaseModel):
+    """
+    A class representing coordinates.
+    Attributes:
+        value (CoordsType): The value of the coordinates, which can be a list of floats or a list of integers.
+        score (int): The score associated with the coordinates, defaults to 0.
+    """
+    value: CoordsType
+    score: int = 0
+class RouterOutput(BaseModel):
+    """
+    A class representing the output of a router.
+    Attributes:
+        Resources (List[Coords]): A list of coordinates representing the resources.
+        StatusMessage (Union[Literal["Success"], Literal["Failure"], None]): The status message of the router output.
+        ErrorMessage (str): The error message associated with the router output.
+    """
+    Resources: List[Coords] = []
+    StatusMessage: Union[Literal["Success"], Literal["Failure"], None] = None
+    ErrorMessage: str = ""

clerk_sdk-0.2.1/clerk/gui_automation/action_model/utils.py ADDED Viewed

@@ -0,0 +1,26 @@
+from .model import Coords, Screenshot
+from ..decorators.gui_automation import clerk_client
+def get_coordinates(payload: Screenshot) -> Coords:
+    """
+    Get coordinates from the action model API endpoint.
+    The method requires the following environmental variables to work:
+        - AM_URL: action model URL
+    Parameters:
+        payload (Screenshot): The payload containing the necessary data for the request.
+    Returns:
+        Coords: The coordinates obtained from the API response.
+    Raises:
+        RuntimeError: If the API response status code is not 200.
+    Example:
+        payload = Screenshot(screen_b64="base64_encoded_image", target="target_image")
+        coordinates = get_coordinates(payload)
+    """
+    return clerk_client.get_coordinates(payload.model_dump())

clerk_sdk-0.2.1/clerk/gui_automation/client.py ADDED Viewed

@@ -0,0 +1,148 @@
+from typing import Dict, List, Optional
+from pydantic import BaseModel
+from clerk.base import BaseClerk
+from clerk.gui_automation.action_model.model import Coords
+from clerk.gui_automation.exceptions.agent_manager import NoClientsAvailable
+from clerk.gui_automation.ui_state_inspector.models import (
+    ActionString,
+    BaseState,
+    States,
+    TargetWithAnchor,
+)
+from clerk.models.remote_device import RemoteDevice
+class RPAClerk(BaseClerk):
+    root_endpoint: str = "/gui_automation"
+    def allocate_remote_device(self, group_name: str, run_id: str):
+        endpoint = "/remote_device/allocate"
+        res = self.post_request(
+            endpoint=endpoint, json={"group_name": group_name, "run_id": run_id}
+        )
+        if res.data[0] is None:
+            raise NoClientsAvailable()
+        return RemoteDevice(**res.data[0])
+    def deallocate_remote_device(
+        self,
+        remote_device: RemoteDevice,
+        run_id: str,
+    ):
+        endpoint = "/remote_device/deallocate"
+        self.post_request(
+            endpoint=endpoint,
+            json={"id": remote_device.id, "name": remote_device.name, "run_id": run_id},
+        )
+    def get_coordinates(self, payload: Dict) -> Coords:
+        endpoint = "/action_model/get_coordinates"
+        res = self.post_request(endpoint=endpoint, json=payload)
+        if res.data[0] is None:
+            raise RuntimeError("No coordinates found in the response.")
+        return Coords(**res.data[0])
+class GUIVisionClerk(BaseClerk):
+    root_endpoint: str = "/gui_automation/vision"
+    def find_target(self, screen_b64: str, use_ocr: bool, target_prompt: str):
+        endpoint = "/find_target"
+        res = self.post_request(
+            endpoint=endpoint,
+            json={
+                "screen_b64": screen_b64,
+                "use_ocr": use_ocr,
+                "target_prompt": target_prompt,
+            },
+        )
+        return TargetWithAnchor(**res.data[0])
+    def verify_state(
+        self, screen_b64: str, use_ocr: bool, possible_states: States
+    ) -> BaseState:
+        endpoint = "/verify_state"
+        res = self.post_request(
+            endpoint=endpoint,
+            json={
+                "screen_b64": screen_b64,
+                "use_ocr": use_ocr,
+                "possible_states": possible_states,
+            },
+        )
+        return BaseState(**res.data[0])
+    def answer(
+        self, screen_b64: str, use_ocr: bool, question: str, output_model: BaseModel
+    ) -> Dict:
+        endpoint = "/answer"
+        res = self.post_request(
+            endpoint=endpoint,
+            json={
+                "screen_b64": screen_b64,
+                "use_ocr": use_ocr,
+                "question": question,
+                "output_model": output_model.model_json_schema(),
+            },
+        )
+        return output_model(**res.data[0])
+    def classify_state(
+        self, screen_b64: str, use_ocr: bool, possible_states: List[Dict[str, str]]
+    ) -> BaseState:
+        endpoint = "/classify_state"
+        res = self.post_request(
+            endpoint=endpoint,
+            json={
+                "screen_b64": screen_b64,
+                "use_ocr": use_ocr,
+                "possible_states": possible_states,
+            },
+        )
+        return BaseState(**res.data[0])
+    def write_action_string(
+        self, screen_b64: str, use_ocr: bool, action_prompt: str
+    ) -> ActionString:
+        endpoint = "/write_action-string"
+        res = self.post_request(
+            endpoint=endpoint,
+            json={
+                "screen_b64": screen_b64,
+                "use_ocr": use_ocr,
+                "action_prompt": action_prompt,
+            },
+        )
+        return ActionString(**res.data[0])
+class CourseCorrectorClerk(BaseClerk):
+    root_endpoint: str = "/gui_automation/course_corrector"
+    def get_corrective_actions(
+        self,
+        screen_b64: str,
+        use_ocr: str,
+        goal: str,
+        custom_instructions: Optional[str] = None,
+    ) -> ActionString:
+        endpoint = "/get_corrective_actions"
+        res = self.post_request(
+            endpoint=endpoint,
+            json={
+                "screen_b64": screen_b64,
+                "use_ocr": use_ocr,
+                "goal": goal,
+                "custom_instructions": custom_instructions,
+            },
+        )
+        return ActionString(**res.data[0])

clerk_sdk-0.2.1/clerk/gui_automation/client_actor/__init__.py ADDED Viewed

@@ -0,0 +1,4 @@
+from .client_actor import (
+    get_screen,
+    perform_action,
+)

clerk_sdk-0.2.1/clerk/gui_automation/client_actor/client_actor.py ADDED Viewed

@@ -0,0 +1,176 @@
+import asyncio
+import json
+import os
+from typing import Any, Dict, Union
+import pydantic
+import requests
+from .model import (
+    ExecutePayload,
+    DeleteFilesExecutePayload,
+    ApplicationExecutePayload,
+    SaveFilesExecutePayload,
+    WindowExecutePayload,
+    GetFileExecutePayload,
+)
+import backoff
+from .model import PerformActionResponse, ActionStates
+from .exception import PerformActionException, GetScreenError
+async def _perform_action_ws(payload: Dict) -> PerformActionResponse:
+    """Perform an action over a WebSocket connection.
+    Args:
+        payload (Dict): The payload request to be sent.
+    Returns:
+        PerformActionResponse: The response of performing the action.
+    Raises:
+        RuntimeError: If the ACK message is not received within the specified timeout.
+    """
+    from ..decorators.gui_automation import global_ws
+    # 1. Send the payload request
+    if global_ws:
+        await global_ws.send(json.dumps(payload))
+        # 2. wait for ack message
+        try:
+            ack = await asyncio.wait_for(global_ws.recv(), 90)
+            if ack == "OK":
+                action_info = await asyncio.wait_for(global_ws.recv(), 90)
+                return PerformActionResponse(**json.loads(action_info))
+            else:
+                raise RuntimeError("Received ACK != OK")
+        except asyncio.TimeoutError:
+            raise RuntimeError("The ack message did not arrive.")
+    else:
+        raise RuntimeError("The Websocket has not been initiated.")
+async def _get_screen_async() -> str:
+    """
+    Asynchronously retrieves a screen using a WebSocket connection.
+    Returns:
+        str: The base64 encoded screen image.
+    Note:
+        This function sends a request to perform a screenshot action over a WebSocket connection
+        and returns the base64 encoded image of the screen captured.
+    """
+    payload = {
+        "proc_inst_id": os.getenv("PROC_ID"),
+        "client_name": os.getenv("REMOTE_DEVICE_NAME"),
+        "headless": True,
+        "action": {"action_type": "screenshot"},
+    }
+    try:
+        action_info = await _perform_action_ws(payload)
+    except Exception as e:
+        if str(e) in (
+            "The ack message did not arrive.",
+            "Received ACK != OK",
+        ):
+            raise GetScreenError("The ack message did not arrive.")
+        raise  # else raise the error
+    if action_info.screen_b64 is not None:
+        return action_info.screen_b64
+    raise GetScreenError()
+@backoff.on_exception(
+    backoff.expo,
+    (requests.RequestException, pydantic.ValidationError, GetScreenError),
+    max_time=120,
+)
+def get_screen() -> str:
+    """
+    Request the VDI screen and return the base64 representation of the screenshot.
+    Returns:
+        str: The base64 representation of the screenshot.
+    Raises:
+        RuntimeError: If the request to the VDI screen fails.
+    """
+    loop = asyncio.get_event_loop()
+    # asyncio.set_event_loop(loop)
+    task = loop.create_task(_get_screen_async())
+    res = loop.run_until_complete(task)
+    return res
+async def _perform_action_async(
+    payload: Union[
+        ExecutePayload,
+        ApplicationExecutePayload,
+        WindowExecutePayload,
+        SaveFilesExecutePayload,
+        DeleteFilesExecutePayload,
+        GetFileExecutePayload,
+    ],
+) -> Any:
+    """
+    Perform an asynchronous action based on the provided payload.
+    Args:
+        payload (Union[ExecutePayload, ApplicationExecutePayload, WindowExecutePayload, SaveFilesExecutePayload, DeleteFilesExecutePayload, GetFileExecutePayload]): The payload containing information about the action to be performed.
+    Returns:
+        Any: The return value of the action.
+    Raises:
+        PerformActionException: If the action fails with an error message.
+    """
+    req_payload: Dict = {
+        "proc_inst_id": os.getenv("PROC_ID"),
+        "client_name": os.getenv("REMOTE_DEVICE_NAME"),
+        "headless": (
+            True if os.getenv("HEADLESS", "True").lower() == "true" else False
+        ),
+        "action": payload.model_dump(),
+    }
+    action_info = await _perform_action_ws(req_payload)
+    if action_info.state == ActionStates.failed:
+        raise PerformActionException(action_info.message)
+    return action_info.return_value
+def perform_action(
+    payload: Union[
+        ExecutePayload,
+        ApplicationExecutePayload,
+        WindowExecutePayload,
+        SaveFilesExecutePayload,
+        DeleteFilesExecutePayload,
+        GetFileExecutePayload,
+    ],
+) -> Any:
+    """
+    Perform an action on the VDI client.
+    Args:
+        payload (Union[ExecutePayload, ApplicationExecutePayload, WindowExecutePayload]): The payload containing the details of the action to be performed.
+    Raises:
+        PerformActionException: If the action fails.
+        RuntimeError: If the request to perform the action fails.
+    Returns:
+        Any
+    """
+    loop = asyncio.get_event_loop()
+    task = loop.create_task(_perform_action_async(payload))
+    res = loop.run_until_complete(task)
+    return res

clerk_sdk-0.2.1/clerk/gui_automation/client_actor/exception.py ADDED Viewed

@@ -0,0 +1,22 @@
+class PerformActionException(Exception):
+    """
+    A custom exception class for handling errors related to performing actions.
+    """
+    pass
+class GetScreenError(Exception):
+    """
+    A custom exception class for handling errors related to getting the screen.
+    """
+    pass
+class WebSocketConnectionFailed(Exception):
+    """
+    Connection to websocket was not successful
+    """
+    pass

clerk-sdk 0.1.9__tar.gz → 0.2.1__tar.gz

clerk-sdk 0.1.9__tar.gz → 0.2.1__tar.gz