PyPI - optexity - Versions diffs - 0.1.2__py3-none-any.whl → 0.1.3__py3-none-any.whl - Mend

optexity 0.1.2py3-none-any.whl → 0.1.3py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (76) hide show

optexity/examples/__init__.py +0 -0
optexity/examples/add_example.py +88 -0
optexity/examples/download_pdf_url.py +29 -0
optexity/examples/extract_price_stockanalysis.py +44 -0
optexity/examples/file_upload.py +59 -0
optexity/examples/i94.py +126 -0
optexity/examples/i94_travel_history.py +126 -0
optexity/examples/peachstate_medicaid.py +201 -0
optexity/examples/supabase_login.py +75 -0
optexity/inference/__init__.py +0 -0
optexity/inference/agents/__init__.py +0 -0
optexity/inference/agents/error_handler/__init__.py +0 -0
optexity/inference/agents/error_handler/error_handler.py +39 -0
optexity/inference/agents/error_handler/prompt.py +60 -0
optexity/inference/agents/index_prediction/__init__.py +0 -0
optexity/inference/agents/index_prediction/action_prediction_locator_axtree.py +45 -0
optexity/inference/agents/index_prediction/prompt.py +14 -0
optexity/inference/agents/select_value_prediction/__init__.py +0 -0
optexity/inference/agents/select_value_prediction/prompt.py +20 -0
optexity/inference/agents/select_value_prediction/select_value_prediction.py +39 -0
optexity/inference/agents/two_fa_extraction/__init__.py +0 -0
optexity/inference/agents/two_fa_extraction/prompt.py +23 -0
optexity/inference/agents/two_fa_extraction/two_fa_extraction.py +47 -0
optexity/inference/child_process.py +251 -0
optexity/inference/core/__init__.py +0 -0
optexity/inference/core/interaction/__init__.py +0 -0
optexity/inference/core/interaction/handle_agentic_task.py +79 -0
optexity/inference/core/interaction/handle_check.py +57 -0
optexity/inference/core/interaction/handle_click.py +79 -0
optexity/inference/core/interaction/handle_command.py +261 -0
optexity/inference/core/interaction/handle_input.py +76 -0
optexity/inference/core/interaction/handle_keypress.py +16 -0
optexity/inference/core/interaction/handle_select.py +109 -0
optexity/inference/core/interaction/handle_select_utils.py +132 -0
optexity/inference/core/interaction/handle_upload.py +59 -0
optexity/inference/core/interaction/utils.py +81 -0
optexity/inference/core/logging.py +406 -0
optexity/inference/core/run_assertion.py +55 -0
optexity/inference/core/run_automation.py +463 -0
optexity/inference/core/run_extraction.py +240 -0
optexity/inference/core/run_interaction.py +254 -0
optexity/inference/core/run_python_script.py +20 -0
optexity/inference/core/run_two_fa.py +120 -0
optexity/inference/core/two_factor_auth/__init__.py +0 -0
optexity/inference/infra/__init__.py +0 -0
optexity/inference/infra/browser.py +455 -0
optexity/inference/infra/browser_extension.py +20 -0
optexity/inference/models/__init__.py +22 -0
optexity/inference/models/gemini.py +113 -0
optexity/inference/models/human.py +20 -0
optexity/inference/models/llm_model.py +210 -0
optexity/inference/run_local.py +200 -0
optexity/schema/__init__.py +0 -0
optexity/schema/actions/__init__.py +0 -0
optexity/schema/actions/assertion_action.py +66 -0
optexity/schema/actions/extraction_action.py +143 -0
optexity/schema/actions/interaction_action.py +330 -0
optexity/schema/actions/misc_action.py +18 -0
optexity/schema/actions/prompts.py +27 -0
optexity/schema/actions/two_fa_action.py +24 -0
optexity/schema/automation.py +432 -0
optexity/schema/callback.py +16 -0
optexity/schema/inference.py +87 -0
optexity/schema/memory.py +100 -0
optexity/schema/task.py +212 -0
optexity/schema/token_usage.py +48 -0
optexity/utils/__init__.py +0 -0
optexity/utils/settings.py +54 -0
optexity/utils/utils.py +76 -0
{optexity-0.1.2.dist-info → optexity-0.1.3.dist-info}/METADATA +1 -1
optexity-0.1.3.dist-info/RECORD +80 -0
optexity-0.1.2.dist-info/RECORD +0 -11
{optexity-0.1.2.dist-info → optexity-0.1.3.dist-info}/WHEEL +0 -0
{optexity-0.1.2.dist-info → optexity-0.1.3.dist-info}/entry_points.txt +0 -0
{optexity-0.1.2.dist-info → optexity-0.1.3.dist-info}/licenses/LICENSE +0 -0
{optexity-0.1.2.dist-info → optexity-0.1.3.dist-info}/top_level.txt +0 -0

optexity/inference/core/run_assertion.py ADDED Viewed

@@ -0,0 +1,55 @@
+import logging
+from copy import deepcopy
+from optexity.inference.core.run_extraction import handle_llm_extraction
+from optexity.inference.infra.browser import Browser
+from optexity.inference.models import GeminiModels, get_llm_model
+from optexity.schema.actions.assertion_action import AssertionAction, LLMAssertion
+from optexity.schema.memory import Memory
+logger = logging.getLogger(__name__)
+llm_model = get_llm_model(GeminiModels.GEMINI_2_5_FLASH, True)
+async def run_assertion_action(
+    assertion_action: AssertionAction, memory: Memory, browser: Browser
+):
+    logger.debug(
+        f"---------Running assertion action {assertion_action.model_dump_json()}---------"
+    )
+    if assertion_action.llm:
+        await handle_llm_assertion(assertion_action.llm, memory, browser)
+    elif assertion_action.network_call:
+        raise ValueError("Network call assertions are not supported yet")
+        # await handle_network_call_assertion(
+        #     assertion_action.network_call, memory, browser
+        # )
+    elif assertion_action.python_script:
+        raise ValueError("Python script assertions are not supported yet")
+        # await handle_python_script_assertion(
+        #     assertion_action.python_script, memory, browser
+        # )
+async def handle_llm_assertion(
+    llm_assertion: LLMAssertion, memory: Memory, browser: Browser
+):
+    extra_instruction = """You are a helpful assistant that verifies if the condition is met.
+        Use the info supplied below to verify the condition.
+        The assertion_reason should be a short explanation of why the condition was met or not met.
+        The assertion_result should be True if the condition is met, False otherwise.
+        """
+    llm_assertion_new = deepcopy(llm_assertion)
+    llm_assertion_new.extraction_instructions = (
+        extra_instruction + "\n" + llm_assertion_new.extraction_instructions
+    )
+    output_data = await handle_llm_extraction(llm_assertion_new, memory, browser)
+    if output_data.json_data["assertion_result"]:
+        return True
+    else:
+        raise AssertionError(
+            f"Assertion failed on node {memory.automation_state.step_index}: {output_data.json_data['assertion_reason']}"
+        )

optexity/inference/core/run_automation.py ADDED Viewed

@@ -0,0 +1,463 @@
+import asyncio
+import logging
+import time
+import traceback
+from copy import deepcopy
+from patchright._impl._errors import TimeoutError as PatchrightTimeoutError
+from playwright._impl._errors import TimeoutError as PlaywrightTimeoutError
+from optexity.inference.core.interaction.utils import clean_download
+from optexity.inference.core.logging import (
+    complete_task_in_server,
+    delete_local_data,
+    initiate_callback,
+    save_downloads_in_server,
+    save_latest_memory_state_locally,
+    save_output_data_in_server,
+    save_trajectory_in_server,
+    start_task_in_server,
+)
+from optexity.inference.core.run_assertion import run_assertion_action
+from optexity.inference.core.run_extraction import run_extraction_action
+from optexity.inference.core.run_interaction import (
+    handle_download_url_as_pdf,
+    run_interaction_action,
+)
+from optexity.inference.core.run_python_script import run_python_script_action
+from optexity.inference.core.run_two_fa import run_two_fa_action
+from optexity.inference.infra.browser import Browser
+from optexity.schema.actions.interaction_action import DownloadUrlAsPdfAction
+from optexity.schema.automation import ActionNode, ForLoopNode, IfElseNode
+from optexity.schema.memory import BrowserState, ForLoopStatus, Memory, OutputData
+from optexity.schema.task import Task
+from optexity.utils.settings import settings
+logger = logging.getLogger(__name__)
+# TODO: static check that index for all replacement of input variables are within the bounds of the input variables
+# TODO: static check that all for loop expansion for generated variables have some place where generated variables are added to the memory
+# TODO: Check that all for loop expansion for generated variables have some place where generated variables are added to the memory
+# TODO: give a warning where any variable of type {variable_name[index]} is used but variable_name is not in the memory in generated variables or in input variables
+async def run_automation(task: Task, child_process_id: int):
+    file_handler = logging.FileHandler(str(task.log_file_path))
+    file_handler.setLevel(logging.DEBUG)
+    current_module = __name__.split(".")[0]  # top-level module/package
+    logging.getLogger(current_module).addHandler(file_handler)
+    logging.getLogger("browser_use").setLevel(logging.INFO)
+    logger.info(f"Task {task.task_id} started running")
+    memory = None
+    browser = None
+    try:
+        await start_task_in_server(task)
+        memory = Memory()
+        browser = Browser(
+            memory=memory,
+            headless=False,
+            channel=task.automation.browser_channel,
+            debug_port=9222 + child_process_id,
+            use_proxy=task.use_proxy,
+            proxy_session_id=task.proxy_session_id(
+                settings.PROXY_PROVIDER if task.use_proxy else None
+            ),
+        )
+        await browser.start()
+        automation = task.automation
+        memory.automation_state.step_index = -1
+        memory.automation_state.try_index = 0
+        if task.use_proxy:
+            await browser.go_to_url("https://ipinfo.io/json")
+            page = await browser.get_current_page()
+            ip_info = await page.evaluate(
+                """
+                async () => {
+                const res = await fetch("https://ipinfo.io/json");
+                return await res.json();
+                }
+                """
+            )
+            if isinstance(ip_info, dict):
+                memory.variables.output_data.append(
+                    OutputData(unique_identifier="ip_info", json_data=ip_info)
+                )
+            elif isinstance(ip_info, str):
+                memory.variables.output_data.append(
+                    OutputData(unique_identifier="ip_info", text=ip_info)
+                )
+            else:
+                try:
+                    memory.variables.output_data.append(
+                        OutputData(unique_identifier="ip_info", text=str(ip_info))
+                    )
+                except Exception as e:
+                    logger.error(f"Error getting IP info: {e}")
+        await browser.go_to_url(task.automation.url)
+        full_automation = []
+        for node in automation.nodes:
+            if isinstance(node, ForLoopNode):
+                await handle_for_loop_node(node, memory, task, browser, full_automation)
+            elif isinstance(node, IfElseNode):
+                await handle_if_else_node(node, memory, task, browser, full_automation)
+            else:
+                full_automation.append(node.model_dump())
+                await run_action_node(
+                    node,
+                    task,
+                    memory,
+                    browser,
+                )
+        task.status = "success"
+    except AssertionError as e:
+        logger.error(f"Assertion error: {e}")
+        task.error = str(e)
+        task.status = "failed"
+    except Exception as e:
+        logger.error(f"Error running automation: {traceback.format_exc()}")
+        task.error = str(e)
+        task.status = "failed"
+    finally:
+        if task and memory:
+            await run_final_downloads_check(task, memory, browser)
+        if memory and browser:
+            await run_final_logging(task, memory, browser, child_process_id)
+        if browser:
+            await browser.stop()
+    logger.info(f"Task {task.task_id} completed with status {task.status}")
+    logging.getLogger(current_module).removeHandler(file_handler)
+async def run_final_downloads_check(task: Task, memory: Memory, browser: Browser):
+    try:
+        logger.debug("Running final downloads check")
+        max_timeout = 10.0
+        start = time.monotonic()
+        await asyncio.wait_for(
+            browser.all_active_downloads_done.wait(), timeout=max_timeout
+        )
+        max_timeout = max(0.0, max_timeout - (time.monotonic() - start))
+        for temp_download_path, (
+            is_downloaded,
+            download,
+        ) in memory.raw_downloads.items():
+            if is_downloaded:
+                continue
+            download_path = task.downloads_directory / download.suggested_filename
+            await download.save_as(download_path)
+            memory.downloads.append(download_path)
+            await clean_download(download_path)
+            memory.raw_downloads[temp_download_path] = (True, download)
+        while max_timeout > 0:
+            if (
+                len(memory.urls_to_downloads) + len(memory.downloads)
+                >= task.automation.expected_downloads
+            ):
+                break
+            interval = min(1, max_timeout)
+            await asyncio.sleep(interval)
+            max_timeout = max(0.0, max_timeout - interval)
+        for url, filename in memory.urls_to_downloads:
+            download_path = task.downloads_directory / filename
+            await handle_download_url_as_pdf(
+                DownloadUrlAsPdfAction(url=url, download_filename=filename),
+                task,
+                memory,
+                browser,
+            )
+    except Exception as e:
+        logger.error(f"Error running final downloads check: {e}")
+    logger.warning(
+        f"Found {len(memory.downloads)} downloads, expected {task.automation.expected_downloads}"
+    )
+async def run_final_logging(
+    task: Task, memory: Memory, browser: Browser, child_process_id: int
+):
+    try:
+        await complete_task_in_server(task, memory.token_usage, child_process_id)
+        try:
+            memory.automation_state.step_index += 1
+            browser_state_summary = await browser.get_browser_state_summary()
+            memory.browser_states.append(
+                BrowserState(
+                    url=browser_state_summary.url,
+                    screenshot=browser_state_summary.screenshot,
+                    title=browser_state_summary.title,
+                    axtree=browser_state_summary.dom_state.llm_representation(),
+                )
+            )
+            memory.final_screenshot = await browser.get_screenshot(full_page=True)
+        except Exception as e:
+            logger.error(f"Error getting final screenshot: {e}")
+        await save_output_data_in_server(task, memory)
+        await save_downloads_in_server(task, memory)
+        await save_latest_memory_state_locally(task, memory, None)
+        await save_trajectory_in_server(task, memory)
+        await initiate_callback(task)
+        await delete_local_data(task)
+    except Exception as e:
+        logger.error(f"Error running final logging: {e}")
+async def run_action_node(
+    action_node: ActionNode,
+    task: Task,
+    memory: Memory,
+    browser: Browser,
+):
+    await asyncio.sleep(action_node.before_sleep_time)
+    await browser.handle_new_tabs(0)
+    memory.automation_state.step_index += 1
+    memory.automation_state.try_index = 0
+    await action_node.replace_variables(task.input_parameters)
+    await action_node.replace_variables(task.secure_parameters)
+    await action_node.replace_variables(memory.variables.generated_variables)
+    # ## TODO: optimize this by taking screenshot and axtree only if needed
+    # browser_state_summary = await browser.get_browser_state_summary()
+    memory.browser_states.append(
+        BrowserState(
+            url=await browser.get_current_page_url(),
+            screenshot=None,
+            title=await browser.get_current_page_title(),
+            axtree=None,
+        )
+    )
+    logger.debug(f"-----Running node {memory.automation_state.step_index}-----")
+    try:
+        if action_node.interaction_action:
+            ## Assuming network calls are only made during interaction actions and not during extraction actions
+            await browser.clear_network_calls()
+            await browser.attach_network_listeners()
+            await run_interaction_action(
+                action_node.interaction_action, task, memory, browser, 2
+            )
+        elif action_node.extraction_action:
+            await run_extraction_action(
+                action_node.extraction_action, memory, browser, task
+            )
+        elif action_node.two_fa_action:
+            await run_two_fa_action(action_node.two_fa_action, memory)
+        elif action_node.python_script_action:
+            await run_python_script_action(
+                action_node.python_script_action, memory, browser
+            )
+        elif action_node.assertion_action:
+            await run_assertion_action(action_node.assertion_action, memory, browser)
+    except Exception as e:
+        logger.error(f"Error running node {memory.automation_state.step_index}: {e}")
+        raise e
+    finally:
+        await save_latest_memory_state_locally(task, memory, action_node)
+    if action_node.expect_new_tab:
+        found_new_tab, total_time = await browser.handle_new_tabs(
+            action_node.max_new_tab_wait_time
+        )
+        if not found_new_tab:
+            logger.warning(
+                f"No new tab found after {action_node.max_new_tab_wait_time} seconds, even though expect_new_tab is True"
+            )
+        else:
+            logger.debug(f"Switched to new tab after {total_time} seconds, as expected")
+    else:
+        await sleep_for_page_to_load(browser, action_node.end_sleep_time)
+    logger.debug(f"-----Finished node {memory.automation_state.step_index}-----")
+async def sleep_for_page_to_load(browser: Browser, sleep_time: float):
+    await asyncio.sleep(0.1)
+    sleep_time = max(0.0, sleep_time - 0.1)
+    if float(sleep_time) == 0.0:
+        return
+    page = await browser.get_current_page()
+    if page is None:
+        return
+    try:
+        await page.wait_for_load_state("load", timeout=sleep_time * 1000)
+    except TimeoutError as e:
+        pass
+    except PatchrightTimeoutError as e:
+        pass
+    except PlaywrightTimeoutError as e:
+        pass
+def evaluate_condition(condition: str, memory: Memory, task: Task) -> bool:
+    return eval(
+        condition,
+        {},
+        {**task.input_parameters, **memory.variables.generated_variables},
+    )
+async def handle_if_else_node(
+    if_else_node: IfElseNode,
+    memory: Memory,
+    task: Task,
+    browser: Browser,
+    full_automation: list[ActionNode],
+):
+    logger.debug(
+        f"Handling if else node {if_else_node.condition} with if nodes {if_else_node.if_nodes} and else nodes {if_else_node.else_nodes}"
+    )
+    condition_result = evaluate_condition(if_else_node.condition, memory, task)
+    if condition_result:
+        nodes = if_else_node.if_nodes
+    else:
+        nodes = if_else_node.else_nodes
+    for node in nodes:
+        if isinstance(node, ActionNode):
+            full_automation.append(node.model_dump())
+            await run_action_node(
+                node,
+                task,
+                memory,
+                browser,
+            )
+        elif isinstance(node, IfElseNode):
+            await handle_if_else_node(node, memory, task, browser, full_automation)
+        elif isinstance(node, ForLoopNode):
+            await handle_for_loop_node(node, memory, task, browser, full_automation)
+    logger.debug(f"Finished handling if else node {if_else_node.condition}")
+async def handle_for_loop_node(
+    for_loop_node: ForLoopNode,
+    memory: Memory,
+    task: Task,
+    browser: Browser,
+    full_automation: list[ActionNode],
+):
+    if for_loop_node.variable_name in task.input_parameters:
+        values = task.input_parameters[for_loop_node.variable_name]
+    elif for_loop_node.variable_name in memory.variables.generated_variables:
+        values = memory.variables.generated_variables[for_loop_node.variable_name]
+    else:
+        raise ValueError(
+            f"Variable name {for_loop_node.variable_name} not found in input variables or generated variables"
+        )
+    memory.variables.for_loop_status.append([])
+    for index in range(len(values)):
+        try:
+            for node in for_loop_node.nodes:
+                new_node = deepcopy(node)
+                new_node.replace(
+                    f"{{{for_loop_node.variable_name}[index]}}",
+                    f"{{{for_loop_node.variable_name}[{index}]}}",
+                )
+                new_node.replace(
+                    f"{{index_of({for_loop_node.variable_name})}}", f"{index}"
+                )
+                if isinstance(new_node, IfElseNode):
+                    await handle_if_else_node(
+                        new_node, memory, task, browser, full_automation
+                    )
+                else:
+                    full_automation.append(new_node.model_dump())
+                    await run_action_node(
+                        new_node,
+                        task,
+                        memory,
+                        browser,
+                    )
+            memory.variables.for_loop_status[-1].append(
+                ForLoopStatus(
+                    variable_name=for_loop_node.variable_name,
+                    index=index,
+                    value=values[index],
+                    status="success",
+                )
+            )
+        except Exception as e:
+            logger.error(
+                f"Error running for loop node {for_loop_node.variable_name}: {e}"
+            )
+            memory.variables.for_loop_status[-1].append(
+                ForLoopStatus(
+                    variable_name=for_loop_node.variable_name,
+                    index=index,
+                    value=values[index],
+                    status="error",
+                    error=str(e),
+                )
+            )
+            if for_loop_node.on_error_in_loop == "continue":
+                continue
+            elif for_loop_node.on_error_in_loop == "break":
+                for index2 in range(index + 1, len(values)):
+                    memory.variables.for_loop_status[-1].append(
+                        ForLoopStatus(
+                            variable_name=for_loop_node.variable_name,
+                            index=index2,
+                            value=values[index2],
+                            status="skipped",
+                        )
+                    )
+                break
+            else:
+                raise e
+        if index < len(values) - 1:
+            for node in for_loop_node.reset_nodes:
+                if isinstance(node, IfElseNode):
+                    await handle_if_else_node(
+                        node, memory, task, browser, full_automation
+                    )
+                else:
+                    full_automation.append(node.model_dump())
+                    await run_action_node(
+                        node,
+                        task,
+                        memory,
+                        browser,
+                    )

optexity 0.1.2__py3-none-any.whl → 0.1.3__py3-none-any.whl

optexity 0.1.2py3-none-any.whl → 0.1.3py3-none-any.whl