PyPI - minitap-mobile-use - Versions diffs - 3.3.0__py3-none-any.whl - Mend

minitap-mobile-use 3.3.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (115) hide show

minitap/mobile_use/__init__.py +0 -0
minitap/mobile_use/agents/contextor/contextor.md +55 -0
minitap/mobile_use/agents/contextor/contextor.py +175 -0
minitap/mobile_use/agents/contextor/types.py +36 -0
minitap/mobile_use/agents/cortex/cortex.md +135 -0
minitap/mobile_use/agents/cortex/cortex.py +152 -0
minitap/mobile_use/agents/cortex/types.py +15 -0
minitap/mobile_use/agents/executor/executor.md +42 -0
minitap/mobile_use/agents/executor/executor.py +87 -0
minitap/mobile_use/agents/executor/tool_node.py +152 -0
minitap/mobile_use/agents/hopper/hopper.md +15 -0
minitap/mobile_use/agents/hopper/hopper.py +44 -0
minitap/mobile_use/agents/orchestrator/human.md +12 -0
minitap/mobile_use/agents/orchestrator/orchestrator.md +21 -0
minitap/mobile_use/agents/orchestrator/orchestrator.py +134 -0
minitap/mobile_use/agents/orchestrator/types.py +11 -0
minitap/mobile_use/agents/outputter/human.md +25 -0
minitap/mobile_use/agents/outputter/outputter.py +85 -0
minitap/mobile_use/agents/outputter/test_outputter.py +167 -0
minitap/mobile_use/agents/planner/human.md +14 -0
minitap/mobile_use/agents/planner/planner.md +126 -0
minitap/mobile_use/agents/planner/planner.py +101 -0
minitap/mobile_use/agents/planner/types.py +51 -0
minitap/mobile_use/agents/planner/utils.py +70 -0
minitap/mobile_use/agents/summarizer/summarizer.py +35 -0
minitap/mobile_use/agents/video_analyzer/__init__.py +5 -0
minitap/mobile_use/agents/video_analyzer/human.md +5 -0
minitap/mobile_use/agents/video_analyzer/video_analyzer.md +37 -0
minitap/mobile_use/agents/video_analyzer/video_analyzer.py +111 -0
minitap/mobile_use/clients/browserstack_client.py +477 -0
minitap/mobile_use/clients/idb_client.py +429 -0
minitap/mobile_use/clients/ios_client.py +332 -0
minitap/mobile_use/clients/ios_client_config.py +141 -0
minitap/mobile_use/clients/ui_automator_client.py +330 -0
minitap/mobile_use/clients/wda_client.py +526 -0
minitap/mobile_use/clients/wda_lifecycle.py +367 -0
minitap/mobile_use/config.py +413 -0
minitap/mobile_use/constants.py +3 -0
minitap/mobile_use/context.py +106 -0
minitap/mobile_use/controllers/__init__.py +0 -0
minitap/mobile_use/controllers/android_controller.py +524 -0
minitap/mobile_use/controllers/controller_factory.py +46 -0
minitap/mobile_use/controllers/device_controller.py +182 -0
minitap/mobile_use/controllers/ios_controller.py +436 -0
minitap/mobile_use/controllers/platform_specific_commands_controller.py +199 -0
minitap/mobile_use/controllers/types.py +106 -0
minitap/mobile_use/controllers/unified_controller.py +193 -0
minitap/mobile_use/graph/graph.py +160 -0
minitap/mobile_use/graph/state.py +115 -0
minitap/mobile_use/main.py +309 -0
minitap/mobile_use/sdk/__init__.py +12 -0
minitap/mobile_use/sdk/agent.py +1294 -0
minitap/mobile_use/sdk/builders/__init__.py +10 -0
minitap/mobile_use/sdk/builders/agent_config_builder.py +307 -0
minitap/mobile_use/sdk/builders/index.py +15 -0
minitap/mobile_use/sdk/builders/task_request_builder.py +236 -0
minitap/mobile_use/sdk/constants.py +1 -0
minitap/mobile_use/sdk/examples/README.md +83 -0
minitap/mobile_use/sdk/examples/__init__.py +1 -0
minitap/mobile_use/sdk/examples/app_lock_messaging.py +54 -0
minitap/mobile_use/sdk/examples/platform_manual_task_example.py +67 -0
minitap/mobile_use/sdk/examples/platform_minimal_example.py +48 -0
minitap/mobile_use/sdk/examples/simple_photo_organizer.py +76 -0
minitap/mobile_use/sdk/examples/smart_notification_assistant.py +225 -0
minitap/mobile_use/sdk/examples/video_transcription_example.py +117 -0
minitap/mobile_use/sdk/services/cloud_mobile.py +656 -0
minitap/mobile_use/sdk/services/platform.py +434 -0
minitap/mobile_use/sdk/types/__init__.py +51 -0
minitap/mobile_use/sdk/types/agent.py +84 -0
minitap/mobile_use/sdk/types/exceptions.py +138 -0
minitap/mobile_use/sdk/types/platform.py +183 -0
minitap/mobile_use/sdk/types/task.py +269 -0
minitap/mobile_use/sdk/utils.py +29 -0
minitap/mobile_use/services/accessibility.py +100 -0
minitap/mobile_use/services/llm.py +247 -0
minitap/mobile_use/services/telemetry.py +421 -0
minitap/mobile_use/tools/index.py +67 -0
minitap/mobile_use/tools/mobile/back.py +52 -0
minitap/mobile_use/tools/mobile/erase_one_char.py +56 -0
minitap/mobile_use/tools/mobile/focus_and_clear_text.py +317 -0
minitap/mobile_use/tools/mobile/focus_and_input_text.py +153 -0
minitap/mobile_use/tools/mobile/launch_app.py +86 -0
minitap/mobile_use/tools/mobile/long_press_on.py +169 -0
minitap/mobile_use/tools/mobile/open_link.py +62 -0
minitap/mobile_use/tools/mobile/press_key.py +83 -0
minitap/mobile_use/tools/mobile/stop_app.py +62 -0
minitap/mobile_use/tools/mobile/swipe.py +156 -0
minitap/mobile_use/tools/mobile/tap.py +154 -0
minitap/mobile_use/tools/mobile/video_recording.py +177 -0
minitap/mobile_use/tools/mobile/wait_for_delay.py +81 -0
minitap/mobile_use/tools/scratchpad.py +147 -0
minitap/mobile_use/tools/test_utils.py +413 -0
minitap/mobile_use/tools/tool_wrapper.py +16 -0
minitap/mobile_use/tools/types.py +35 -0
minitap/mobile_use/tools/utils.py +336 -0
minitap/mobile_use/utils/app_launch_utils.py +173 -0
minitap/mobile_use/utils/cli_helpers.py +37 -0
minitap/mobile_use/utils/cli_selection.py +143 -0
minitap/mobile_use/utils/conversations.py +31 -0
minitap/mobile_use/utils/decorators.py +124 -0
minitap/mobile_use/utils/errors.py +6 -0
minitap/mobile_use/utils/file.py +13 -0
minitap/mobile_use/utils/logger.py +183 -0
minitap/mobile_use/utils/media.py +186 -0
minitap/mobile_use/utils/recorder.py +52 -0
minitap/mobile_use/utils/requests_utils.py +37 -0
minitap/mobile_use/utils/shell_utils.py +20 -0
minitap/mobile_use/utils/test_ui_hierarchy.py +178 -0
minitap/mobile_use/utils/time.py +6 -0
minitap/mobile_use/utils/ui_hierarchy.py +132 -0
minitap/mobile_use/utils/video.py +281 -0
minitap_mobile_use-3.3.0.dist-info/METADATA +329 -0
minitap_mobile_use-3.3.0.dist-info/RECORD +115 -0
minitap_mobile_use-3.3.0.dist-info/WHEEL +4 -0
minitap_mobile_use-3.3.0.dist-info/entry_points.txt +3 -0

minitap/mobile_use/tools/mobile/video_recording.py ADDED Viewed

@@ -0,0 +1,177 @@
+"""
+Video recording tools for mobile devices.
+Provides start/stop video recording tools that delegate to platform-specific
+controllers (AndroidDeviceController, iOSDeviceController).
+"""
+import shutil
+from typing import Annotated
+from langchain_core.messages import ToolMessage
+from langchain_core.tools import tool
+from langchain_core.tools.base import BaseTool, InjectedToolCallId
+from langgraph.prebuilt import InjectedState
+from langgraph.types import Command
+from minitap.mobile_use.constants import EXECUTOR_MESSAGES_KEY
+from minitap.mobile_use.context import DevicePlatform, MobileUseContext
+from minitap.mobile_use.controllers.controller_factory import get_controller
+from minitap.mobile_use.graph.state import State
+from minitap.mobile_use.tools.tool_wrapper import ToolWrapper
+from minitap.mobile_use.utils.logger import get_logger
+from minitap.mobile_use.utils.video import DEFAULT_MAX_DURATION_SECONDS
+logger = get_logger(__name__)  # module-level logger; used below to report video analysis failures
+def get_start_video_recording_tool(ctx: MobileUseContext) -> BaseTool:
+    @tool
+    async def start_video_recording(
+        agent_thought: str,
+        tool_call_id: Annotated[str, InjectedToolCallId],
+        state: Annotated[State, InjectedState],
+    ):
+        """
+        Starts a background screen recording on the mobile device.
+        Recording continues until stop_video_recording is called.
+        Max duration: 3 min (Android) / 15 min (iOS). Audio is not captured.
+        """
+        platform = ctx.device.mobile_platform
+        controller = get_controller(ctx)
+        if platform in (DevicePlatform.ANDROID, DevicePlatform.IOS):
+            result = await controller.start_video_recording(DEFAULT_MAX_DURATION_SECONDS)
+        else:
+            from minitap.mobile_use.utils.video import VideoRecordingResult
+            result = VideoRecordingResult(
+                success=False,
+                message=f"Unsupported platform: {platform}",
+            )
+        if result.success:
+            agent_outcome = start_video_recording_wrapper.on_success_fn(result.message)
+        else:
+            agent_outcome = start_video_recording_wrapper.on_failure_fn(result.message)
+        tool_message = ToolMessage(
+            tool_call_id=tool_call_id,
+            content=agent_outcome,
+            status="success" if result.success else "error",
+        )
+        return Command(
+            update=await state.asanitize_update(
+                ctx=ctx,
+                update={
+                    "agents_thoughts": [agent_thought, agent_outcome],
+                    EXECUTOR_MESSAGES_KEY: [tool_message],
+                },
+                agent="executor",
+            ),
+        )
+    return start_video_recording
+def get_stop_video_recording_tool(ctx: MobileUseContext) -> BaseTool:
+    from minitap.mobile_use.agents.video_analyzer.video_analyzer import analyze_video
+    @tool
+    async def stop_video_recording(
+        agent_thought: str,
+        tool_call_id: Annotated[str, InjectedToolCallId],
+        state: Annotated[State, InjectedState],
+        prompt: str = "Describe what happened in the video.",
+    ):
+        """
+        Stops the current screen recording and analyzes the video content.
+        Use `prompt` to specify what to extract (e.g., "What happens after each 10s of the video?").
+        """
+        platform = ctx.device.mobile_platform
+        controller = get_controller(ctx)
+        if platform in (DevicePlatform.ANDROID, DevicePlatform.IOS):
+            result = await controller.stop_video_recording()
+        else:
+            from minitap.mobile_use.utils.video import VideoRecordingResult
+            result = VideoRecordingResult(
+                success=False,
+                message=f"Unsupported platform: {platform}",
+            )
+        if not result.success or result.video_path is None:
+            agent_outcome = stop_video_recording_wrapper.on_failure_fn(result.message)
+            tool_message = ToolMessage(
+                tool_call_id=tool_call_id,
+                content=agent_outcome,
+                status="error",
+            )
+            return Command(
+                update=await state.asanitize_update(
+                    ctx=ctx,
+                    update={
+                        "agents_thoughts": [agent_thought, agent_outcome],
+                        EXECUTOR_MESSAGES_KEY: [tool_message],
+                    },
+                    agent="executor",
+                ),
+            )
+        video_path = result.video_path
+        try:
+            analysis_result = await analyze_video(
+                ctx=ctx,
+                video_path=video_path,
+                prompt=prompt,
+            )
+            agent_outcome = stop_video_recording_wrapper.on_success_fn(analysis_result)
+            status = "success"
+        except Exception as e:
+            logger.error(f"Video analysis failed: {e}")
+            agent_outcome = stop_video_recording_wrapper.on_failure_fn(
+                f"Recording stopped but analysis failed: {e}"
+            )
+            status = "error"
+        finally:
+            try:
+                if video_path and video_path.exists():
+                    video_path.unlink()
+                    if video_path.parent.exists():
+                        shutil.rmtree(video_path.parent)
+            except Exception:
+                pass
+        tool_message = ToolMessage(
+            tool_call_id=tool_call_id,
+            content=agent_outcome,
+            status=status,
+        )
+        return Command(
+            update=await state.asanitize_update(
+                ctx=ctx,
+                update={
+                    "agents_thoughts": [agent_thought, agent_outcome],
+                    EXECUTOR_MESSAGES_KEY: [tool_message],
+                },
+                agent="executor",
+            ),
+        )
+    return stop_video_recording
+start_video_recording_wrapper = ToolWrapper(  # pairs the tool factory with its outcome formatters
+    tool_fn_getter=get_start_video_recording_tool,
+    on_success_fn=lambda message: f"Video recording started successfully. {message}",
+    on_failure_fn=lambda message: f"Failed to start video recording: {message}",
+)  # both formatters receive the message of the controller's recording result
+stop_video_recording_wrapper = ToolWrapper(  # pairs the tool factory with its outcome formatters
+    tool_fn_getter=get_stop_video_recording_tool,
+    on_success_fn=lambda analysis: f"Video stopped successfully. Analysis result:\n{analysis}",
+    on_failure_fn=lambda message: f"Video recording/analysis failed: {message}",
+)  # on_failure_fn is used for both stop failures and analysis failures

minitap/mobile_use/tools/mobile/wait_for_delay.py ADDED Viewed

@@ -0,0 +1,81 @@
+import time
+from typing import Annotated
+from langchain_core.messages import ToolMessage
+from langchain_core.tools import tool
+from langchain_core.tools.base import InjectedToolCallId
+from langgraph.prebuilt import InjectedState
+from langgraph.types import Command
+from minitap.mobile_use.constants import EXECUTOR_MESSAGES_KEY
+from minitap.mobile_use.context import MobileUseContext
+from minitap.mobile_use.graph.state import State
+from minitap.mobile_use.tools.tool_wrapper import ToolWrapper
+MAX_DELAY_MS = 60000  # upper bound, in milliseconds, applied to wait_for_delay's time_in_ms
+def get_wait_for_delay_tool(ctx: MobileUseContext):
+    @tool
+    async def wait_for_delay(
+        agent_thought: str,
+        time_in_ms: int,
+        tool_call_id: Annotated[str, InjectedToolCallId],
+        state: Annotated[State, InjectedState],
+    ) -> Command:
+        """
+        Wait for a delay in milliseconds.
+        This tool pauses execution for a specified number of milliseconds.
+        Use this when you need to introduce a controlled delay to allow the UI
+        to update after an action, regardless of whether an animation is playing.
+        Args:
+            time_in_ms: The number of milliseconds to wait. (capped at 60 seconds)
+        Example:
+            - wait_for_delay with time_in_ms=1000 (waits 1 second)
+            - wait_for_delay with time_in_ms=500 (waits 0.5 seconds)
+        """
+        if time_in_ms < 0:
+            time_in_ms = 1000
+        if time_in_ms > MAX_DELAY_MS:
+            time_in_ms = MAX_DELAY_MS
+        try:
+            time.sleep(time_in_ms / 1000)
+            output = None
+            has_failed = False
+        except Exception as e:
+            output = str(e)
+            has_failed = True
+        agent_outcome = (
+            wait_for_delay_wrapper.on_failure_fn()
+            if has_failed
+            else wait_for_delay_wrapper.on_success_fn(time_in_ms)
+        )
+        tool_message = ToolMessage(
+            tool_call_id=tool_call_id,
+            content=agent_outcome,
+            additional_kwargs={"error": output} if has_failed else {},
+            status="error" if has_failed else "success",
+        )
+        return Command(
+            update=await state.asanitize_update(
+                ctx=ctx,
+                update={
+                    "agents_thoughts": [agent_thought, agent_outcome],
+                    EXECUTOR_MESSAGES_KEY: [tool_message],
+                },
+                agent="executor",
+            ),
+        )
+    return wait_for_delay
+wait_for_delay_wrapper = ToolWrapper(  # pairs the tool factory with its outcome formatters
+    tool_fn_getter=get_wait_for_delay_tool,
+    on_success_fn=lambda delay: f"Successfully waited for {delay} milliseconds.",
+    on_failure_fn=lambda: "Failed to wait for delay.",  # takes no argument, unlike on_success_fn
+)

minitap/mobile_use/tools/scratchpad.py ADDED Viewed

@@ -0,0 +1,147 @@
+from typing import Annotated
+from langchain_core.messages import ToolMessage
+from langchain_core.tools import tool
+from langchain_core.tools.base import BaseTool, InjectedToolCallId
+from langgraph.prebuilt import InjectedState
+from langgraph.types import Command
+from minitap.mobile_use.constants import EXECUTOR_MESSAGES_KEY
+from minitap.mobile_use.context import MobileUseContext
+from minitap.mobile_use.graph.state import State
+from minitap.mobile_use.tools.tool_wrapper import ToolWrapper
+from minitap.mobile_use.utils.logger import get_logger
+logger = get_logger(__name__)  # module-level logger; not referenced by the code visible in this section
+def get_save_note_tool(ctx: MobileUseContext) -> BaseTool:
+    @tool
+    async def save_note(
+        agent_thought: str,
+        key: str,
+        content: str,
+        tool_call_id: Annotated[str, InjectedToolCallId],
+        state: Annotated[State, InjectedState],
+    ):
+        """
+        Saves a text note to persistent memory with the given key.
+        If the key already exists, it will be overwritten.
+        """
+        updated_scratchpad = {**state.scratchpad, key: content}
+        agent_outcome = save_note_wrapper.on_success_fn(key)
+        tool_message = ToolMessage(
+            tool_call_id=tool_call_id,
+            content=agent_outcome,
+            status="success",
+        )
+        return Command(
+            update=await state.asanitize_update(
+                ctx=ctx,
+                update={
+                    "agents_thoughts": [agent_thought, agent_outcome],
+                    EXECUTOR_MESSAGES_KEY: [tool_message],
+                    "scratchpad": updated_scratchpad,
+                },
+                agent="executor",
+            ),
+        )
+    return save_note
+def get_read_note_tool(ctx: MobileUseContext) -> BaseTool:
+    @tool
+    async def read_note(
+        agent_thought: str,
+        key: str,
+        tool_call_id: Annotated[str, InjectedToolCallId],
+        state: Annotated[State, InjectedState],
+    ):
+        """
+        Reads a previously saved note from persistent memory by its key.
+        """
+        content = state.scratchpad.get(key)
+        if content is not None:
+            agent_outcome = read_note_wrapper.on_success_fn(key, content)
+            status = "success"
+        else:
+            agent_outcome = read_note_wrapper.on_failure_fn(key)
+            status = "error"
+        tool_message = ToolMessage(
+            tool_call_id=tool_call_id,
+            content=agent_outcome,
+            status=status,
+        )
+        return Command(
+            update=await state.asanitize_update(
+                ctx=ctx,
+                update={
+                    "agents_thoughts": [agent_thought, agent_outcome],
+                    EXECUTOR_MESSAGES_KEY: [tool_message],
+                },
+                agent="executor",
+            ),
+        )
+    return read_note
+def get_list_notes_tool(ctx: MobileUseContext) -> BaseTool:
+    @tool
+    async def list_notes(
+        agent_thought: str,
+        tool_call_id: Annotated[str, InjectedToolCallId],
+        state: Annotated[State, InjectedState],
+    ):
+        """
+        Lists all note keys currently stored in persistent memory.
+        """
+        keys = list(state.scratchpad.keys())
+        agent_outcome = list_notes_wrapper.on_success_fn(keys)
+        tool_message = ToolMessage(
+            tool_call_id=tool_call_id,
+            content=agent_outcome,
+            status="success",
+        )
+        return Command(
+            update=await state.asanitize_update(
+                ctx=ctx,
+                update={
+                    "agents_thoughts": [agent_thought, agent_outcome],
+                    EXECUTOR_MESSAGES_KEY: [tool_message],
+                },
+                agent="executor",
+            ),
+        )
+    return list_notes
+save_note_wrapper = ToolWrapper(  # pairs the tool factory with its outcome formatters
+    tool_fn_getter=get_save_note_tool,
+    on_success_fn=lambda key: (f"Successfully saved note '{key}'."),
+    on_failure_fn=lambda key: f"Failed to save note '{key}'.",  # not called by save_note as written
+)
+read_note_wrapper = ToolWrapper(  # pairs the tool factory with its outcome formatters
+    tool_fn_getter=get_read_note_tool,
+    on_success_fn=lambda key, content: (  # echoes the key and the full note content
+        f"Successfully read note '{key}'. '{key}' note full content: {content}"
+    ),
+    on_failure_fn=lambda key: f"Note '{key}' not found in scratchpad.",  # used when the key is absent
+)
+list_notes_wrapper = ToolWrapper(  # pairs the tool factory with its outcome formatters
+    tool_fn_getter=get_list_notes_tool,
+    on_success_fn=lambda keys: (  # an empty key list gets a dedicated "no notes" message
+        f"Here are all the note keys: {keys}" if keys else "No notes saved yet."
+    ),
+    on_failure_fn=lambda: "Failed to list notes.",  # not called by list_notes as written
+)