PyPI - optexity-browser-use - Versions diffs - 0.9.5__py3-none-any.whl - Mend

optexity-browser-use 0.9.5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (147) hide show

browser_use/__init__.py +157 -0
browser_use/actor/__init__.py +11 -0
browser_use/actor/element.py +1175 -0
browser_use/actor/mouse.py +134 -0
browser_use/actor/page.py +561 -0
browser_use/actor/playground/flights.py +41 -0
browser_use/actor/playground/mixed_automation.py +54 -0
browser_use/actor/playground/playground.py +236 -0
browser_use/actor/utils.py +176 -0
browser_use/agent/cloud_events.py +282 -0
browser_use/agent/gif.py +424 -0
browser_use/agent/judge.py +170 -0
browser_use/agent/message_manager/service.py +473 -0
browser_use/agent/message_manager/utils.py +52 -0
browser_use/agent/message_manager/views.py +98 -0
browser_use/agent/prompts.py +413 -0
browser_use/agent/service.py +2316 -0
browser_use/agent/system_prompt.md +185 -0
browser_use/agent/system_prompt_flash.md +10 -0
browser_use/agent/system_prompt_no_thinking.md +183 -0
browser_use/agent/views.py +743 -0
browser_use/browser/__init__.py +41 -0
browser_use/browser/cloud/cloud.py +203 -0
browser_use/browser/cloud/views.py +89 -0
browser_use/browser/events.py +578 -0
browser_use/browser/profile.py +1158 -0
browser_use/browser/python_highlights.py +548 -0
browser_use/browser/session.py +3225 -0
browser_use/browser/session_manager.py +399 -0
browser_use/browser/video_recorder.py +162 -0
browser_use/browser/views.py +200 -0
browser_use/browser/watchdog_base.py +260 -0
browser_use/browser/watchdogs/__init__.py +0 -0
browser_use/browser/watchdogs/aboutblank_watchdog.py +253 -0
browser_use/browser/watchdogs/crash_watchdog.py +335 -0
browser_use/browser/watchdogs/default_action_watchdog.py +2729 -0
browser_use/browser/watchdogs/dom_watchdog.py +817 -0
browser_use/browser/watchdogs/downloads_watchdog.py +1277 -0
browser_use/browser/watchdogs/local_browser_watchdog.py +461 -0
browser_use/browser/watchdogs/permissions_watchdog.py +43 -0
browser_use/browser/watchdogs/popups_watchdog.py +143 -0
browser_use/browser/watchdogs/recording_watchdog.py +126 -0
browser_use/browser/watchdogs/screenshot_watchdog.py +62 -0
browser_use/browser/watchdogs/security_watchdog.py +280 -0
browser_use/browser/watchdogs/storage_state_watchdog.py +335 -0
browser_use/cli.py +2359 -0
browser_use/code_use/__init__.py +16 -0
browser_use/code_use/formatting.py +192 -0
browser_use/code_use/namespace.py +665 -0
browser_use/code_use/notebook_export.py +276 -0
browser_use/code_use/service.py +1340 -0
browser_use/code_use/system_prompt.md +574 -0
browser_use/code_use/utils.py +150 -0
browser_use/code_use/views.py +171 -0
browser_use/config.py +505 -0
browser_use/controller/__init__.py +3 -0
browser_use/dom/enhanced_snapshot.py +161 -0
browser_use/dom/markdown_extractor.py +169 -0
browser_use/dom/playground/extraction.py +312 -0
browser_use/dom/playground/multi_act.py +32 -0
browser_use/dom/serializer/clickable_elements.py +200 -0
browser_use/dom/serializer/code_use_serializer.py +287 -0
browser_use/dom/serializer/eval_serializer.py +478 -0
browser_use/dom/serializer/html_serializer.py +212 -0
browser_use/dom/serializer/paint_order.py +197 -0
browser_use/dom/serializer/serializer.py +1170 -0
browser_use/dom/service.py +825 -0
browser_use/dom/utils.py +129 -0
browser_use/dom/views.py +906 -0
browser_use/exceptions.py +5 -0
browser_use/filesystem/__init__.py +0 -0
browser_use/filesystem/file_system.py +619 -0
browser_use/init_cmd.py +376 -0
browser_use/integrations/gmail/__init__.py +24 -0
browser_use/integrations/gmail/actions.py +115 -0
browser_use/integrations/gmail/service.py +225 -0
browser_use/llm/__init__.py +155 -0
browser_use/llm/anthropic/chat.py +242 -0
browser_use/llm/anthropic/serializer.py +312 -0
browser_use/llm/aws/__init__.py +36 -0
browser_use/llm/aws/chat_anthropic.py +242 -0
browser_use/llm/aws/chat_bedrock.py +289 -0
browser_use/llm/aws/serializer.py +257 -0
browser_use/llm/azure/chat.py +91 -0
browser_use/llm/base.py +57 -0
browser_use/llm/browser_use/__init__.py +3 -0
browser_use/llm/browser_use/chat.py +201 -0
browser_use/llm/cerebras/chat.py +193 -0
browser_use/llm/cerebras/serializer.py +109 -0
browser_use/llm/deepseek/chat.py +212 -0
browser_use/llm/deepseek/serializer.py +109 -0
browser_use/llm/exceptions.py +29 -0
browser_use/llm/google/__init__.py +3 -0
browser_use/llm/google/chat.py +542 -0
browser_use/llm/google/serializer.py +120 -0
browser_use/llm/groq/chat.py +229 -0
browser_use/llm/groq/parser.py +158 -0
browser_use/llm/groq/serializer.py +159 -0
browser_use/llm/messages.py +238 -0
browser_use/llm/models.py +271 -0
browser_use/llm/oci_raw/__init__.py +10 -0
browser_use/llm/oci_raw/chat.py +443 -0
browser_use/llm/oci_raw/serializer.py +229 -0
browser_use/llm/ollama/chat.py +97 -0
browser_use/llm/ollama/serializer.py +143 -0
browser_use/llm/openai/chat.py +264 -0
browser_use/llm/openai/like.py +15 -0
browser_use/llm/openai/serializer.py +165 -0
browser_use/llm/openrouter/chat.py +211 -0
browser_use/llm/openrouter/serializer.py +26 -0
browser_use/llm/schema.py +176 -0
browser_use/llm/views.py +48 -0
browser_use/logging_config.py +330 -0
browser_use/mcp/__init__.py +18 -0
browser_use/mcp/__main__.py +12 -0
browser_use/mcp/client.py +544 -0
browser_use/mcp/controller.py +264 -0
browser_use/mcp/server.py +1114 -0
browser_use/observability.py +204 -0
browser_use/py.typed +0 -0
browser_use/sandbox/__init__.py +41 -0
browser_use/sandbox/sandbox.py +637 -0
browser_use/sandbox/views.py +132 -0
browser_use/screenshots/__init__.py +1 -0
browser_use/screenshots/service.py +52 -0
browser_use/sync/__init__.py +6 -0
browser_use/sync/auth.py +357 -0
browser_use/sync/service.py +161 -0
browser_use/telemetry/__init__.py +51 -0
browser_use/telemetry/service.py +112 -0
browser_use/telemetry/views.py +101 -0
browser_use/tokens/__init__.py +0 -0
browser_use/tokens/custom_pricing.py +24 -0
browser_use/tokens/mappings.py +4 -0
browser_use/tokens/service.py +580 -0
browser_use/tokens/views.py +108 -0
browser_use/tools/registry/service.py +572 -0
browser_use/tools/registry/views.py +174 -0
browser_use/tools/service.py +1675 -0
browser_use/tools/utils.py +82 -0
browser_use/tools/views.py +100 -0
browser_use/utils.py +670 -0
optexity_browser_use-0.9.5.dist-info/METADATA +344 -0
optexity_browser_use-0.9.5.dist-info/RECORD +147 -0
optexity_browser_use-0.9.5.dist-info/WHEEL +4 -0
optexity_browser_use-0.9.5.dist-info/entry_points.txt +3 -0
optexity_browser_use-0.9.5.dist-info/licenses/LICENSE +21 -0

browser_use/mcp/client.py ADDED Viewed

@@ -0,0 +1,544 @@
+"""MCP (Model Context Protocol) client integration for browser-use.
+This module provides integration between external MCP servers and browser-use's action registry.
+MCP tools are dynamically discovered and registered as browser-use actions.
+Example usage:
+    from browser_use import Tools
+    from browser_use.mcp.client import MCPClient
+    tools = Tools()
+    # Connect to an MCP server
+    mcp_client = MCPClient(
+        server_name="my-server",
+        command="npx",
+        args=["@mycompany/mcp-server@latest"]
+    )
+    # Register all MCP tools as browser-use actions
+    await mcp_client.register_to_tools(tools)
+    # Now use with Agent as normal - MCP tools are available as actions
+"""
+import asyncio
+import logging
+import time
+from typing import Any
+from pydantic import BaseModel, ConfigDict, Field, create_model
+from browser_use.agent.views import ActionResult
+from browser_use.telemetry import MCPClientTelemetryEvent, ProductTelemetry
+from browser_use.tools.registry.service import Registry
+from browser_use.tools.service import Tools
+from browser_use.utils import get_browser_use_version
+logger = logging.getLogger(__name__)
+# Import MCP SDK
+from mcp import ClientSession, StdioServerParameters, types
+from mcp.client.stdio import stdio_client
+MCP_AVAILABLE = True
+class MCPClient:
+	"""Client for connecting to MCP servers and exposing their tools as browser-use actions."""
+	def __init__(
+		self,
+		server_name: str,
+		command: str,
+		args: list[str] | None = None,
+		env: dict[str, str] | None = None,
+	):
+		"""Initialize MCP client.
+		Args:
+			server_name: Name of the MCP server (for logging and identification)
+			command: Command to start the MCP server (e.g., "npx", "python")
+			args: Arguments for the command (e.g., ["@playwright/mcp@latest"])
+			env: Environment variables for the server process
+		"""
+		self.server_name = server_name
+		self.command = command
+		self.args = args or []
+		self.env = env
+		self.session: ClientSession | None = None
+		self._stdio_task = None
+		self._read_stream = None
+		self._write_stream = None
+		self._tools: dict[str, types.Tool] = {}
+		self._registered_actions: set[str] = set()
+		self._connected = False
+		self._disconnect_event = asyncio.Event()
+		self._telemetry = ProductTelemetry()
+	async def connect(self) -> None:
+		"""Connect to the MCP server and discover available tools."""
+		if self._connected:
+			logger.debug(f'Already connected to {self.server_name}')
+			return
+		start_time = time.time()
+		error_msg = None
+		try:
+			logger.info(f"🔌 Connecting to MCP server '{self.server_name}': {self.command} {' '.join(self.args)}")
+			# Create server parameters
+			server_params = StdioServerParameters(command=self.command, args=self.args, env=self.env)
+			# Start stdio client in background task
+			self._stdio_task = asyncio.create_task(self._run_stdio_client(server_params))
+			# Wait for connection to be established
+			retries = 0
+			max_retries = 100  # 10 second timeout (increased for parallel test execution)
+			while not self._connected and retries < max_retries:
+				await asyncio.sleep(0.1)
+				retries += 1
+			if not self._connected:
+				error_msg = f"Failed to connect to MCP server '{self.server_name}' after {max_retries * 0.1} seconds"
+				raise RuntimeError(error_msg)
+			logger.info(f"📦 Discovered {len(self._tools)} tools from '{self.server_name}': {list(self._tools.keys())}")
+		except Exception as e:
+			error_msg = str(e)
+			raise
+		finally:
+			# Capture telemetry for connect action
+			duration = time.time() - start_time
+			self._telemetry.capture(
+				MCPClientTelemetryEvent(
+					server_name=self.server_name,
+					command=self.command,
+					tools_discovered=len(self._tools),
+					version=get_browser_use_version(),
+					action='connect',
+					duration_seconds=duration,
+					error_message=error_msg,
+				)
+			)
+	async def _run_stdio_client(self, server_params: StdioServerParameters):
+		"""Run the stdio client connection in a background task."""
+		try:
+			async with stdio_client(server_params) as (read_stream, write_stream):
+				self._read_stream = read_stream
+				self._write_stream = write_stream
+				# Create and initialize session
+				async with ClientSession(read_stream, write_stream) as session:
+					self.session = session
+					# Initialize the connection
+					await session.initialize()
+					# Discover available tools
+					tools_response = await session.list_tools()
+					self._tools = {tool.name: tool for tool in tools_response.tools}
+					# Mark as connected
+					self._connected = True
+					# Keep the connection alive until disconnect is called
+					await self._disconnect_event.wait()
+		except Exception as e:
+			logger.error(f'MCP server connection error: {e}')
+			self._connected = False
+			raise
+		finally:
+			self._connected = False
+			self.session = None
+	async def disconnect(self) -> None:
+		"""Disconnect from the MCP server."""
+		if not self._connected:
+			return
+		start_time = time.time()
+		error_msg = None
+		try:
+			logger.info(f"🔌 Disconnecting from MCP server '{self.server_name}'")
+			# Signal disconnect
+			self._connected = False
+			self._disconnect_event.set()
+			# Wait for stdio task to finish
+			if self._stdio_task:
+				try:
+					await asyncio.wait_for(self._stdio_task, timeout=2.0)
+				except TimeoutError:
+					logger.warning(f"Timeout waiting for MCP server '{self.server_name}' to disconnect")
+					self._stdio_task.cancel()
+					try:
+						await self._stdio_task
+					except asyncio.CancelledError:
+						pass
+			self._tools.clear()
+			self._registered_actions.clear()
+		except Exception as e:
+			error_msg = str(e)
+			logger.error(f'Error disconnecting from MCP server: {e}')
+		finally:
+			# Capture telemetry for disconnect action
+			duration = time.time() - start_time
+			self._telemetry.capture(
+				MCPClientTelemetryEvent(
+					server_name=self.server_name,
+					command=self.command,
+					tools_discovered=0,  # Tools cleared on disconnect
+					version=get_browser_use_version(),
+					action='disconnect',
+					duration_seconds=duration,
+					error_message=error_msg,
+				)
+			)
+			self._telemetry.flush()
+	async def register_to_tools(
+		self,
+		tools: Tools,
+		tool_filter: list[str] | None = None,
+		prefix: str | None = None,
+	) -> None:
+		"""Register MCP tools as actions in the browser-use tools.
+		Args:
+			tools: Browser-use tools to register actions to
+			tool_filter: Optional list of tool names to register (None = all tools)
+			prefix: Optional prefix to add to action names (e.g., "playwright_")
+		"""
+		if not self._connected:
+			await self.connect()
+		registry = tools.registry
+		for tool_name, tool in self._tools.items():
+			# Skip if not in filter
+			if tool_filter and tool_name not in tool_filter:
+				continue
+			# Apply prefix if specified
+			action_name = f'{prefix}{tool_name}' if prefix else tool_name
+			# Skip if already registered
+			if action_name in self._registered_actions:
+				continue
+			# Register the tool as an action
+			self._register_tool_as_action(registry, action_name, tool)
+			self._registered_actions.add(action_name)
+		logger.info(f"✅ Registered {len(self._registered_actions)} MCP tools from '{self.server_name}' as browser-use actions")
+	def _register_tool_as_action(self, registry: Registry, action_name: str, tool: Any) -> None:
+		"""Register a single MCP tool as a browser-use action.
+		Args:
+			registry: Browser-use registry to register action to
+			action_name: Name for the registered action
+			tool: MCP Tool object with schema information
+		"""
+		# Parse tool parameters to create Pydantic model
+		param_fields = {}
+		if tool.inputSchema:
+			# MCP tools use JSON Schema for parameters
+			properties = tool.inputSchema.get('properties', {})
+			required = set(tool.inputSchema.get('required', []))
+			for param_name, param_schema in properties.items():
+				# Convert JSON Schema type to Python type
+				param_type = self._json_schema_to_python_type(param_schema, f'{action_name}_{param_name}')
+				# Determine if field is required and handle defaults
+				if param_name in required:
+					default = ...  # Required field
+				else:
+					# Optional field - make type optional and handle default
+					param_type = param_type | None
+					if 'default' in param_schema:
+						default = param_schema['default']
+					else:
+						default = None
+				# Add field with description if available
+				field_kwargs = {}
+				if 'description' in param_schema:
+					field_kwargs['description'] = param_schema['description']
+				param_fields[param_name] = (param_type, Field(default, **field_kwargs))
+		# Create Pydantic model for the tool parameters
+		if param_fields:
+			# Create a BaseModel class with proper configuration
+			class ConfiguredBaseModel(BaseModel):
+				model_config = ConfigDict(extra='forbid', validate_by_name=True, validate_by_alias=True)
+			param_model = create_model(f'{action_name}_Params', __base__=ConfiguredBaseModel, **param_fields)
+		else:
+			# No parameters - create empty model
+			param_model = None
+		# Determine if this is a browser-specific tool
+		is_browser_tool = tool.name.startswith('browser_') or 'page' in tool.name.lower()
+		# Set up action filters
+		domains = None
+		# Note: page_filter has been removed since we no longer use Page objects
+		# Browser tools filtering would need to be done via domain filters instead
+		# Create async wrapper function for the MCP tool
+		# Need to define function with explicit parameters to satisfy registry validation
+		if param_model:
+			# Type 1: Function takes param model as first parameter
+			async def mcp_action_wrapper(params: param_model) -> ActionResult:  # type: ignore[no-redef]
+				"""Wrapper function that calls the MCP tool."""
+				if not self.session or not self._connected:
+					return ActionResult(error=f"MCP server '{self.server_name}' not connected", success=False)
+				# Convert pydantic model to dict for MCP call
+				tool_params = params.model_dump(exclude_none=True)
+				logger.debug(f"🔧 Calling MCP tool '{tool.name}' with params: {tool_params}")
+				start_time = time.time()
+				error_msg = None
+				try:
+					# Call the MCP tool
+					result = await self.session.call_tool(tool.name, tool_params)
+					# Convert MCP result to ActionResult
+					extracted_content = self._format_mcp_result(result)
+					return ActionResult(
+						extracted_content=extracted_content,
+						long_term_memory=f"Used MCP tool '{tool.name}' from {self.server_name}",
+					)
+				except Exception as e:
+					error_msg = f"MCP tool '{tool.name}' failed: {str(e)}"
+					logger.error(error_msg)
+					return ActionResult(error=error_msg, success=False)
+				finally:
+					# Capture telemetry for tool call
+					duration = time.time() - start_time
+					self._telemetry.capture(
+						MCPClientTelemetryEvent(
+							server_name=self.server_name,
+							command=self.command,
+							tools_discovered=len(self._tools),
+							version=get_browser_use_version(),
+							action='tool_call',
+							tool_name=tool.name,
+							duration_seconds=duration,
+							error_message=error_msg,
+						)
+					)
+		else:
+			# No parameters - empty function signature
+			async def mcp_action_wrapper() -> ActionResult:  # type: ignore[no-redef]
+				"""Wrapper function that calls the MCP tool."""
+				if not self.session or not self._connected:
+					return ActionResult(error=f"MCP server '{self.server_name}' not connected", success=False)
+				logger.debug(f"🔧 Calling MCP tool '{tool.name}' with no params")
+				start_time = time.time()
+				error_msg = None
+				try:
+					# Call the MCP tool with empty params
+					result = await self.session.call_tool(tool.name, {})
+					# Convert MCP result to ActionResult
+					extracted_content = self._format_mcp_result(result)
+					return ActionResult(
+						extracted_content=extracted_content,
+						long_term_memory=f"Used MCP tool '{tool.name}' from {self.server_name}",
+					)
+				except Exception as e:
+					error_msg = f"MCP tool '{tool.name}' failed: {str(e)}"
+					logger.error(error_msg)
+					return ActionResult(error=error_msg, success=False)
+				finally:
+					# Capture telemetry for tool call
+					duration = time.time() - start_time
+					self._telemetry.capture(
+						MCPClientTelemetryEvent(
+							server_name=self.server_name,
+							command=self.command,
+							tools_discovered=len(self._tools),
+							version=get_browser_use_version(),
+							action='tool_call',
+							tool_name=tool.name,
+							duration_seconds=duration,
+							error_message=error_msg,
+						)
+					)
+		# Set function metadata for better debugging
+		mcp_action_wrapper.__name__ = action_name
+		mcp_action_wrapper.__qualname__ = f'mcp.{self.server_name}.{action_name}'
+		# Register the action with browser-use
+		description = tool.description or f'MCP tool from {self.server_name}: {tool.name}'
+		# Use the registry's action decorator
+		registry.action(description=description, param_model=param_model, domains=domains)(mcp_action_wrapper)
+		logger.debug(f"✅ Registered MCP tool '{tool.name}' as action '{action_name}'")
+	def _format_mcp_result(self, result: Any) -> str:
+		"""Format MCP tool result into a string for ActionResult.
+		Args:
+			result: Raw result from MCP tool call
+		Returns:
+			Formatted string representation of the result
+		"""
+		# Handle different MCP result formats
+		if hasattr(result, 'content'):
+			# Structured content response
+			if isinstance(result.content, list):
+				# Multiple content items
+				parts = []
+				for item in result.content:
+					if hasattr(item, 'text'):
+						parts.append(item.text)
+					elif hasattr(item, 'type') and item.type == 'text':
+						parts.append(str(item))
+					else:
+						parts.append(str(item))
+				return '\n'.join(parts)
+			else:
+				return str(result.content)
+		elif isinstance(result, list):
+			# List of content items
+			parts = []
+			for item in result:
+				if hasattr(item, 'text'):
+					parts.append(item.text)
+				else:
+					parts.append(str(item))
+			return '\n'.join(parts)
+		else:
+			# Direct result or unknown format
+			return str(result)
+	def _json_schema_to_python_type(self, schema: dict, model_name: str = 'NestedModel') -> Any:
+		"""Convert JSON Schema type to Python type.
+		Args:
+			schema: JSON Schema definition
+			model_name: Name for nested models
+		Returns:
+			Python type corresponding to the schema
+		"""
+		json_type = schema.get('type', 'string')
+		# Basic type mapping
+		type_mapping = {
+			'string': str,
+			'number': float,
+			'integer': int,
+			'boolean': bool,
+			'array': list,
+			'null': type(None),
+		}
+		# Handle enums (they're still strings)
+		if 'enum' in schema:
+			return str
+		# Handle objects with nested properties
+		if json_type == 'object':
+			properties = schema.get('properties', {})
+			if properties:
+				# Create nested pydantic model for objects with properties
+				nested_fields = {}
+				required_fields = set(schema.get('required', []))
+				for prop_name, prop_schema in properties.items():
+					# Recursively process nested properties
+					prop_type = self._json_schema_to_python_type(prop_schema, f'{model_name}_{prop_name}')
+					# Determine if field is required and handle defaults
+					if prop_name in required_fields:
+						default = ...  # Required field
+					else:
+						# Optional field - make type optional and handle default
+						prop_type = prop_type | None
+						if 'default' in prop_schema:
+							default = prop_schema['default']
+						else:
+							default = None
+					# Add field with description if available
+					field_kwargs = {}
+					if 'description' in prop_schema:
+						field_kwargs['description'] = prop_schema['description']
+					nested_fields[prop_name] = (prop_type, Field(default, **field_kwargs))
+				# Create a BaseModel class with proper configuration
+				class ConfiguredBaseModel(BaseModel):
+					model_config = ConfigDict(extra='forbid', validate_by_name=True, validate_by_alias=True)
+				try:
+					# Create and return nested pydantic model
+					return create_model(model_name, __base__=ConfiguredBaseModel, **nested_fields)
+				except Exception as e:
+					logger.error(f'Failed to create nested model {model_name}: {e}')
+					logger.debug(f'Fields: {nested_fields}')
+					# Fallback to basic dict if model creation fails
+					return dict
+			else:
+				# Object without properties - just return dict
+				return dict
+		# Handle arrays with specific item types
+		if json_type == 'array':
+			if 'items' in schema:
+				# Get the item type recursively
+				item_type = self._json_schema_to_python_type(schema['items'], f'{model_name}_item')
+				# Return properly typed list
+				return list[item_type]
+			else:
+				# Array without item type specification
+				return list
+		# Get base type for non-object types
+		base_type = type_mapping.get(json_type, str)
+		# Handle nullable/optional types
+		if schema.get('nullable', False) or json_type == 'null':
+			return base_type | None
+		return base_type
+	async def __aenter__(self):
+		"""Async context manager entry: connect to the server and return this client."""
+		# connect() returns early when a connection is already active
+		await self.connect()
+		return self
+	async def __aexit__(self, exc_type, exc_val, exc_tb):
+		"""Async context manager exit: disconnect from the server.
+		The exception arguments are ignored and nothing is returned, so an exception raised
+		inside the `async with` body is not suppressed.
+		"""
+		await self.disconnect()