PyPI - optexity-browser-use - Versions diffs - 0.9.5__py3-none-any.whl - Mend

optexity-browser-use 0.9.5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (147) hide show

browser_use/__init__.py +157 -0
browser_use/actor/__init__.py +11 -0
browser_use/actor/element.py +1175 -0
browser_use/actor/mouse.py +134 -0
browser_use/actor/page.py +561 -0
browser_use/actor/playground/flights.py +41 -0
browser_use/actor/playground/mixed_automation.py +54 -0
browser_use/actor/playground/playground.py +236 -0
browser_use/actor/utils.py +176 -0
browser_use/agent/cloud_events.py +282 -0
browser_use/agent/gif.py +424 -0
browser_use/agent/judge.py +170 -0
browser_use/agent/message_manager/service.py +473 -0
browser_use/agent/message_manager/utils.py +52 -0
browser_use/agent/message_manager/views.py +98 -0
browser_use/agent/prompts.py +413 -0
browser_use/agent/service.py +2316 -0
browser_use/agent/system_prompt.md +185 -0
browser_use/agent/system_prompt_flash.md +10 -0
browser_use/agent/system_prompt_no_thinking.md +183 -0
browser_use/agent/views.py +743 -0
browser_use/browser/__init__.py +41 -0
browser_use/browser/cloud/cloud.py +203 -0
browser_use/browser/cloud/views.py +89 -0
browser_use/browser/events.py +578 -0
browser_use/browser/profile.py +1158 -0
browser_use/browser/python_highlights.py +548 -0
browser_use/browser/session.py +3225 -0
browser_use/browser/session_manager.py +399 -0
browser_use/browser/video_recorder.py +162 -0
browser_use/browser/views.py +200 -0
browser_use/browser/watchdog_base.py +260 -0
browser_use/browser/watchdogs/__init__.py +0 -0
browser_use/browser/watchdogs/aboutblank_watchdog.py +253 -0
browser_use/browser/watchdogs/crash_watchdog.py +335 -0
browser_use/browser/watchdogs/default_action_watchdog.py +2729 -0
browser_use/browser/watchdogs/dom_watchdog.py +817 -0
browser_use/browser/watchdogs/downloads_watchdog.py +1277 -0
browser_use/browser/watchdogs/local_browser_watchdog.py +461 -0
browser_use/browser/watchdogs/permissions_watchdog.py +43 -0
browser_use/browser/watchdogs/popups_watchdog.py +143 -0
browser_use/browser/watchdogs/recording_watchdog.py +126 -0
browser_use/browser/watchdogs/screenshot_watchdog.py +62 -0
browser_use/browser/watchdogs/security_watchdog.py +280 -0
browser_use/browser/watchdogs/storage_state_watchdog.py +335 -0
browser_use/cli.py +2359 -0
browser_use/code_use/__init__.py +16 -0
browser_use/code_use/formatting.py +192 -0
browser_use/code_use/namespace.py +665 -0
browser_use/code_use/notebook_export.py +276 -0
browser_use/code_use/service.py +1340 -0
browser_use/code_use/system_prompt.md +574 -0
browser_use/code_use/utils.py +150 -0
browser_use/code_use/views.py +171 -0
browser_use/config.py +505 -0
browser_use/controller/__init__.py +3 -0
browser_use/dom/enhanced_snapshot.py +161 -0
browser_use/dom/markdown_extractor.py +169 -0
browser_use/dom/playground/extraction.py +312 -0
browser_use/dom/playground/multi_act.py +32 -0
browser_use/dom/serializer/clickable_elements.py +200 -0
browser_use/dom/serializer/code_use_serializer.py +287 -0
browser_use/dom/serializer/eval_serializer.py +478 -0
browser_use/dom/serializer/html_serializer.py +212 -0
browser_use/dom/serializer/paint_order.py +197 -0
browser_use/dom/serializer/serializer.py +1170 -0
browser_use/dom/service.py +825 -0
browser_use/dom/utils.py +129 -0
browser_use/dom/views.py +906 -0
browser_use/exceptions.py +5 -0
browser_use/filesystem/__init__.py +0 -0
browser_use/filesystem/file_system.py +619 -0
browser_use/init_cmd.py +376 -0
browser_use/integrations/gmail/__init__.py +24 -0
browser_use/integrations/gmail/actions.py +115 -0
browser_use/integrations/gmail/service.py +225 -0
browser_use/llm/__init__.py +155 -0
browser_use/llm/anthropic/chat.py +242 -0
browser_use/llm/anthropic/serializer.py +312 -0
browser_use/llm/aws/__init__.py +36 -0
browser_use/llm/aws/chat_anthropic.py +242 -0
browser_use/llm/aws/chat_bedrock.py +289 -0
browser_use/llm/aws/serializer.py +257 -0
browser_use/llm/azure/chat.py +91 -0
browser_use/llm/base.py +57 -0
browser_use/llm/browser_use/__init__.py +3 -0
browser_use/llm/browser_use/chat.py +201 -0
browser_use/llm/cerebras/chat.py +193 -0
browser_use/llm/cerebras/serializer.py +109 -0
browser_use/llm/deepseek/chat.py +212 -0
browser_use/llm/deepseek/serializer.py +109 -0
browser_use/llm/exceptions.py +29 -0
browser_use/llm/google/__init__.py +3 -0
browser_use/llm/google/chat.py +542 -0
browser_use/llm/google/serializer.py +120 -0
browser_use/llm/groq/chat.py +229 -0
browser_use/llm/groq/parser.py +158 -0
browser_use/llm/groq/serializer.py +159 -0
browser_use/llm/messages.py +238 -0
browser_use/llm/models.py +271 -0
browser_use/llm/oci_raw/__init__.py +10 -0
browser_use/llm/oci_raw/chat.py +443 -0
browser_use/llm/oci_raw/serializer.py +229 -0
browser_use/llm/ollama/chat.py +97 -0
browser_use/llm/ollama/serializer.py +143 -0
browser_use/llm/openai/chat.py +264 -0
browser_use/llm/openai/like.py +15 -0
browser_use/llm/openai/serializer.py +165 -0
browser_use/llm/openrouter/chat.py +211 -0
browser_use/llm/openrouter/serializer.py +26 -0
browser_use/llm/schema.py +176 -0
browser_use/llm/views.py +48 -0
browser_use/logging_config.py +330 -0
browser_use/mcp/__init__.py +18 -0
browser_use/mcp/__main__.py +12 -0
browser_use/mcp/client.py +544 -0
browser_use/mcp/controller.py +264 -0
browser_use/mcp/server.py +1114 -0
browser_use/observability.py +204 -0
browser_use/py.typed +0 -0
browser_use/sandbox/__init__.py +41 -0
browser_use/sandbox/sandbox.py +637 -0
browser_use/sandbox/views.py +132 -0
browser_use/screenshots/__init__.py +1 -0
browser_use/screenshots/service.py +52 -0
browser_use/sync/__init__.py +6 -0
browser_use/sync/auth.py +357 -0
browser_use/sync/service.py +161 -0
browser_use/telemetry/__init__.py +51 -0
browser_use/telemetry/service.py +112 -0
browser_use/telemetry/views.py +101 -0
browser_use/tokens/__init__.py +0 -0
browser_use/tokens/custom_pricing.py +24 -0
browser_use/tokens/mappings.py +4 -0
browser_use/tokens/service.py +580 -0
browser_use/tokens/views.py +108 -0
browser_use/tools/registry/service.py +572 -0
browser_use/tools/registry/views.py +174 -0
browser_use/tools/service.py +1675 -0
browser_use/tools/utils.py +82 -0
browser_use/tools/views.py +100 -0
browser_use/utils.py +670 -0
optexity_browser_use-0.9.5.dist-info/METADATA +344 -0
optexity_browser_use-0.9.5.dist-info/RECORD +147 -0
optexity_browser_use-0.9.5.dist-info/WHEEL +4 -0
optexity_browser_use-0.9.5.dist-info/entry_points.txt +3 -0
optexity_browser_use-0.9.5.dist-info/licenses/LICENSE +21 -0

browser_use/code_use/utils.py ADDED Viewed

@@ -0,0 +1,150 @@
+"""Utility functions for code-use agent."""
+import re
+def truncate_message_content(content: str, max_length: int = 10000) -> str:
+	"""Return content unchanged when it fits in max_length characters, otherwise its head plus a truncation note."""
+	overflow = len(content) - max_length
+	if overflow <= 0:
+		return content
+	# Keep the first max_length characters and record how many were dropped
+	marker = f'\n\n[... truncated {overflow} characters for history]'
+	return content[:max_length] + marker
+def detect_token_limit_issue(
+	completion: str,
+	completion_tokens: int | None,
+	max_tokens: int | None,
+	stop_reason: str | None,
+) -> tuple[bool, str | None]:
+	"""
+	Flag LLM responses that were cut off by a token limit or ended in repetition.
+	Three checks run in order and the first one that fires decides the result:
+	1. stop_reason equals 'max_tokens'
+	2. completion_tokens is at least 90% of a positive max_tokens
+	3. the final 6 characters of completion occur 40 or more times in it
+	Returns: (is_problematic, error_message); error_message is None when nothing fired
+	"""
+	# 1) The provider explicitly reported hitting the limit
+	if stop_reason == 'max_tokens':
+		return True, f'Response terminated due to max_tokens limit (stop_reason: {stop_reason})'
+	# 2) Token budget nearly exhausted; skipped unless both counts are known and the budget is positive
+	if completion_tokens is not None and max_tokens is not None:
+		if max_tokens > 0:
+			usage_ratio = completion_tokens / max_tokens
+			if usage_ratio >= 0.9:
+				return True, f'Response used {usage_ratio:.1%} of max_tokens ({completion_tokens}/{max_tokens})'
+	# 3) Repetition: a 6-character tail only exists when the completion has at least 6 characters
+	tail = completion[-6:]
+	if len(tail) == 6:
+		occurrences = completion.count(tail)
+		if occurrences >= 40:
+			return True, f'Repetitive output detected: last 6 chars "{tail}" appears {occurrences} times'
+	return False, None
+def extract_url_from_task(task: str) -> str | None:
+	"""Extract the single URL mentioned in a task string using naive pattern matching.
+	Email addresses are removed first so their domains are not mistaken for sites.
+	Full http(s) URLs are collected, then bare domains (e.g. 'example.com/path') are
+	searched only in the text that is left once those full URLs are blanked out.
+	Bare domains get an 'https://' prefix and trailing punctuation is stripped.
+	Returns the URL when exactly one distinct URL is found, otherwise None
+	(no URL at all, or several URLs, which would make auto-navigation ambiguous).
+	"""
+	# Remove email addresses from task before looking for URLs
+	task_without_emails = re.sub(r'\b[A-Za-z0-9._%+-]+@[A-Za-z0-9.-]+\.[A-Za-z]{2,}\b', '', task)
+	full_url_pattern = r'https?://[^\s<>"\']+'  # Full URLs with http/https
+	bare_domain_pattern = r'(?:www\.)?[a-zA-Z0-9-]+(?:\.[a-zA-Z0-9-]+)*\.[a-zA-Z]{2,}(?:/[^\s<>"\']*)?'  # Domain names with subdomains and optional paths
+	candidates = re.findall(full_url_pattern, task_without_emails)
+	# Blank out the full URLs before the bare-domain pass. Otherwise the host of
+	# 'http://example.com' or 'https://example.com:8080/x' is matched a second time,
+	# re-prefixed with https:// and counted as a different URL, forcing a None result.
+	remaining_text = re.sub(full_url_pattern, ' ', task_without_emails)
+	candidates += re.findall(bare_domain_pattern, remaining_text)
+	unique_urls: set[str] = set()
+	for url in candidates:
+		# Remove trailing punctuation that's not part of URLs
+		url = re.sub(r'[.,;:!?()\[\]]+$', '', url)
+		# Add https:// if missing
+		if not url.startswith(('http://', 'https://')):
+			url = 'https://' + url
+		unique_urls.add(url)
+	# Only an unambiguous single URL is returned; zero or several both give None
+	if len(unique_urls) == 1:
+		return next(iter(unique_urls))
+	return None
+def extract_code_blocks(text: str) -> dict[str, str]:
+	"""Extract all code blocks from markdown response.
+	Supports:
+	- ```python, ```js, ```javascript, ```bash, ```sh, ```shell, ```markdown, ```md
+	- Named blocks: ```js variable_name → saved as 'variable_name' in namespace
+	- Nested blocks: Use 4+ backticks for outer block when inner content has 3 backticks
+	Returns dict mapping block_name -> content:
+	- named blocks are keyed by their variable name
+	- unnamed python blocks are keyed 'python_0', 'python_1', ... and 'python' aliases 'python_0'
+	- unnamed js/bash/markdown blocks are keyed by normalized language, last one wins
+	- when no unnamed python block exists, untagged ``` blocks are joined and stored as 'python'
+	Blocks with an unrecognized language tag or empty content are skipped.
+	Note: Python blocks are NO LONGER COMBINED. Each python block executes separately
+	to allow sequential execution with JS/bash blocks in between.
+	"""
+	# Every accepted fence tag mapped to its canonical language; anything else is skipped
+	language_aliases = {
+		'python': 'python',
+		'js': 'js',
+		'javascript': 'js',
+		'bash': 'bash',
+		'sh': 'bash',
+		'shell': 'bash',
+		'markdown': 'markdown',
+		'md': 'markdown',
+	}
+	# Matches: ```lang\n or ```lang varname\n or ````+lang\n (4+ backticks for nested blocks)
+	# The backreference \1 makes the closing fence use the same number of backticks as the opening one
+	# The name separator is [ \t]+ rather than \s+ so a newline can never be consumed as the
+	# separator (which would turn a one-word first code line into the block name);
+	# [ \t]* tolerates trailing spaces after the tag
+	pattern = r'(`{3,})(\w+)(?:[ \t]+(\w+))?[ \t]*\n(.*?)\1(?:\n|$)'
+	blocks: dict[str, str] = {}
+	python_block_counter = 0
+	for _backticks, lang, var_name, content in re.findall(pattern, text, re.DOTALL):
+		lang_normalized = language_aliases.get(lang.lower())
+		if lang_normalized is None:
+			# Unknown language, skip
+			continue
+		content = content.rstrip()  # Only strip trailing whitespace, preserve leading for indentation
+		if not content:
+			continue
+		if var_name:
+			# Named block - use the variable name
+			blocks[var_name] = content
+		elif lang_normalized == 'python':
+			# Unnamed Python blocks - give each a unique key to preserve order
+			blocks[f'python_{python_block_counter}'] = content
+			python_block_counter += 1
+		else:
+			# Other unnamed blocks (js, bash, markdown) - keep last one only
+			blocks[lang_normalized] = content
+	if python_block_counter > 0:
+		# Mark the first unnamed python block as 'python' for backward compat
+		blocks['python'] = blocks['python_0']
+	elif 'python' not in blocks:
+		# Fallback: if no python block but there's generic ``` block, treat as python
+		generic_matches = re.findall(r'```\n(.*?)```', text, re.DOTALL)
+		combined = '\n\n'.join(m.strip() for m in generic_matches if m.strip())
+		if combined:
+			blocks['python'] = combined
+	return blocks

browser_use/code_use/views.py ADDED Viewed

@@ -0,0 +1,171 @@
+"""Data models for code-use mode."""
+from enum import Enum
+from typing import Any
+from pydantic import BaseModel, ConfigDict, Field
+from uuid_extensions import uuid7str
+class CellType(str, Enum):
+	"""Type of notebook cell."""
+	# str mixin: each member is also a str equal to its value
+	# CODE is the default cell_type of CodeCell
+	CODE = 'code'
+	MARKDOWN = 'markdown'
+class ExecutionStatus(str, Enum):
+	"""Execution status of a cell."""
+	# str mixin: each member is also a str equal to its value
+	# PENDING is the default status of a newly created CodeCell
+	PENDING = 'pending'
+	RUNNING = 'running'
+	SUCCESS = 'success'
+	ERROR = 'error'
+class CodeCell(BaseModel):
+	"""Represents a code cell in the notebook-like execution."""
+	# extra='forbid': passing a field that is not declared below is a validation error
+	model_config = ConfigDict(extra='forbid')
+	# Generated per instance by calling uuid7str when no id is supplied
+	id: str = Field(default_factory=uuid7str)
+	cell_type: CellType = CellType.CODE
+	# The only field without a default, so it must be provided on construction
+	source: str = Field(description='The code to execute')
+	# The remaining fields start empty/PENDING; presumably filled in by whatever runs the cell
+	# (that code is not in this file) - TODO confirm
+	output: str | None = Field(default=None, description='The output of the code execution')
+	execution_count: int | None = Field(default=None, description='The execution count')
+	status: ExecutionStatus = Field(default=ExecutionStatus.PENDING)
+	error: str | None = Field(default=None, description='Error message if execution failed')
+	browser_state: str | None = Field(default=None, description='Browser state after execution')
+class NotebookSession(BaseModel):
+	"""Represents a notebook-like session."""
+	# extra='forbid': passing a field that is not declared below is a validation error
+	model_config = ConfigDict(extra='forbid')
+	id: str = Field(default_factory=uuid7str)
+	cells: list[CodeCell] = Field(default_factory=list)
+	current_execution_count: int = Field(default=0)
+	namespace: dict[str, Any] = Field(default_factory=dict, description='Current namespace state')
+	def add_cell(self, source: str) -> CodeCell:
+		"""Create a CodeCell from source, append it to cells and return it."""
+		new_cell = CodeCell(source=source)
+		self.cells.append(new_cell)
+		return new_cell
+	def get_cell(self, cell_id: str) -> CodeCell | None:
+		"""Return the first cell whose id equals cell_id, or None when no cell matches."""
+		return next((candidate for candidate in self.cells if candidate.id == cell_id), None)
+	def get_latest_cell(self) -> CodeCell | None:
+		"""Return the last cell in cells, or None when the session has no cells."""
+		return self.cells[-1] if self.cells else None
+	def increment_execution_count(self) -> int:
+		"""Raise current_execution_count by one and return the new value."""
+		next_count = self.current_execution_count + 1
+		self.current_execution_count = next_count
+		return next_count
+class NotebookExport(BaseModel):
+	"""Export format for Jupyter notebook."""
+	# extra='forbid': passing a field that is not declared below is a validation error
+	model_config = ConfigDict(extra='forbid')
+	# Defaults describe notebook format version 4.5 (nbformat=4, nbformat_minor=5)
+	nbformat: int = Field(default=4)
+	nbformat_minor: int = Field(default=5)
+	metadata: dict[str, Any] = Field(default_factory=dict)
+	# Cells are plain dicts here, not CodeCell models
+	cells: list[dict[str, Any]] = Field(default_factory=list)
+class CodeAgentModelOutput(BaseModel):
+	"""Model output for CodeAgent - contains the code and full LLM response."""
+	# extra='forbid': passing a field that is not declared below is a validation error
+	model_config = ConfigDict(extra='forbid')
+	# Both fields are required (no defaults)
+	model_output: str = Field(description='The extracted code from the LLM response')
+	full_response: str = Field(description='The complete LLM response including any text/reasoning')
+class CodeAgentResult(BaseModel):
+	"""Result of executing a code cell in CodeAgent."""
+	# extra='forbid': passing a field that is not declared below is a validation error
+	model_config = ConfigDict(extra='forbid')
+	# Every field is optional; a default-constructed result has no content, no error and is_done=False
+	extracted_content: str | None = Field(default=None, description='Output from code execution')
+	error: str | None = Field(default=None, description='Error message if execution failed')
+	is_done: bool = Field(default=False, description='Whether task is marked as done')
+	# Tri-state: None by default, otherwise True/False
+	success: bool | None = Field(default=None, description='Self-reported success from done() call')
+class CodeAgentState(BaseModel):
+	"""State information for a CodeAgent step."""
+	model_config = ConfigDict(extra='forbid', arbitrary_types_allowed=True)
+	url: str | None = Field(default=None, description='Current page URL')
+	title: str | None = Field(default=None, description='Current page title')
+	screenshot_path: str | None = Field(default=None, description='Path to screenshot file')
+	def get_screenshot(self) -> str | None:
+		"""Read the file at screenshot_path and return its bytes base64-encoded as a str.
+		Returns None when screenshot_path is unset or empty, when the file does not
+		exist, or when reading or encoding it raises.
+		"""
+		import base64
+		from pathlib import Path
+		if not self.screenshot_path:
+			return None
+		screenshot_file = Path(self.screenshot_path)
+		if not screenshot_file.exists():
+			return None
+		# Best effort: any failure while reading or encoding is reported as "no screenshot"
+		try:
+			raw_bytes = screenshot_file.read_bytes()
+			return base64.b64encode(raw_bytes).decode('utf-8')
+		except Exception:
+			return None
+class CodeAgentStepMetadata(BaseModel):
+	"""Metadata for a single CodeAgent step including timing and token information."""
+	# extra='forbid': passing a field that is not declared below is a validation error
+	model_config = ConfigDict(extra='forbid')
+	# Token counts are optional and default to None
+	input_tokens: int | None = Field(default=None, description='Number of input tokens used')
+	output_tokens: int | None = Field(default=None, description='Number of output tokens used')
+	# Both timestamps are required (no defaults)
+	step_start_time: float = Field(description='Step start timestamp (Unix time)')
+	step_end_time: float = Field(description='Step end timestamp (Unix time)')
+	@property
+	def duration_seconds(self) -> float:
+		"""Return step_end_time minus step_start_time.
+		No ordering of the two timestamps is enforced here, so the result is negative
+		when step_end_time is earlier than step_start_time.
+		"""
+		return self.step_end_time - self.step_start_time
+class CodeAgentHistory(BaseModel):
+	"""History item for CodeAgent actions."""
+	model_config = ConfigDict(extra='forbid', arbitrary_types_allowed=True)
+	model_output: CodeAgentModelOutput | None = Field(default=None, description='LLM output for this step')
+	result: list[CodeAgentResult] = Field(default_factory=list, description='Results from code execution')
+	state: CodeAgentState = Field(description='Browser state at this step')
+	metadata: CodeAgentStepMetadata | None = Field(default=None, description='Step timing and token metadata')
+	screenshot_path: str | None = Field(default=None, description='Legacy field for screenshot path')
+	def model_dump(self, **kwargs) -> dict[str, Any]:
+		"""Serialize this history item to a dict with a fixed set of five keys.
+		Nested models are dumped with their own default model_dump(); model_output and
+		metadata become None when unset. Keyword arguments are accepted so the method
+		has the same call shape as BaseModel.model_dump, but they are not used and are
+		not forwarded to the nested dumps.
+		"""
+		output_dump = self.model_output.model_dump() if self.model_output else None
+		result_dumps = [item.model_dump() for item in self.result]
+		state_dump = self.state.model_dump()
+		metadata_dump = self.metadata.model_dump() if self.metadata else None
+		return {
+			'model_output': output_dump,
+			'result': result_dumps,
+			'state': state_dump,
+			'metadata': metadata_dump,
+			'screenshot_path': self.screenshot_path,
+		}