PyPI - semantio - Versions diffs - 0.0.3__py3-none-any.whl → 0.0.4__py3-none-any.whl - Mend

semantio 0.0.3__py3-none-any.whl → 0.0.4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (8)

semantio/agent.py CHANGED Viewed

@@ -56,8 +56,11 @@ class Agent(BaseModel):
         super().__init__(**kwargs)
         # Initialize the model and tools here if needed
         self._initialize_model()
-        # Automatically discover and register tools if not provided
+        # Initialize tools as an empty list if not provided
         if self.tools is None:
+            self.tools = []
+        # Automatically discover and register tools if auto tool is enabled
+        if self.auto_tool and not self.tools:
             self.tools = self._discover_tools()
         # Pass the LLM instance to each tool
         for tool in self.tools:
@@ -213,7 +216,6 @@ class Agent(BaseModel):
         message: Optional[Union[str, Image, List, Dict]] = None,
         stream: bool = False,
         markdown: bool = False,
-        tools: Optional[List[BaseTool]] = None,
         team: Optional[List['Agent']] = None,
         **kwargs,
     ) -> Union[str, Dict]:  # Add return type hint
@@ -228,7 +230,7 @@ class Agent(BaseModel):
             return response
         else:
             # Generate and return the response
-            response = self._generate_response(message, markdown=markdown, tools=tools, team=team, **kwargs)
+            response = self._generate_response(message, markdown=markdown, team=team, **kwargs)
             print(response)  # Print the response to the console
             return response
@@ -245,43 +247,6 @@ class Agent(BaseModel):
         if self.tools is None:
             self.tools = []
         self.tools.append(tool)
-    def _detect_tool_call(self, message: str) -> Optional[Dict[str, Any]]:
-        """
-        Use the LLM to detect which tool should be called based on the user's query.
-        """
-        if not self.tools:
-            logger.warning("No tools available to detect.")
-            return None
-        # Create a prompt for the LLM
-        prompt = f"""
-        You are an AI agent that helps users by selecting the most appropriate tool to answer their query. Below is a list of available tools and their functionalities:
-        {self._get_tool_descriptions()}
-        Based on the user's query, select the most appropriate tool. Respond with the name of the tool (e.g., "CryptoPriceChecker"). If no tool is suitable, respond with "None".
-        User Query: "{message}"
-        """
-        try:
-            # Call the LLM to generate the response
-            response = self.llm_instance.generate(prompt=prompt)
-            tool_name = response.strip().replace('"', '').replace("'", "")
-            # Find the tool in the list of available tools
-            tool = next((t for t in self.tools if t.name.lower() == tool_name.lower()), None)
-            if tool:
-                logger.info(f"Detected tool call: {tool.name}")
-                return {
-                    "tool": tool.name,
-                    "input": {"query": message}
-                }
-        except Exception as e:
-            logger.error(f"Failed to detect tool call: {e}")
-        return None
     def _analyze_query_and_select_tools(self, query: str) -> List[Dict[str, Any]]:
         """
@@ -324,17 +289,16 @@ class Agent(BaseModel):
             return []
-    def _generate_response(self, message: str, markdown: bool = False, tools: Optional[List[BaseTool]] = None, team: Optional[List['Agent']] = None, **kwargs) -> str:
+    def _generate_response(self, message: str, markdown: bool = False, team: Optional[List['Agent']] = None, **kwargs) -> str:
         """Generate the agent's response, including tool execution and context retrieval."""
-        # Use the specified tools or team if provided
-        if tools is not None:
-            self.tools = tools
+        # Use the specified team if provided
         if team is not None:
             return self._generate_team_response(message, team, markdown=markdown, **kwargs)
         # Initialize tool_outputs as an empty dictionary
         tool_outputs = {}
         responses = []
+        tool_calls = []
         # Use the LLM to analyze the query and dynamically select tools when auto_tool is enabled
         if self.auto_tool:
@@ -344,7 +308,7 @@ class Agent(BaseModel):
             if self.tools:
                 tool_calls = [
                     {
-                        "tool": tool.__class__.__name__,
+                        "tool": tool.name,
                         "input": {
                             "query": message,  # Use the message as the query
                             "context": None,  # No context provided by default
@@ -352,10 +316,8 @@ class Agent(BaseModel):
                     }
                     for tool in self.tools
                 ]
-            else:
-                tool_calls = kwargs.get("tool_calls", [])
-            # Execute tools if any are detected
+        # Execute tools if any are detected
         if tool_calls:
             for tool_call in tool_calls:
                 tool_name = tool_call["tool"]
@@ -396,7 +358,7 @@ class Agent(BaseModel):
             except Exception as e:
                 logger.error(f"Failed to generate LLM response: {e}")
                 responses.append(f"An error occurred while generating the analysis: {e}")
-        if not tool_calls:
+        if not self.tools and not tool_calls:
             # If no tools were executed, proceed with the original logic
             # Retrieve relevant context using RAG
             rag_context = self.rag.retrieve(message) if self.rag else None

semantio/tools/web_browser.py ADDED Viewed

@@ -0,0 +1,271 @@
+# web_browser.py
+from typing import Dict, Any, List, Optional
+from pydantic import Field, BaseModel
+from selenium import webdriver
+from selenium.webdriver.common.by import By
+from selenium.webdriver.support.ui import WebDriverWait
+from selenium.webdriver.support import expected_conditions as EC
+from selenium.webdriver.chrome.options import Options
+from selenium.webdriver.chrome.service import Service
+from webdriver_manager.chrome import ChromeDriverManager
+from bs4 import BeautifulSoup
+import json
+import time
+import re
+import logging
+from .base_tool import BaseTool
+logger = logging.getLogger(__name__)
+class BrowserPlan(BaseModel):
+    tasks: List[Dict[str, Any]] = Field(
+        ...,
+        description="List of automation tasks to execute"
+    )
+class WebBrowserTool(BaseTool):
+    name: str = Field("WebBrowser", description="Name of the tool")
+    description: str = Field(
+        "Universal web automation tool for dynamic website interactions",
+        description="Tool description"
+    )
+    def execute(self, input: Dict[str, Any]) -> Dict[str, Any]:
+        """Execute dynamic web automation workflow"""
+        driver = None
+        try:
+            driver = self._init_browser(input.get("headless", False))
+            results = []
+            current_url = ""
+            # Generate initial plan
+            plan = self._generate_plan(input['query'], current_url)
+            for task in plan.tasks:
+                result = self._execute_safe_task(driver, task)
+                results.append(result)
+                if not result['success']:
+                    break
+                # Update context for next tasks
+                current_url = driver.current_url
+            return {"status": "success", "results": results}
+        except Exception as e:
+            return {"status": "error", "message": str(e)}
+        finally:
+            if driver:
+                driver.quit()
+    def _init_browser(self, headless: bool) -> webdriver.Chrome:
+        """Initialize browser with advanced options"""
+        options = Options()
+        options.add_argument("--start-maximized")
+        options.add_argument("--disable-blink-features=AutomationControlled")
+        options.add_experimental_option("excludeSwitches", ["enable-automation"])
+        if headless:
+            options.add_argument("--headless=new")
+        return webdriver.Chrome(
+            service=Service(ChromeDriverManager().install()),
+            options=options
+        )
+    def _generate_plan(self, query: str, current_url: str) -> BrowserPlan:
+        """Generate adaptive execution plan using LLM"""
+        prompt = f"""Generate browser automation plan for: {query}
+        Current URL: {current_url or 'No page loaded yet'}
+        Required JSON format:
+        {{
+            "tasks": [
+                {{
+                    "action": "navigate|click|type|wait|scroll",
+                    "selector": "CSS selector (optional)",
+                    "value": "input text/URL/seconds",
+                    "description": "action purpose"
+                }}
+            ]
+        }}
+        Guidelines:
+        1. Prefer IDs in selectors (#element-id)
+        2. Use semantic attributes (aria-label, name)
+        3. Include wait steps after navigation
+        4. Prioritize visible elements
+        5. Add scroll steps for hidden elements
+        """
+        response = self.llm.generate(prompt=prompt)
+        return self._parse_plan(response)
+    def _parse_plan(self, response: str) -> BrowserPlan:
+        """Robust JSON parsing with multiple fallback strategies"""
+        try:
+            # Try extracting JSON from markdown code block
+            json_match = re.search(r'```json\n?(.+?)\n?```', response, re.DOTALL)
+            if json_match:
+                plan_data = json.loads(json_match.group(1).strip())
+            else:
+                # Fallback to extract first JSON object
+                json_str = re.search(r'\{.*\}', response, re.DOTALL).group()
+                plan_data = json.loads(json_str)
+            # Validate tasks structure
+            validated_tasks = []
+            for task in plan_data.get("tasks", []):
+                if not all(key in task for key in ["action", "description"]):
+                    continue
+                validated_tasks.append({
+                    "action": task["action"],
+                    "selector": task.get("selector", ""),
+                    "value": task.get("value", ""),
+                    "description": task["description"]
+                })
+            return BrowserPlan(tasks=validated_tasks)
+        except (json.JSONDecodeError, AttributeError) as e:
+            logger.error(f"Plan parsing failed: {e}")
+            return BrowserPlan(tasks=[])
+    def _execute_safe_task(self, driver, task: Dict) -> Dict[str, Any]:
+        """Execute task with comprehensive error handling"""
+        try:
+            action = task["action"].lower()
+            selector = task.get("selector", "")
+            value = task.get("value", "")
+            if action == "navigate":
+                return self._handle_navigation(driver, value)
+            elif action == "click":
+                return self._handle_click(driver, selector)
+            elif action == "type":
+                return self._handle_typing(driver, selector, value)
+            elif action == "wait":
+                return self._handle_wait(value)
+            elif action == "scroll":
+                return self._handle_scroll(driver, selector)
+            return {
+                "action": action,
+                "success": False,
+                "message": f"Unsupported action: {action}"
+            }
+        except Exception as e:
+            return {
+                "action": action,
+                "success": False,
+                "message": f"Critical error: {str(e)}"
+            }
+    def _handle_navigation(self, driver, url: str) -> Dict[str, Any]:
+        """Smart navigation handler"""
+        if not url.startswith(("http://", "https://")):
+            url = f"https://{url}"
+        try:
+            driver.get(url)
+            WebDriverWait(driver, 15).until(
+                EC.presence_of_element_located((By.TAG_NAME, "body"))
+            )
+            return {
+                "action": "navigate",
+                "success": True,
+                "message": f"Navigated to {url}"
+            }
+        except Exception as e:
+            return {
+                "action": "navigate",
+                "success": False,
+                "message": f"Navigation failed: {str(e)}"
+            }
+    def _handle_click(self, driver, selector: str) -> Dict[str, Any]:
+        """Dynamic click handler"""
+        try:
+            element = WebDriverWait(driver, 15).until(
+                EC.element_to_be_clickable((By.CSS_SELECTOR, selector))
+            )
+            driver.execute_script("arguments[0].scrollIntoView({behavior: 'smooth'});", element)
+            element.click()
+            return {
+                "action": "click",
+                "success": True,
+                "message": f"Clicked element: {selector}"
+            }
+        except Exception as e:
+            return {
+                "action": "click",
+                "success": False,
+                "message": f"Click failed: {str(e)}"
+            }
+    def _handle_typing(self, driver, selector: str, text: str) -> Dict[str, Any]:
+        """Universal typing handler"""
+        try:
+            element = WebDriverWait(driver, 15).until(
+                EC.presence_of_element_located((By.CSS_SELECTOR, selector))
+            )
+            element.clear()
+            element.send_keys(text)
+            return {
+                "action": "type",
+                "success": True,
+                "message": f"Typed '{text}' into {selector}"
+            }
+        except Exception as e:
+            return {
+                "action": "type",
+                "success": False,
+                "message": f"Typing failed: {str(e)}"
+            }
+    def _handle_wait(self, seconds: str) -> Dict[str, Any]:
+        """Configurable wait handler"""
+        try:
+            wait_time = float(seconds)
+            time.sleep(wait_time)
+            return {
+                "action": "wait",
+                "success": True,
+                "message": f"Waited {wait_time} seconds"
+            }
+        except ValueError:
+            return {
+                "action": "wait",
+                "success": False,
+                "message": "Invalid wait time"
+            }
+    def _handle_scroll(self, driver, selector: str) -> Dict[str, Any]:
+        """Smart scroll handler"""
+        try:
+            if selector:
+                element = WebDriverWait(driver, 15).until(
+                    EC.presence_of_element_located((By.CSS_SELECTOR, selector))
+                )
+                driver.execute_script("arguments[0].scrollIntoView({behavior: 'smooth'});", element)
+            else:
+                driver.execute_script("window.scrollTo(0, document.body.scrollHeight);")
+            return {
+                "action": "scroll",
+                "success": True,
+                "message": f"Scrolled to {selector or 'page bottom'}"
+            }
+        except Exception as e:
+            return {
+                "action": "scroll",
+                "success": False,
+                "message": f"Scroll failed: {str(e)}"
+            }

{semantio-0.0.3.dist-info → semantio-0.0.4.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: semantio
-Version: 0.0.3
+Version: 0.0.4
 Summary: A powerful SDK for building AI agents
 Home-page: https://github.com/Syenah/semantio
 Author: Rakesh
@@ -33,6 +33,10 @@ Requires-Dist: sentence-transformers
 Requires-Dist: fuzzywuzzy
 Requires-Dist: duckduckgo-search
 Requires-Dist: yfinance
+Requires-Dist: selenium
+Requires-Dist: beautifulsoup4
+Requires-Dist: webdriver-manager
+Requires-Dist: validators
 # Semantio: The Mother of Your AI Agents

{semantio-0.0.3.dist-info → semantio-0.0.4.dist-info}/RECORD RENAMED Viewed

@@ -1,5 +1,5 @@
 semantio/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-semantio/agent.py,sha256=plQ4D76cnJ1FaGlEuKDeA53aW_hMDvt5sbmUuTHqvFQ,30143
+semantio/agent.py,sha256=hKytSI5LqNnxqVvwI2hOINqPgrdhUXY9MS_90_crZPs,28584
 semantio/memory.py,sha256=eNAwyAokppHzMcIyFgOw2hT2wnLQBd9GL4T5eallNV4,281
 semantio/rag.py,sha256=ROy3Pa1NURcDs6qQZ8IMoa5Xlzt6I-msEq0C1p8UgB0,472
 semantio/api/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
@@ -27,15 +27,16 @@ semantio/tools/base_tool.py,sha256=xBNSa_8a8WmA4BGRLG2dE7wj9GnBcZo7-P2SyD86GvY,5
 semantio/tools/crypto.py,sha256=mut1ztvpPcUUP3b563dh_FmKtP68KmNis3Qm8WENj8w,5559
 semantio/tools/duckduckgo.py,sha256=6mGn0js0cIsVxQlAgB8AYNLP05H8WmJKnSVosiO9iH0,5034
 semantio/tools/stocks.py,sha256=BVuK61O9OmWQjj0YdiCJY6TzpiFJ_An1UJB2RkDfX2k,5393
+semantio/tools/web_browser.py,sha256=wqr5pj2GybkK9IHDb8C1BipS8ujV2l36WlwA8ZbKd88,9711
 semantio/utils/__init__.py,sha256=Lx4X4iJpRhZzRmpQb80XXh5Ve8ZMOkadWAxXSmHpO_8,244
 semantio/utils/config.py,sha256=ZTwUTqxjW3-w94zoU7GzivWyJe0JJGvBfuB4RUOuEs8,1198
 semantio/utils/date_utils.py,sha256=x3oqRGv6ee_KCJ0LvCqqZh_FSgS6YGOHBwZQS4TJetY,1471
 semantio/utils/file_utils.py,sha256=b_cMuJINEGk9ikNuNHSn9lsmICWwvtnCDZ03ndH_S2I,1779
 semantio/utils/logger.py,sha256=TmGbP8BRjLMWjXi2GWzZ0RIXt70x9qX3FuIqghCNlwM,510
 semantio/utils/validation_utils.py,sha256=iwoxEb4Q5ILqV6tbesMjPWPCCoL3AmPLejGUy6q8YvQ,1284
-semantio-0.0.3.dist-info/LICENSE,sha256=teQbWD2Zlcl1_Fo29o2tNbs6G26hbCQiUzds5fQGYlY,1063
-semantio-0.0.3.dist-info/METADATA,sha256=M5Q-waTknpyWrD_HV9G76jMKgPHPrBBwM5Hl8we4ulo,6800
-semantio-0.0.3.dist-info/WHEEL,sha256=ewwEueio1C2XeHTvT17n8dZUJgOvyCWCt0WVNLClP9o,92
-semantio-0.0.3.dist-info/entry_points.txt,sha256=zbPgevSLwcLpdRHqI_atE8EOt8lK2vRF1AoDflDTo18,53
-semantio-0.0.3.dist-info/top_level.txt,sha256=Yte_6mb-bh-I_lQwMjk1GijZkxPoX4Zmp3kBftC1ZlA,9
-semantio-0.0.3.dist-info/RECORD,,
+semantio-0.0.4.dist-info/LICENSE,sha256=teQbWD2Zlcl1_Fo29o2tNbs6G26hbCQiUzds5fQGYlY,1063
+semantio-0.0.4.dist-info/METADATA,sha256=youxODbkR3gNERG-mD7zbUbe5ix-0lUiWCHUI1_Y5IY,6913
+semantio-0.0.4.dist-info/WHEEL,sha256=ewwEueio1C2XeHTvT17n8dZUJgOvyCWCt0WVNLClP9o,92
+semantio-0.0.4.dist-info/entry_points.txt,sha256=zbPgevSLwcLpdRHqI_atE8EOt8lK2vRF1AoDflDTo18,53
+semantio-0.0.4.dist-info/top_level.txt,sha256=Yte_6mb-bh-I_lQwMjk1GijZkxPoX4Zmp3kBftC1ZlA,9
+semantio-0.0.4.dist-info/RECORD,,

{semantio-0.0.3.dist-info → semantio-0.0.4.dist-info}/LICENSE RENAMED Viewed

File without changes

{semantio-0.0.3.dist-info → semantio-0.0.4.dist-info}/WHEEL RENAMED Viewed

File without changes

{semantio-0.0.3.dist-info → semantio-0.0.4.dist-info}/entry_points.txt RENAMED Viewed

File without changes

{semantio-0.0.3.dist-info → semantio-0.0.4.dist-info}/top_level.txt RENAMED Viewed

File without changes

semantio 0.0.3__py3-none-any.whl → 0.0.4__py3-none-any.whl

semantio 0.0.3__py3-none-any.whl → 0.0.4__py3-none-any.whl