PyPI - semantio - Version diff - 0.0.2.tar.gz → 0.0.4.tar.gz - Mend

semantio 0.0.2.tar.gz → 0.0.4.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (47) hide show

{semantio-0.0.2 → semantio-0.0.4}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: semantio
-Version: 0.0.2
+Version: 0.0.4
 Summary: A powerful SDK for building AI agents
 Home-page: https://github.com/Syenah/semantio
 Author: Rakesh

{semantio-0.0.2 → semantio-0.0.4}/semantio/agent.py RENAMED Viewed

@@ -21,24 +21,24 @@ import os
 logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
-class Assistant(BaseModel):
+class Agent(BaseModel):
     # -*- Agent settings
-    name: Optional[str] = Field(None, description="Name of the assistant.")
-    description: Optional[str] = Field(None, description="Description of the assistant's role.")
-    instructions: Optional[List[str]] = Field(None, description="List of instructions for the assistant.")
+    name: Optional[str] = Field(None, description="Name of the agent.")
+    description: Optional[str] = Field(None, description="Description of the agent's role.")
+    instructions: Optional[List[str]] = Field(None, description="List of instructions for the agent.")
     model: Optional[str] = Field(None, description="This one is not in the use.")
     show_tool_calls: bool = Field(False, description="Whether to show tool calls in the response.")
     markdown: bool = Field(False, description="Whether to format the response in markdown.")
-    tools: Optional[List[BaseTool]] = Field(None, description="List of tools available to the assistant.")
-    user_name: Optional[str] = Field("User", description="Name of the user interacting with the assistant.")
-    emoji: Optional[str] = Field(":robot:", description="Emoji to represent the assistant in the CLI.")
+    tools: Optional[List[BaseTool]] = Field(None, description="List of tools available to the agent.")
+    user_name: Optional[str] = Field("User", description="Name of the user interacting with the agent.")
+    emoji: Optional[str] = Field(":robot:", description="Emoji to represent the agent in the CLI.")
     rag: Optional[RAG] = Field(None, description="RAG instance for context retrieval.")
     knowledge_base: Optional[Any] = Field(None, description="Knowledge base for domain-specific information.")
     llm: Optional[str] = Field(None, description="The LLM provider to use (e.g., 'groq', 'openai', 'anthropic').")
     llm_model: Optional[str] = Field(None, description="The specific model to use for the LLM provider.")
     llm_instance: Optional[BaseLLM] = Field(None, description="The LLM instance to use.")
     json_output: bool = Field(False, description="Whether to format the response as JSON.")
-    api: bool = Field(False, description="Whether to generate an API for the assistant.")
+    api: bool = Field(False, description="Whether to generate an API for the agent.")
     api_config: Optional[Dict] = Field(
         None,
         description="Configuration for the API (e.g., host, port, authentication).",
@@ -46,7 +46,7 @@ class Assistant(BaseModel):
     api_generator: Optional[Any] = Field(None, description="The API generator instance.")
     expected_output: Optional[Union[str, Dict]] = Field(None, description="The expected format or structure of the output.")
     semantic_model: Optional[Any] = Field(None, description="SentenceTransformer model for semantic matching.")
-    team: Optional[List['Assistant']] = Field(None, description="List of assistants in the team.")
+    team: Optional[List['Agent']] = Field(None, description="List of assistants in the team.")
     auto_tool: bool = Field(False, description="Whether to automatically detect and call tools.")
     # Allow arbitrary types
@@ -56,8 +56,11 @@ class Assistant(BaseModel):
         super().__init__(**kwargs)
         # Initialize the model and tools here if needed
         self._initialize_model()
-        # Automatically discover and register tools if not provided
+        # Initialize tools as an empty list if not provided
         if self.tools is None:
+            self.tools = []
+        # Automatically discover and register tools if auto tool is enabled
+        if self.auto_tool and not self.tools:
             self.tools = self._discover_tools()
         # Pass the LLM instance to each tool
         for tool in self.tools:
@@ -125,7 +128,7 @@ class Assistant(BaseModel):
             try:
                 # Import the module
                 module_name = file.stem
-                module = importlib.import_module(f"hashai.tools.{module_name}")
+                module = importlib.import_module(f"semantio.tools.{module_name}")
                 # Find all classes that inherit from BaseTool
                 for name, obj in module.__dict__.items():
@@ -197,7 +200,7 @@ class Assistant(BaseModel):
         model_to_use = self.llm_model or default_model
         # Dynamically import and initialize the LLM class
-        module_name = f"hashai.llm.{llm_provider}"
+        module_name = f"semantio.llm.{llm_provider}"
         llm_module = importlib.import_module(module_name)
         llm_class = getattr(llm_module, llm_class_name)
         self.llm_instance = llm_class(model=model_to_use, api_key=api_key)
@@ -213,11 +216,10 @@ class Assistant(BaseModel):
         message: Optional[Union[str, Image, List, Dict]] = None,
         stream: bool = False,
         markdown: bool = False,
-        tools: Optional[List[BaseTool]] = None,
-        team: Optional[List['Assistant']] = None,
+        team: Optional[List['Agent']] = None,
         **kwargs,
     ) -> Union[str, Dict]:  # Add return type hint
-        """Print the assistant's response to the console and return it."""
+        """Print the agent's response to the console and return it."""
         if stream:
             # Handle streaming response
@@ -228,60 +230,23 @@ class Assistant(BaseModel):
             return response
         else:
             # Generate and return the response
-            response = self._generate_response(message, markdown=markdown, tools=tools, team=team, **kwargs)
+            response = self._generate_response(message, markdown=markdown, team=team, **kwargs)
             print(response)  # Print the response to the console
             return response
     def _stream_response(self, message: str, markdown: bool = False, **kwargs) -> Iterator[str]:
-        """Stream the assistant's response."""
+        """Stream the agent's response."""
         # Simulate streaming by yielding chunks of the response
         response = self._generate_response(message, markdown=markdown, **kwargs)
         for chunk in response.split():
             yield chunk + " "
     def register_tool(self, tool: BaseTool):
-        """Register a tool for the assistant."""
+        """Register a tool for the agent."""
         if self.tools is None:
             self.tools = []
         self.tools.append(tool)
-    def _detect_tool_call(self, message: str) -> Optional[Dict[str, Any]]:
-        """
-        Use the LLM to detect which tool should be called based on the user's query.
-        """
-        if not self.tools:
-            logger.warning("No tools available to detect.")
-            return None
-        # Create a prompt for the LLM
-        prompt = f"""
-        You are an AI assistant that helps users by selecting the most appropriate tool to answer their query. Below is a list of available tools and their functionalities:
-        {self._get_tool_descriptions()}
-        Based on the user's query, select the most appropriate tool. Respond with the name of the tool (e.g., "CryptoPriceChecker"). If no tool is suitable, respond with "None".
-        User Query: "{message}"
-        """
-        try:
-            # Call the LLM to generate the response
-            response = self.llm_instance.generate(prompt=prompt)
-            tool_name = response.strip().replace('"', '').replace("'", "")
-            # Find the tool in the list of available tools
-            tool = next((t for t in self.tools if t.name.lower() == tool_name.lower()), None)
-            if tool:
-                logger.info(f"Detected tool call: {tool.name}")
-                return {
-                    "tool": tool.name,
-                    "input": {"query": message}
-                }
-        except Exception as e:
-            logger.error(f"Failed to detect tool call: {e}")
-        return None
     def _analyze_query_and_select_tools(self, query: str) -> List[Dict[str, Any]]:
         """
@@ -290,7 +255,7 @@ class Assistant(BaseModel):
         """
         # Create a prompt for the LLM to analyze the query and select tools
         prompt = f"""
-        You are an AI assistant that helps analyze user queries and select the most appropriate tools.
+        You are an AI agent that helps analyze user queries and select the most appropriate tools.
         Below is a list of available tools and their functionalities:
         {self._get_tool_descriptions()}
@@ -324,17 +289,16 @@ class Assistant(BaseModel):
             return []
-    def _generate_response(self, message: str, markdown: bool = False, tools: Optional[List[BaseTool]] = None, team: Optional[List['Assistant']] = None, **kwargs) -> str:
-        """Generate the assistant's response, including tool execution and context retrieval."""
-        # Use the specified tools or team if provided
-        if tools is not None:
-            self.tools = tools
+    def _generate_response(self, message: str, markdown: bool = False, team: Optional[List['Agent']] = None, **kwargs) -> str:
+        """Generate the agent's response, including tool execution and context retrieval."""
+        # Use the specified team if provided
         if team is not None:
             return self._generate_team_response(message, team, markdown=markdown, **kwargs)
         # Initialize tool_outputs as an empty dictionary
         tool_outputs = {}
         responses = []
+        tool_calls = []
         # Use the LLM to analyze the query and dynamically select tools when auto_tool is enabled
         if self.auto_tool:
@@ -344,7 +308,7 @@ class Assistant(BaseModel):
             if self.tools:
                 tool_calls = [
                     {
-                        "tool": tool.__class__.__name__,
+                        "tool": tool.name,
                         "input": {
                             "query": message,  # Use the message as the query
                             "context": None,  # No context provided by default
@@ -352,10 +316,8 @@ class Assistant(BaseModel):
                     }
                     for tool in self.tools
                 ]
-            else:
-                tool_calls = kwargs.get("tool_calls", [])
-            # Execute tools if any are detected
+        # Execute tools if any are detected
         if tool_calls:
             for tool_call in tool_calls:
                 tool_name = tool_call["tool"]
@@ -396,7 +358,7 @@ class Assistant(BaseModel):
             except Exception as e:
                 logger.error(f"Failed to generate LLM response: {e}")
                 responses.append(f"An error occurred while generating the analysis: {e}")
-        if not tool_calls:
+        if not self.tools and not tool_calls:
             # If no tools were executed, proceed with the original logic
             # Retrieve relevant context using RAG
             rag_context = self.rag.retrieve(message) if self.rag else None
@@ -435,12 +397,12 @@ class Assistant(BaseModel):
         # Combine all responses into a single string
         return "\n\n".join(responses)
-    def _generate_team_response(self, message: str, team: List['Assistant'], markdown: bool = False, **kwargs) -> str:
+    def _generate_team_response(self, message: str, team: List['Agent'], markdown: bool = False, **kwargs) -> str:
         """Generate a response using a team of assistants."""
         responses = []
-        for assistant in team:
-            response = assistant.print_response(message, markdown=markdown, **kwargs)
-            responses.append(f"**{assistant.name}:**\n\n{response}")
+        for agent in team:
+            response = agent.print_response(message, markdown=markdown, **kwargs)
+            responses.append(f"**{agent.name}:**\n\n{response}")
         return "\n\n".join(responses)
     def _build_prompt(self, message: str, context: Optional[List[Dict]]) -> str:
@@ -578,7 +540,7 @@ class Assistant(BaseModel):
         exit_on: Optional[List[str]] = None,
         **kwargs,
     ):
-        """Run the assistant in a CLI app."""
+        """Run the agent in a CLI app."""
         from rich.prompt import Prompt
         if message:
@@ -593,15 +555,15 @@ class Assistant(BaseModel):
             self.print_response(message=message, **kwargs)
     def _generate_api(self):
-        """Generate an API for the assistant if api=True."""
+        """Generate an API for the agent if api=True."""
         from .api.api_generator import APIGenerator
         self.api_generator = APIGenerator(self)
-        print(f"API generated for assistant '{self.name}'. Use `.run_api()` to start the API server.")
+        print(f"API generated for agent '{self.name}'. Use `.run_api()` to start the API server.")
     def run_api(self):
-        """Run the API server for the assistant."""
+        """Run the API server for the agent."""
         if not hasattr(self, 'api_generator'):
-            raise ValueError("API is not enabled for this assistant. Set `api=True` when initializing the assistant.")
+            raise ValueError("API is not enabled for this agent. Set `api=True` when initializing the agent.")
         # Get API configuration
         host = self.api_config.get("host", "0.0.0.0") if self.api_config else "0.0.0.0"

{semantio-0.0.2 → semantio-0.0.4}/semantio/cli/main.py RENAMED Viewed

@@ -1,7 +1,7 @@
 import argparse
 import warnings
-from hashai.assistant import Assistant
-from hashai.llm import get_llm
+from semantio.agent import Agent
+from semantio.llm import get_llm
 from urllib3.exceptions import NotOpenSSLWarning
 # Suppress the NotOpenSSLWarning
@@ -9,7 +9,7 @@ warnings.filterwarnings("ignore", category=NotOpenSSLWarning)
 def main():
     parser = argparse.ArgumentParser(description="opAi CLI")
-    parser.add_argument("--message", type=str, required=True, help="Message to send to the assistant")
+    parser.add_argument("--message", type=str, required=True, help="Message to send to the agent")
     parser.add_argument("--provider", type=str, required=True, help="LLM provider (e.g., groq, openai)")
     parser.add_argument("--api-key", type=str, required=True, help="API key for the LLM provider")
     parser.add_argument("--model", type=str, default=None, help="Model name (e.g., mixtral-8x7b-32768)")
@@ -22,9 +22,9 @@ def main():
     llm = get_llm(provider=args.provider, **llm_config)
-    # Create an assistant
-    assistant = Assistant(model=args.provider, llm=llm)
-    assistant.print_response(args.message)
+    # Create an agent
+    agent = Agent(model=args.provider, llm=llm)
+    agent.print_response(args.message)
 if __name__ == "__main__":

semantio-0.0.4/semantio/tools/web_browser.py ADDED Viewed

@@ -0,0 +1,271 @@
+# web_browser.py
+from typing import Dict, Any, List, Optional
+from pydantic import Field, BaseModel
+from selenium import webdriver
+from selenium.webdriver.common.by import By
+from selenium.webdriver.support.ui import WebDriverWait
+from selenium.webdriver.support import expected_conditions as EC
+from selenium.webdriver.chrome.options import Options
+from selenium.webdriver.chrome.service import Service
+from webdriver_manager.chrome import ChromeDriverManager
+from bs4 import BeautifulSoup
+import json
+import time
+import re
+import logging
+from .base_tool import BaseTool
+logger = logging.getLogger(__name__)
+class BrowserPlan(BaseModel):
+    tasks: List[Dict[str, Any]] = Field(
+        ...,
+        description="List of automation tasks to execute"
+    )
+class WebBrowserTool(BaseTool):
+    name: str = Field("WebBrowser", description="Name of the tool")
+    description: str = Field(
+        "Universal web automation tool for dynamic website interactions",
+        description="Tool description"
+    )
+    def execute(self, input: Dict[str, Any]) -> Dict[str, Any]:
+        """Execute dynamic web automation workflow"""
+        driver = None
+        try:
+            driver = self._init_browser(input.get("headless", False))
+            results = []
+            current_url = ""
+            # Generate initial plan
+            plan = self._generate_plan(input['query'], current_url)
+            for task in plan.tasks:
+                result = self._execute_safe_task(driver, task)
+                results.append(result)
+                if not result['success']:
+                    break
+                # Update context for next tasks
+                current_url = driver.current_url
+            return {"status": "success", "results": results}
+        except Exception as e:
+            return {"status": "error", "message": str(e)}
+        finally:
+            if driver:
+                driver.quit()
+    def _init_browser(self, headless: bool) -> webdriver.Chrome:
+        """Initialize browser with advanced options"""
+        options = Options()
+        options.add_argument("--start-maximized")
+        options.add_argument("--disable-blink-features=AutomationControlled")
+        options.add_experimental_option("excludeSwitches", ["enable-automation"])
+        if headless:
+            options.add_argument("--headless=new")
+        return webdriver.Chrome(
+            service=Service(ChromeDriverManager().install()),
+            options=options
+        )
+    def _generate_plan(self, query: str, current_url: str) -> BrowserPlan:
+        """Generate adaptive execution plan using LLM"""
+        prompt = f"""Generate browser automation plan for: {query}
+        Current URL: {current_url or 'No page loaded yet'}
+        Required JSON format:
+        {{
+            "tasks": [
+                {{
+                    "action": "navigate|click|type|wait|scroll",
+                    "selector": "CSS selector (optional)",
+                    "value": "input text/URL/seconds",
+                    "description": "action purpose"
+                }}
+            ]
+        }}
+        Guidelines:
+        1. Prefer IDs in selectors (#element-id)
+        2. Use semantic attributes (aria-label, name)
+        3. Include wait steps after navigation
+        4. Prioritize visible elements
+        5. Add scroll steps for hidden elements
+        """
+        response = self.llm.generate(prompt=prompt)
+        return self._parse_plan(response)
+    def _parse_plan(self, response: str) -> BrowserPlan:
+        """Robust JSON parsing with multiple fallback strategies"""
+        try:
+            # Try extracting JSON from markdown code block
+            json_match = re.search(r'```json\n?(.+?)\n?```', response, re.DOTALL)
+            if json_match:
+                plan_data = json.loads(json_match.group(1).strip())
+            else:
+                # Fallback to extract first JSON object
+                json_str = re.search(r'\{.*\}', response, re.DOTALL).group()
+                plan_data = json.loads(json_str)
+            # Validate tasks structure
+            validated_tasks = []
+            for task in plan_data.get("tasks", []):
+                if not all(key in task for key in ["action", "description"]):
+                    continue
+                validated_tasks.append({
+                    "action": task["action"],
+                    "selector": task.get("selector", ""),
+                    "value": task.get("value", ""),
+                    "description": task["description"]
+                })
+            return BrowserPlan(tasks=validated_tasks)
+        except (json.JSONDecodeError, AttributeError) as e:
+            logger.error(f"Plan parsing failed: {e}")
+            return BrowserPlan(tasks=[])
+    def _execute_safe_task(self, driver, task: Dict) -> Dict[str, Any]:
+        """Execute task with comprehensive error handling"""
+        try:
+            action = task["action"].lower()
+            selector = task.get("selector", "")
+            value = task.get("value", "")
+            if action == "navigate":
+                return self._handle_navigation(driver, value)
+            elif action == "click":
+                return self._handle_click(driver, selector)
+            elif action == "type":
+                return self._handle_typing(driver, selector, value)
+            elif action == "wait":
+                return self._handle_wait(value)
+            elif action == "scroll":
+                return self._handle_scroll(driver, selector)
+            return {
+                "action": action,
+                "success": False,
+                "message": f"Unsupported action: {action}"
+            }
+        except Exception as e:
+            return {
+                "action": action,
+                "success": False,
+                "message": f"Critical error: {str(e)}"
+            }
+    def _handle_navigation(self, driver, url: str) -> Dict[str, Any]:
+        """Smart navigation handler"""
+        if not url.startswith(("http://", "https://")):
+            url = f"https://{url}"
+        try:
+            driver.get(url)
+            WebDriverWait(driver, 15).until(
+                EC.presence_of_element_located((By.TAG_NAME, "body"))
+            )
+            return {
+                "action": "navigate",
+                "success": True,
+                "message": f"Navigated to {url}"
+            }
+        except Exception as e:
+            return {
+                "action": "navigate",
+                "success": False,
+                "message": f"Navigation failed: {str(e)}"
+            }
+    def _handle_click(self, driver, selector: str) -> Dict[str, Any]:
+        """Dynamic click handler"""
+        try:
+            element = WebDriverWait(driver, 15).until(
+                EC.element_to_be_clickable((By.CSS_SELECTOR, selector))
+            )
+            driver.execute_script("arguments[0].scrollIntoView({behavior: 'smooth'});", element)
+            element.click()
+            return {
+                "action": "click",
+                "success": True,
+                "message": f"Clicked element: {selector}"
+            }
+        except Exception as e:
+            return {
+                "action": "click",
+                "success": False,
+                "message": f"Click failed: {str(e)}"
+            }
+    def _handle_typing(self, driver, selector: str, text: str) -> Dict[str, Any]:
+        """Universal typing handler"""
+        try:
+            element = WebDriverWait(driver, 15).until(
+                EC.presence_of_element_located((By.CSS_SELECTOR, selector))
+            )
+            element.clear()
+            element.send_keys(text)
+            return {
+                "action": "type",
+                "success": True,
+                "message": f"Typed '{text}' into {selector}"
+            }
+        except Exception as e:
+            return {
+                "action": "type",
+                "success": False,
+                "message": f"Typing failed: {str(e)}"
+            }
+    def _handle_wait(self, seconds: str) -> Dict[str, Any]:
+        """Configurable wait handler"""
+        try:
+            wait_time = float(seconds)
+            time.sleep(wait_time)
+            return {
+                "action": "wait",
+                "success": True,
+                "message": f"Waited {wait_time} seconds"
+            }
+        except ValueError:
+            return {
+                "action": "wait",
+                "success": False,
+                "message": "Invalid wait time"
+            }
+    def _handle_scroll(self, driver, selector: str) -> Dict[str, Any]:
+        """Smart scroll handler"""
+        try:
+            if selector:
+                element = WebDriverWait(driver, 15).until(
+                    EC.presence_of_element_located((By.CSS_SELECTOR, selector))
+                )
+                driver.execute_script("arguments[0].scrollIntoView({behavior: 'smooth'});", element)
+            else:
+                driver.execute_script("window.scrollTo(0, document.body.scrollHeight);")
+            return {
+                "action": "scroll",
+                "success": True,
+                "message": f"Scrolled to {selector or 'page bottom'}"
+            }
+        except Exception as e:
+            return {
+                "action": "scroll",
+                "success": False,
+                "message": f"Scroll failed: {str(e)}"
+            }

{semantio-0.0.2 → semantio-0.0.4}/semantio.egg-info/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: semantio
-Version: 0.0.2
+Version: 0.0.4
 Summary: A powerful SDK for building AI agents
 Home-page: https://github.com/Syenah/semantio
 Author: Rakesh

{semantio-0.0.2 → semantio-0.0.4}/semantio.egg-info/SOURCES.txt RENAMED Viewed

@@ -36,6 +36,7 @@ semantio/tools/base_tool.py
 semantio/tools/crypto.py
 semantio/tools/duckduckgo.py
 semantio/tools/stocks.py
+semantio/tools/web_browser.py
 semantio/utils/__init__.py
 semantio/utils/config.py
 semantio/utils/date_utils.py

{semantio-0.0.2 → semantio-0.0.4}/semantio.egg-info/requires.txt RENAMED Viewed

@@ -15,3 +15,7 @@ sentence-transformers
 fuzzywuzzy
 duckduckgo-search
 yfinance
+selenium
+beautifulsoup4
+webdriver-manager
+validators

{semantio-0.0.2 → semantio-0.0.4}/setup.py RENAMED Viewed

@@ -2,7 +2,7 @@ from setuptools import setup, find_packages
 setup(
     name="semantio",
-    version="0.0.2",
+    version="0.0.4",
     description="A powerful SDK for building AI agents",
     long_description=open("README.md").read(),
     long_description_content_type="text/markdown",
@@ -28,6 +28,10 @@ setup(
         "fuzzywuzzy", # For fuzzy string matching
         "duckduckgo-search", # For DuckDuckGo search
         "yfinance",   # For stock/crypto prices
+        "selenium",   # For web scraping
+        "beautifulsoup4", # For HTML parsing
+        "webdriver-manager", # For browser automation
+        "validators", # For URL validation
     ],
     classifiers=[