swarms-7.8.3-py3-none-any.whl → swarms-7.8.7-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (60)
  1. swarms/agents/ape_agent.py +5 -22
  2. swarms/agents/consistency_agent.py +1 -1
  3. swarms/agents/i_agent.py +1 -1
  4. swarms/agents/reasoning_agents.py +99 -3
  5. swarms/agents/reasoning_duo.py +1 -1
  6. swarms/cli/main.py +1 -1
  7. swarms/communication/__init__.py +1 -0
  8. swarms/communication/duckdb_wrap.py +32 -2
  9. swarms/communication/pulsar_struct.py +45 -19
  10. swarms/communication/redis_wrap.py +56 -11
  11. swarms/communication/supabase_wrap.py +1659 -0
  12. swarms/prompts/agent_conversation_aggregator.py +38 -0
  13. swarms/prompts/prompt.py +0 -3
  14. swarms/schemas/agent_completion_response.py +71 -0
  15. swarms/schemas/agent_rag_schema.py +7 -0
  16. swarms/schemas/conversation_schema.py +9 -0
  17. swarms/schemas/llm_agent_schema.py +99 -81
  18. swarms/schemas/swarms_api_schemas.py +164 -0
  19. swarms/structs/__init__.py +15 -9
  20. swarms/structs/agent.py +219 -199
  21. swarms/structs/agent_rag_handler.py +685 -0
  22. swarms/structs/base_swarm.py +2 -1
  23. swarms/structs/conversation.py +832 -264
  24. swarms/structs/csv_to_agent.py +153 -100
  25. swarms/structs/deep_research_swarm.py +197 -193
  26. swarms/structs/dynamic_conversational_swarm.py +18 -7
  27. swarms/structs/hiearchical_swarm.py +1 -1
  28. swarms/structs/hybrid_hiearchical_peer_swarm.py +2 -18
  29. swarms/structs/image_batch_processor.py +261 -0
  30. swarms/structs/interactive_groupchat.py +356 -0
  31. swarms/structs/ma_blocks.py +159 -0
  32. swarms/structs/majority_voting.py +1 -1
  33. swarms/structs/mixture_of_agents.py +1 -1
  34. swarms/structs/multi_agent_exec.py +25 -26
  35. swarms/structs/multi_agent_router.py +3 -2
  36. swarms/structs/rearrange.py +3 -3
  37. swarms/structs/sequential_workflow.py +3 -3
  38. swarms/structs/swarm_matcher.py +499 -408
  39. swarms/structs/swarm_router.py +15 -97
  40. swarms/structs/swarming_architectures.py +1 -1
  41. swarms/tools/mcp_client_call.py +3 -0
  42. swarms/utils/__init__.py +10 -2
  43. swarms/utils/check_all_model_max_tokens.py +43 -0
  44. swarms/utils/generate_keys.py +0 -27
  45. swarms/utils/history_output_formatter.py +5 -20
  46. swarms/utils/litellm_wrapper.py +208 -60
  47. swarms/utils/output_types.py +24 -0
  48. swarms/utils/vllm_wrapper.py +14 -13
  49. swarms/utils/xml_utils.py +37 -2
  50. {swarms-7.8.3.dist-info → swarms-7.8.7.dist-info}/METADATA +31 -55
  51. {swarms-7.8.3.dist-info → swarms-7.8.7.dist-info}/RECORD +55 -48
  52. swarms/structs/multi_agent_collab.py +0 -242
  53. swarms/structs/output_types.py +0 -6
  54. swarms/utils/markdown_message.py +0 -21
  55. swarms/utils/visualizer.py +0 -510
  56. swarms/utils/wrapper_clusterop.py +0 -127
  57. /swarms/{tools → schemas}/tool_schema_base_model.py +0 -0
  58. {swarms-7.8.3.dist-info → swarms-7.8.7.dist-info}/LICENSE +0 -0
  59. {swarms-7.8.3.dist-info → swarms-7.8.7.dist-info}/WHEEL +0 -0
  60. {swarms-7.8.3.dist-info → swarms-7.8.7.dist-info}/entry_points.txt +0 -0
swarms/utils/litellm_wrapper.py CHANGED
@@ -1,6 +1,8 @@
+import traceback
 from typing import Optional
 import base64
 import requests
+from pathlib import Path
 
 import asyncio
 from typing import List
@@ -9,11 +11,7 @@ from loguru import logger
 import litellm
 from pydantic import BaseModel
 
-from litellm import completion, acompletion
-
-litellm.set_verbose = True
-litellm.ssl_verify = False
-# litellm._turn_on_debug()
+from litellm import completion, acompletion, supports_vision
 
 
 class LiteLLMException(Exception):
@@ -53,6 +51,35 @@ def get_audio_base64(audio_source: str) -> str:
     return encoded_string
 
 
+def get_image_base64(image_source: str) -> str:
+    """
+    Convert image from a given source to a base64 encoded string.
+    Handles URLs, local file paths, and data URIs.
+    """
+    # If already a data URI, return as is
+    if image_source.startswith("data:image"):
+        return image_source
+
+    # Handle URL
+    if image_source.startswith(("http://", "https://")):
+        response = requests.get(image_source)
+        response.raise_for_status()
+        image_data = response.content
+    # Handle local file
+    else:
+        with open(image_source, "rb") as file:
+            image_data = file.read()
+
+    # Get file extension for mime type
+    extension = Path(image_source).suffix.lower()
+    mime_type = (
+        f"image/{extension[1:]}" if extension else "image/jpeg"
+    )
+
+    encoded_string = base64.b64encode(image_data).decode("utf-8")
+    return f"data:{mime_type};base64,{encoded_string}"
+
+
 class LiteLLM:
     """
     This class represents a LiteLLM.
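A quick aside between hunks: the new get_image_base64 helper normalizes any image reference (data URI, URL, or local path) into a data URI. A minimal usage sketch, assuming only the module path shown in the files-changed list; the file path and URL below are placeholders, not files shipped with the package:

```python
# Hypothetical usage of the helper added above; the path and URL are
# placeholders, not part of the package.
from swarms.utils.litellm_wrapper import get_image_base64

# A local file is read and wrapped as a data URI, with the mime type
# guessed from the extension (falling back to image/jpeg).
local_uri = get_image_base64("examples/photo.png")

# An http(s) URL is downloaded first, then encoded the same way.
remote_uri = get_image_base64("https://example.com/diagram.jpg")

# A string that is already a data URI is returned unchanged.
assert get_image_base64(local_uri) == local_uri
```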
@@ -72,12 +99,15 @@ class LiteLLM:
         tool_choice: str = "auto",
         parallel_tool_calls: bool = False,
         audio: str = None,
-        retries: int = 3,
+        retries: int = 0,
         verbose: bool = False,
         caching: bool = False,
         mcp_call: bool = False,
         top_p: float = 1.0,
         functions: List[dict] = None,
+        return_all: bool = False,
+        base_url: str = None,
+        api_key: str = None,
         *args,
         **kwargs,
     ):
@@ -105,8 +135,11 @@ class LiteLLM:
         self.mcp_call = mcp_call
         self.top_p = top_p
         self.functions = functions
+        self.audio = audio
+        self.return_all = return_all
+        self.base_url = base_url
+        self.api_key = api_key
         self.modalities = []
-        self._cached_messages = {}  # Cache for prepared messages
         self.messages = []  # Initialize messages list
 
         # Configure litellm settings
@@ -135,7 +168,11 @@ class LiteLLM:
             out = out.model_dump()
         return out
 
-    def _prepare_messages(self, task: str) -> list:
+    def _prepare_messages(
+        self,
+        task: str,
+        img: str = None,
+    ):
         """
         Prepare the messages for the given task.
 
@@ -145,91 +182,201 @@
         Returns:
             list: A list of messages prepared for the task.
         """
-        # Check cache first
-        cache_key = f"{self.system_prompt}:{task}"
-        if cache_key in self._cached_messages:
-            return self._cached_messages[cache_key].copy()
+        self.check_if_model_supports_vision(img=img)
 
+        # Initialize messages
         messages = []
-        if self.system_prompt:
+
+        # Add system prompt if present
+        if self.system_prompt is not None:
             messages.append(
                 {"role": "system", "content": self.system_prompt}
             )
-        messages.append({"role": "user", "content": task})
 
-        # Cache the prepared messages
-        self._cached_messages[cache_key] = messages.copy()
+        # Handle vision case
+        if img is not None:
+            messages = self.vision_processing(
+                task=task, image=img, messages=messages
+            )
+        else:
+            messages.append({"role": "user", "content": task})
+
         return messages
 
-    def audio_processing(self, task: str, audio: str):
+    def anthropic_vision_processing(
+        self, task: str, image: str, messages: list
+    ) -> list:
         """
-        Process the audio for the given task.
-
-        Args:
-            task (str): The task to be processed.
-            audio (str): The path or identifier for the audio file.
+        Process vision input specifically for Anthropic models.
+        Handles Anthropic's specific image format requirements.
         """
-        self.modalities.append("audio")
-
-        encoded_string = get_audio_base64(audio)
+        # Get base64 encoded image
+        image_url = get_image_base64(image)
+
+        # Extract mime type from the data URI or use default
+        mime_type = "image/jpeg"  # default
+        if "data:" in image_url and ";base64," in image_url:
+            mime_type = image_url.split(";base64,")[0].split("data:")[
+                1
+            ]
+
+        # Ensure mime type is one of the supported formats
+        supported_formats = [
+            "image/jpeg",
+            "image/png",
+            "image/gif",
+            "image/webp",
+        ]
+        if mime_type not in supported_formats:
+            mime_type = (
+                "image/jpeg"  # fallback to jpeg if unsupported
+            )
 
-        # Append messages
-        self.messages.append(
+        # Construct Anthropic vision message
+        messages.append(
             {
                 "role": "user",
                 "content": [
                     {"type": "text", "text": task},
                     {
-                        "type": "input_audio",
-                        "input_audio": {
-                            "data": encoded_string,
-                            "format": "wav",
+                        "type": "image_url",
+                        "image_url": {
+                            "url": image_url,
+                            "format": mime_type,
                         },
                     },
                 ],
             }
         )
 
-    def vision_processing(self, task: str, image: str):
+        return messages
+
+    def openai_vision_processing(
+        self, task: str, image: str, messages: list
+    ) -> list:
+        """
+        Process vision input specifically for OpenAI models.
+        Handles OpenAI's specific image format requirements.
+        """
+        # Get base64 encoded image with proper format
+        image_url = get_image_base64(image)
+
+        # Prepare vision message
+        vision_message = {
+            "type": "image_url",
+            "image_url": {"url": image_url},
+        }
+
+        # Add format for specific models
+        extension = Path(image).suffix.lower()
+        mime_type = (
+            f"image/{extension[1:]}" if extension else "image/jpeg"
+        )
+        vision_message["image_url"]["format"] = mime_type
+
+        # Append vision message
+        messages.append(
+            {
+                "role": "user",
+                "content": [
+                    {"type": "text", "text": task},
+                    vision_message,
+                ],
+            }
+        )
+
+        return messages
+
+    def vision_processing(
+        self, task: str, image: str, messages: Optional[list] = None
+    ):
         """
         Process the image for the given task.
+        Handles different image formats and model requirements.
+        """
+        # # # Handle Anthropic models separately
+        # # if "anthropic" in self.model_name.lower() or "claude" in self.model_name.lower():
+        # #     messages = self.anthropic_vision_processing(task, image, messages)
+        # #     return messages
+
+        # # Get base64 encoded image with proper format
+        # image_url = get_image_base64(image)
+
+        # # Prepare vision message
+        # vision_message = {
+        #     "type": "image_url",
+        #     "image_url": {"url": image_url},
+        # }
+
+        # # Add format for specific models
+        # extension = Path(image).suffix.lower()
+        # mime_type = f"image/{extension[1:]}" if extension else "image/jpeg"
+        # vision_message["image_url"]["format"] = mime_type
+
+        # # Append vision message
+        # messages.append(
+        #     {
+        #         "role": "user",
+        #         "content": [
+        #             {"type": "text", "text": task},
+        #             vision_message,
+        #         ],
+        #     }
+        # )
+
+        # return messages
+        if (
+            "anthropic" in self.model_name.lower()
+            or "claude" in self.model_name.lower()
+        ):
+            messages = self.anthropic_vision_processing(
+                task, image, messages
+            )
+            return messages
+        else:
+            messages = self.openai_vision_processing(
+                task, image, messages
+            )
+            return messages
+
+    def audio_processing(self, task: str, audio: str):
         """
-        self.modalities.append("vision")
+        Process the audio for the given task.
 
-        # Append messages
+        Args:
+            task (str): The task to be processed.
+            audio (str): The path or identifier for the audio file.
+        """
+        encoded_string = get_audio_base64(audio)
+
+        # Append audio message
         self.messages.append(
             {
                 "role": "user",
                 "content": [
                     {"type": "text", "text": task},
                     {
-                        "type": "image_url",
-                        "image_url": {
-                            "url": image,
-                            # "detail": "high"
-                            # "format": "image",
+                        "type": "input_audio",
+                        "input_audio": {
+                            "data": encoded_string,
+                            "format": "wav",
                         },
                     },
                 ],
             }
         )
 
-    def handle_modalities(
-        self, task: str, audio: str = None, img: str = None
-    ):
+    def check_if_model_supports_vision(self, img: str = None):
         """
-        Handle the modalities for the given task.
+        Check if the model supports vision.
         """
-        self.messages = []  # Reset messages
-        self.modalities.append("text")
-
-        if audio is not None:
-            self.audio_processing(task=task, audio=audio)
-            self.modalities.append("audio")
-
         if img is not None:
-            self.vision_processing(task=task, image=img)
-            self.modalities.append("vision")
+            out = supports_vision(model=self.model_name)
+
+            if out is False:
+                raise ValueError(
+                    f"Model {self.model_name} does not support vision"
+                )
 
     def run(
         self,
@@ -256,13 +403,7 @@
             Exception: If there is an error in processing the request.
         """
         try:
-            messages = self._prepare_messages(task)
-
-            if audio is not None or img is not None:
-                self.handle_modalities(
-                    task=task, audio=audio, img=img
-                )
-                messages = self.messages
+            messages = self._prepare_messages(task=task, img=img)
 
             # Base completion parameters
             completion_params = {
@@ -298,6 +439,9 @@
                     {"functions": self.functions}
                 )
 
+            if self.base_url is not None:
+                completion_params["base_url"] = self.base_url
+
             # Add modalities if needed
             if self.modalities and len(self.modalities) >= 2:
                 completion_params["modalities"] = self.modalities
@@ -308,12 +452,16 @@
             # Handle tool-based response
             if self.tools_list_dictionary is not None:
                 return self.output_for_tools(response)
+            elif self.return_all is True:
+                return response.model_dump()
             else:
                 # Return standard response content
                 return response.choices[0].message.content
 
         except LiteLLMException as error:
-            logger.error(f"Error in LiteLLM run: {str(error)}")
+            logger.error(
+                f"Error in LiteLLM run: {str(error)} Traceback: {traceback.format_exc()}"
+            )
             if "rate_limit" in str(error).lower():
                 logger.warning(
                     "Rate limit hit, retrying with exponential backoff..."
swarms/utils/output_types.py ADDED
@@ -0,0 +1,24 @@
+from typing import Literal
+
+HistoryOutputType = Literal[
+    "list",
+    "dict",
+    "dictionary",
+    "string",
+    "str",
+    "final",
+    "last",
+    "json",
+    "all",
+    "yaml",
+    "xml",
+    # "dict-final",
+    "dict-all-except-first",
+    "str-all-except-first",
+    "basemodel",
+    "dict-final",
+]
+
+OutputType = HistoryOutputType
+
+output_type: HistoryOutputType  # OutputType now includes 'xml'
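This new module centralizes the literal values accepted for conversation-history formatting. A hedged sketch of using the alias as a type hint; the format_history function below is illustrative only, not part of the package:

```python
# Illustrative consumer of the new alias; format_history is hypothetical.
from swarms.utils.output_types import HistoryOutputType


def format_history(history: list, output_type: HistoryOutputType = "dict"):
    """Toy dispatcher keyed on the same literals the package accepts."""
    if output_type in ("dict", "dictionary", "list"):
        return history
    if output_type in ("str", "string"):
        return "\n".join(str(message) for message in history)
    # "final", "last", "json", "yaml", "xml", ... are handled elsewhere in
    # the package (see history_output_formatter in the files-changed list).
    raise NotImplementedError(output_type)
```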
swarms/utils/vllm_wrapper.py CHANGED
@@ -1,3 +1,5 @@
+import os
+import concurrent.futures
 from typing import List, Optional, Dict, Any
 from loguru import logger
 
@@ -131,16 +133,15 @@
         Returns:
             List[str]: List of model responses.
         """
-        logger.info(
-            f"Running tasks in batches of size {batch_size}. Total tasks: {len(tasks)}"
-        )
-        results = []
-
-        for i in range(0, len(tasks), batch_size):
-            batch = tasks[i : i + batch_size]
-            for task in batch:
-                logger.info(f"Running task: {task}")
-                results.append(self.run(task))
-
-        logger.info("Completed all tasks.")
-        return results
+        # Calculate the worker count based on 95% of available CPU cores
+        num_workers = max(1, int((os.cpu_count() or 1) * 0.95))
+        with concurrent.futures.ThreadPoolExecutor(
+            max_workers=num_workers
+        ) as executor:
+            futures = [
+                executor.submit(self.run, task) for task in tasks
+            ]
+            return [
+                future.result()
+                for future in concurrent.futures.as_completed(futures)
+            ]
swarms/utils/xml_utils.py CHANGED
@@ -3,7 +3,22 @@ from typing import Any
 
 
 def dict_to_xml(tag: str, d: dict) -> ET.Element:
-    """Convert a dictionary to an XML Element."""
+    """
+    Convert a dictionary to an XML Element.
+
+    Args:
+        tag (str): The tag name for the root element
+        d (dict): The dictionary to convert to XML
+
+    Returns:
+        ET.Element: An XML Element representing the dictionary structure
+
+    Example:
+        >>> data = {"person": {"name": "John", "age": 30}}
+        >>> elem = dict_to_xml("root", data)
+        >>> ET.tostring(elem, encoding="unicode")
+        '<root><person><name>John</name><age>30</age></person></root>'
+    """
     elem = ET.Element(tag)
     for key, val in d.items():
         child = ET.Element(str(key))
@@ -24,7 +39,27 @@
 
 
 def to_xml_string(data: Any, root_tag: str = "root") -> str:
-    """Convert a dict or list to an XML string."""
+    """
+    Convert a dict or list to an XML string.
+
+    Args:
+        data (Any): The data to convert to XML. Can be a dictionary, list, or other value
+        root_tag (str, optional): The tag name for the root element. Defaults to "root"
+
+    Returns:
+        str: An XML string representation of the input data
+
+    Example:
+        >>> data = {"person": {"name": "John", "age": 30}}
+        >>> xml_str = to_xml_string(data)
+        >>> print(xml_str)
+        <root><person><name>John</name><age>30</age></person></root>
+
+        >>> data = [1, 2, 3]
+        >>> xml_str = to_xml_string(data)
+        >>> print(xml_str)
+        <root><item>1</item><item>2</item><item>3</item></root>
+    """
     if isinstance(data, dict):
         elem = dict_to_xml(root_tag, data)
     elif isinstance(data, list):