autobyteus 1.1.5__py3-none-any.whl → 1.1.7__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (103)
  1. autobyteus/agent/context/agent_config.py +6 -1
  2. autobyteus/agent/context/agent_runtime_state.py +7 -1
  3. autobyteus/agent/handlers/llm_user_message_ready_event_handler.py +30 -7
  4. autobyteus/agent/handlers/tool_result_event_handler.py +100 -88
  5. autobyteus/agent/handlers/user_input_message_event_handler.py +22 -25
  6. autobyteus/agent/llm_response_processor/provider_aware_tool_usage_processor.py +7 -1
  7. autobyteus/agent/message/__init__.py +7 -5
  8. autobyteus/agent/message/agent_input_user_message.py +6 -16
  9. autobyteus/agent/message/context_file.py +24 -24
  10. autobyteus/agent/message/context_file_type.py +29 -8
  11. autobyteus/agent/message/multimodal_message_builder.py +47 -0
  12. autobyteus/agent/streaming/stream_event_payloads.py +23 -4
  13. autobyteus/agent/system_prompt_processor/tool_manifest_injector_processor.py +6 -2
  14. autobyteus/agent/tool_invocation.py +27 -2
  15. autobyteus/agent_team/agent_team_builder.py +22 -1
  16. autobyteus/agent_team/bootstrap_steps/agent_configuration_preparation_step.py +9 -2
  17. autobyteus/agent_team/context/agent_team_config.py +1 -0
  18. autobyteus/agent_team/context/agent_team_runtime_state.py +0 -2
  19. autobyteus/llm/api/autobyteus_llm.py +33 -33
  20. autobyteus/llm/api/bedrock_llm.py +13 -5
  21. autobyteus/llm/api/claude_llm.py +13 -27
  22. autobyteus/llm/api/gemini_llm.py +108 -42
  23. autobyteus/llm/api/groq_llm.py +4 -3
  24. autobyteus/llm/api/mistral_llm.py +97 -51
  25. autobyteus/llm/api/nvidia_llm.py +6 -5
  26. autobyteus/llm/api/ollama_llm.py +37 -12
  27. autobyteus/llm/api/openai_compatible_llm.py +91 -91
  28. autobyteus/llm/autobyteus_provider.py +1 -1
  29. autobyteus/llm/base_llm.py +42 -139
  30. autobyteus/llm/extensions/base_extension.py +6 -6
  31. autobyteus/llm/extensions/token_usage_tracking_extension.py +3 -2
  32. autobyteus/llm/llm_factory.py +131 -61
  33. autobyteus/llm/ollama_provider_resolver.py +1 -0
  34. autobyteus/llm/providers.py +1 -0
  35. autobyteus/llm/token_counter/token_counter_factory.py +3 -1
  36. autobyteus/llm/user_message.py +43 -35
  37. autobyteus/llm/utils/llm_config.py +34 -18
  38. autobyteus/llm/utils/media_payload_formatter.py +99 -0
  39. autobyteus/llm/utils/messages.py +32 -25
  40. autobyteus/llm/utils/response_types.py +9 -3
  41. autobyteus/llm/utils/token_usage.py +6 -5
  42. autobyteus/multimedia/__init__.py +31 -0
  43. autobyteus/multimedia/audio/__init__.py +11 -0
  44. autobyteus/multimedia/audio/api/__init__.py +4 -0
  45. autobyteus/multimedia/audio/api/autobyteus_audio_client.py +59 -0
  46. autobyteus/multimedia/audio/api/gemini_audio_client.py +219 -0
  47. autobyteus/multimedia/audio/audio_client_factory.py +120 -0
  48. autobyteus/multimedia/audio/audio_model.py +97 -0
  49. autobyteus/multimedia/audio/autobyteus_audio_provider.py +108 -0
  50. autobyteus/multimedia/audio/base_audio_client.py +40 -0
  51. autobyteus/multimedia/image/__init__.py +11 -0
  52. autobyteus/multimedia/image/api/__init__.py +9 -0
  53. autobyteus/multimedia/image/api/autobyteus_image_client.py +97 -0
  54. autobyteus/multimedia/image/api/gemini_image_client.py +188 -0
  55. autobyteus/multimedia/image/api/openai_image_client.py +142 -0
  56. autobyteus/multimedia/image/autobyteus_image_provider.py +109 -0
  57. autobyteus/multimedia/image/base_image_client.py +67 -0
  58. autobyteus/multimedia/image/image_client_factory.py +118 -0
  59. autobyteus/multimedia/image/image_model.py +97 -0
  60. autobyteus/multimedia/providers.py +5 -0
  61. autobyteus/multimedia/runtimes.py +8 -0
  62. autobyteus/multimedia/utils/__init__.py +10 -0
  63. autobyteus/multimedia/utils/api_utils.py +19 -0
  64. autobyteus/multimedia/utils/multimedia_config.py +29 -0
  65. autobyteus/multimedia/utils/response_types.py +13 -0
  66. autobyteus/task_management/tools/publish_task_plan.py +4 -16
  67. autobyteus/task_management/tools/update_task_status.py +4 -19
  68. autobyteus/tools/__init__.py +5 -4
  69. autobyteus/tools/base_tool.py +98 -29
  70. autobyteus/tools/browser/standalone/__init__.py +0 -1
  71. autobyteus/tools/google_search.py +149 -0
  72. autobyteus/tools/mcp/schema_mapper.py +29 -71
  73. autobyteus/tools/multimedia/__init__.py +8 -0
  74. autobyteus/tools/multimedia/audio_tools.py +116 -0
  75. autobyteus/tools/multimedia/image_tools.py +186 -0
  76. autobyteus/tools/parameter_schema.py +82 -89
  77. autobyteus/tools/pydantic_schema_converter.py +81 -0
  78. autobyteus/tools/tool_category.py +1 -0
  79. autobyteus/tools/usage/formatters/default_json_example_formatter.py +89 -20
  80. autobyteus/tools/usage/formatters/default_xml_example_formatter.py +115 -41
  81. autobyteus/tools/usage/formatters/default_xml_schema_formatter.py +50 -20
  82. autobyteus/tools/usage/formatters/gemini_json_example_formatter.py +55 -22
  83. autobyteus/tools/usage/formatters/google_json_example_formatter.py +54 -21
  84. autobyteus/tools/usage/formatters/openai_json_example_formatter.py +53 -23
  85. autobyteus/tools/usage/parsers/default_xml_tool_usage_parser.py +270 -94
  86. autobyteus/tools/usage/parsers/provider_aware_tool_usage_parser.py +5 -2
  87. autobyteus/tools/usage/providers/tool_manifest_provider.py +43 -16
  88. autobyteus/tools/usage/registries/tool_formatting_registry.py +9 -2
  89. autobyteus/tools/usage/registries/tool_usage_parser_registry.py +9 -2
  90. autobyteus-1.1.7.dist-info/METADATA +204 -0
  91. {autobyteus-1.1.5.dist-info → autobyteus-1.1.7.dist-info}/RECORD +98 -71
  92. examples/run_browser_agent.py +1 -1
  93. examples/run_google_slides_agent.py +2 -2
  94. examples/run_mcp_google_slides_client.py +1 -1
  95. examples/run_sqlite_agent.py +1 -1
  96. autobyteus/llm/utils/image_payload_formatter.py +0 -89
  97. autobyteus/tools/ask_user_input.py +0 -40
  98. autobyteus/tools/browser/standalone/factory/google_search_factory.py +0 -25
  99. autobyteus/tools/browser/standalone/google_search_ui.py +0 -126
  100. autobyteus-1.1.5.dist-info/METADATA +0 -161
  101. {autobyteus-1.1.5.dist-info → autobyteus-1.1.7.dist-info}/WHEEL +0 -0
  102. {autobyteus-1.1.5.dist-info → autobyteus-1.1.7.dist-info}/licenses/LICENSE +0 -0
  103. {autobyteus-1.1.5.dist-info → autobyteus-1.1.7.dist-info}/top_level.txt +0 -0
autobyteus/agent/message/context_file.py

@@ -3,6 +3,7 @@ import os
 import logging
 from typing import Optional, Dict, Any
 from dataclasses import dataclass, field
+from urllib.parse import urlparse
 
 from .context_file_type import ContextFileType
 
@@ -12,10 +13,9 @@ logger = logging.getLogger(__name__)
 class ContextFile:
     """
     Represents a single context file provided to an agent.
-    This is a simple dataclass, deferring path validation and file access
-    to input processors.
+    The 'uri' can be a local file path or a network URL.
     """
-    path: str
+    uri: str
     file_type: ContextFileType = ContextFileType.UNKNOWN
     file_name: Optional[str] = None
     metadata: Dict[str, Any] = field(default_factory=dict)
@@ -25,33 +25,33 @@ class ContextFile:
         Called after the dataclass's __init__ method.
         Used here to infer file_name and file_type if not provided or UNKNOWN.
         """
-        if self.file_name is None and self.path:
+        if not isinstance(self.uri, str) or not self.uri:
+            raise TypeError(f"ContextFile uri must be a non-empty string, got {type(self.uri)}")
+
+        if self.file_name is None:
             try:
-                self.file_name = os.path.basename(self.path)
+                # Use urlparse to correctly handle both URLs and local paths
+                parsed_path = urlparse(self.uri).path
+                self.file_name = os.path.basename(parsed_path)
             except Exception as e:
-                logger.warning(f"Could not determine basename for path '{self.path}': {e}")
+                logger.warning(f"Could not determine basename for uri '{self.uri}': {e}")
                 self.file_name = "unknown_file"
 
-        if self.file_type == ContextFileType.UNKNOWN and self.path:
-            inferred_type = ContextFileType.from_path(self.path)
+        if self.file_type == ContextFileType.UNKNOWN:
+            inferred_type = ContextFileType.from_path(self.uri)
             if inferred_type != ContextFileType.UNKNOWN:
                 self.file_type = inferred_type
-                logger.debug(f"Inferred file type for '{self.path}' as {self.file_type.value}")
+                logger.debug(f"Inferred file type for '{self.uri}' as {self.file_type.value}")
             else:
-                logger.debug(f"Could not infer specific file type for '{self.path}', remaining UNKNOWN.")
-
-        # Ensure path is a string
-        if not isinstance(self.path, str):
-            # This ideally should be caught by type hints earlier, but as a runtime safeguard:
-            raise TypeError(f"ContextFile path must be a string, got {type(self.path)}")
-
+                logger.debug(f"Could not infer specific file type for '{self.uri}', remaining UNKNOWN.")
+
         if logger.isEnabledFor(logging.DEBUG):
-            logger.debug(f"ContextFile initialized: path='{self.path}', type='{self.file_type.value}', name='{self.file_name}'")
+            logger.debug(f"ContextFile initialized: uri='{self.uri}', type='{self.file_type.value}', name='{self.file_name}'")
 
     def to_dict(self) -> Dict[str, Any]:
         """Serializes the ContextFile to a dictionary."""
         return {
-            "path": self.path,
+            "uri": self.uri,
             "file_type": self.file_type.value,  # Serialize enum to its value
             "file_name": self.file_name,
             "metadata": self.metadata,
@@ -60,23 +60,23 @@ class ContextFile:
     @classmethod
     def from_dict(cls, data: Dict[str, Any]) -> 'ContextFile':
         """Deserializes a ContextFile from a dictionary."""
-        if not isinstance(data.get("path"), str):
-            raise ValueError("ContextFile 'path' in dictionary must be a string.")
-
+        if not isinstance(data.get("uri"), str):
+            raise ValueError("ContextFile 'uri' in dictionary must be a string.")
+
         file_type_str = data.get("file_type", ContextFileType.UNKNOWN.value)
         try:
            file_type = ContextFileType(file_type_str)
         except ValueError:
             logger.warning(f"Invalid file_type string '{file_type_str}' in ContextFile data. Defaulting to UNKNOWN.")
             file_type = ContextFileType.UNKNOWN
-
+
         return cls(
-            path=data["path"],
+            uri=data["uri"],
            file_type=file_type,
            file_name=data.get("file_name"),
            metadata=data.get("metadata", {})
         )
 
     def __repr__(self) -> str:
-        return (f"ContextFile(path='{self.path}', file_name='{self.file_name}', "
+        return (f"ContextFile(uri='{self.uri}', file_name='{self.file_name}', "
                 f"file_type='{self.file_type.value}', metadata_keys={list(self.metadata.keys())})")
autobyteus/agent/message/context_file_type.py

@@ -1,5 +1,6 @@
 from enum import Enum
 import os
+from urllib.parse import urlparse
 
 class ContextFileType(str, Enum):
     """
@@ -23,19 +24,25 @@ class ContextFileType(str, Enum):
     UNKNOWN = "unknown"  # Fallback for unrecognized types
 
     @classmethod
-    def from_path(cls, file_path: str) -> 'ContextFileType':
+    def from_path(cls, uri: str) -> 'ContextFileType':
         """
-        Infers the ContextFileType from a file path based on its extension.
+        Infers the ContextFileType from a file path or URL based on its extension.
         """
-        if not file_path or not isinstance(file_path, str):
+        if not uri or not isinstance(uri, str):
             return cls.UNKNOWN
-
-        _, extension = os.path.splitext(file_path.lower())
-
+
+        try:
+            # Parse the URI to handle both file paths and URLs gracefully
+            parsed_path = urlparse(uri).path
+            _, extension = os.path.splitext(parsed_path.lower())
+        except Exception:
+            # Fallback for malformed URIs
+            _, extension = os.path.splitext(uri.lower())
+
         if extension == ".txt":
             return cls.TEXT
         elif extension == ".md":
-            return cls.MARKDOWN
+            return cls.MARKDOWN
         elif extension == ".pdf":
             return cls.PDF
         elif extension == ".docx":
@@ -61,9 +68,23 @@ class ContextFileType(str, Enum):
         elif extension in [".mp4", ".mov", ".avi", ".mkv", ".webm"]:
             return cls.VIDEO
         elif extension in [".png", ".jpg", ".jpeg", ".gif", ".webp"]:
-            return cls.IMAGE
+            return cls.IMAGE
         else:
             return cls.UNKNOWN
 
+    @classmethod
+    def get_readable_text_types(cls) -> list['ContextFileType']:
+        """Returns a list of file types that can be read as plain text for context."""
+        return [
+            cls.TEXT,
+            cls.MARKDOWN,
+            cls.JSON,
+            cls.XML,
+            cls.HTML,
+            cls.PYTHON,
+            cls.JAVASCRIPT,
+            cls.CSV,
+        ]
+
     def __str__(self) -> str:
         return self.value
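
Editor's note: the practical effect of the urlparse change is that the extension is now taken from the URL path, so query strings and fragments no longer defeat type inference. A minimal standalone sketch of the same extraction logic (mirroring the diff rather than importing autobyteus):

    import os
    from urllib.parse import urlparse

    def infer_extension(uri: str) -> str:
        # urlparse(...).path drops query strings and fragments from URLs,
        # and passes plain local paths through unchanged.
        try:
            parsed_path = urlparse(uri).path
            _, extension = os.path.splitext(parsed_path.lower())
        except Exception:
            _, extension = os.path.splitext(uri.lower())
        return extension

    assert infer_extension("/tmp/report.PDF") == ".pdf"
    assert infer_extension("https://example.com/a/photo.jpg?size=large") == ".jpg"
    assert infer_extension("notes.md#section-2") == ".md"

Under 1.1.5, splitext on the raw string would have produced ".jpg?size=large" for the second case and fallen through to UNKNOWN.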
autobyteus/agent/message/multimodal_message_builder.py (new file)

@@ -0,0 +1,47 @@
+# file: autobyteus/autobyteus/agent/message/multimodal_message_builder.py
+import logging
+
+from autobyteus.agent.message.agent_input_user_message import AgentInputUserMessage
+from autobyteus.agent.message.context_file_type import ContextFileType
+from autobyteus.llm.user_message import LLMUserMessage
+
+logger = logging.getLogger(__name__)
+
+def build_llm_user_message(agent_input_user_message: AgentInputUserMessage) -> LLMUserMessage:
+    """
+    Builds an LLMUserMessage from an AgentInputUserMessage by categorizing its context files.
+
+    This function iterates through the context files, sorting URIs for images, audio, and video
+    into the appropriate fields of the LLMUserMessage. It ignores other file types for now.
+
+    Args:
+        agent_input_user_message: The user input message containing content and context files.
+
+    Returns:
+        An LLMUserMessage ready to be sent to the LLM.
+    """
+    image_urls = []
+    audio_urls = []
+    video_urls = []
+
+    if agent_input_user_message.context_files:
+        for context_file in agent_input_user_message.context_files:
+            file_type = context_file.file_type
+            if file_type == ContextFileType.IMAGE:
+                image_urls.append(context_file.uri)
+            elif file_type == ContextFileType.AUDIO:
+                audio_urls.append(context_file.uri)
+            elif file_type == ContextFileType.VIDEO:
+                video_urls.append(context_file.uri)
+            else:
+                logger.debug(f"Ignoring non-media context file of type '{file_type.value}' during LLM message build: {context_file.uri}")
+
+    llm_user_message = LLMUserMessage(
+        content=agent_input_user_message.content,
+        image_urls=image_urls if image_urls else None,
+        audio_urls=audio_urls if audio_urls else None,
+        video_urls=video_urls if video_urls else None
+    )
+
+    logger.info(f"Built LLMUserMessage with {len(image_urls)} images, {len(audio_urls)} audio, {len(video_urls)} video files.")
+    return llm_user_message
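
Editor's note: a hedged usage sketch for the new builder. Only the .content and .context_files attributes are confirmed by the code above; the AgentInputUserMessage constructor arguments shown here are assumptions, and the URIs are illustrative.

    from autobyteus.agent.message.agent_input_user_message import AgentInputUserMessage
    from autobyteus.agent.message.context_file import ContextFile
    from autobyteus.agent.message.context_file_type import ContextFileType
    from autobyteus.agent.message.multimodal_message_builder import build_llm_user_message

    # Media files are routed into the matching LLMUserMessage fields; anything
    # else (e.g. the markdown file) is skipped with a debug log.
    message = AgentInputUserMessage(
        content="Summarize the attached photo and recording.",
        context_files=[
            ContextFile(uri="https://example.com/photo.png"),   # inferred as IMAGE
            ContextFile(uri="/data/call.mp3", file_type=ContextFileType.AUDIO),
            ContextFile(uri="/data/notes.md"),                  # non-media: ignored
        ],
    )
    llm_message = build_llm_user_message(message)
    # llm_message.image_urls == ["https://example.com/photo.png"]
    # llm_message.audio_urls == ["/data/call.mp3"]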
autobyteus/agent/streaming/stream_event_payloads.py

@@ -20,12 +20,18 @@ class AssistantChunkData(BaseStreamPayload):
     reasoning: Optional[str] = None
     is_complete: bool
     usage: Optional[TokenUsage] = None
+    image_urls: Optional[List[str]] = None
+    audio_urls: Optional[List[str]] = None
+    video_urls: Optional[List[str]] = None
 
 
 class AssistantCompleteResponseData(BaseStreamPayload):
     content: str
     reasoning: Optional[str] = None
     usage: Optional[TokenUsage] = None
+    image_urls: Optional[List[str]] = None
+    audio_urls: Optional[List[str]] = None
+    video_urls: Optional[List[str]] = None
 
 class ToolInteractionLogEntryData(BaseStreamPayload):
     log_entry: str
@@ -102,14 +108,20 @@ def create_assistant_chunk_data(chunk_obj: Any) -> AssistantChunkData:
             content=str(getattr(chunk_obj, 'content', '')),
             reasoning=getattr(chunk_obj, 'reasoning', None),
             is_complete=bool(getattr(chunk_obj, 'is_complete', False)),
-            usage=parsed_usage
+            usage=parsed_usage,
+            image_urls=getattr(chunk_obj, 'image_urls', None),
+            audio_urls=getattr(chunk_obj, 'audio_urls', None),
+            video_urls=getattr(chunk_obj, 'video_urls', None)
         )
     elif isinstance(chunk_obj, dict):
         return AssistantChunkData(
             content=str(chunk_obj.get('content', '')),
             reasoning=chunk_obj.get('reasoning', None),
             is_complete=bool(chunk_obj.get('is_complete', False)),
-            usage=parsed_usage
+            usage=parsed_usage,
+            image_urls=chunk_obj.get('image_urls', None),
+            audio_urls=chunk_obj.get('audio_urls', None),
+            video_urls=chunk_obj.get('video_urls', None)
         )
     raise ValueError(f"Cannot create AssistantChunkData from {type(chunk_obj)}")
 
@@ -136,13 +148,19 @@ def create_assistant_complete_response_data(complete_resp_obj: Any) -> AssistantCompleteResponseData:
         return AssistantCompleteResponseData(
             content=str(getattr(complete_resp_obj, 'content', '')),
             reasoning=getattr(complete_resp_obj, 'reasoning', None),
-            usage=parsed_usage
+            usage=parsed_usage,
+            image_urls=getattr(complete_resp_obj, 'image_urls', None),
+            audio_urls=getattr(complete_resp_obj, 'audio_urls', None),
+            video_urls=getattr(complete_resp_obj, 'video_urls', None)
         )
     elif isinstance(complete_resp_obj, dict):
         return AssistantCompleteResponseData(
             content=str(complete_resp_obj.get('content', '')),
             reasoning=complete_resp_obj.get('reasoning', None),
-            usage=parsed_usage
+            usage=parsed_usage,
+            image_urls=complete_resp_obj.get('image_urls', None),
+            audio_urls=complete_resp_obj.get('audio_urls', None),
+            video_urls=complete_resp_obj.get('video_urls', None)
        )
     raise ValueError(f"Cannot create AssistantCompleteResponseData from {type(complete_resp_obj)}")
 
@@ -177,3 +195,4 @@ def create_system_task_notification_data(notification_data_dict: Any) -> SystemTaskNotificationData:
     if isinstance(notification_data_dict, dict):
         return SystemTaskNotificationData(**notification_data_dict)
     raise ValueError(f"Cannot create SystemTaskNotificationData from {type(notification_data_dict)}")
+
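
Editor's note: downstream consumers see the new media fields through the dict branch. A hypothetical call, assuming 1.1.7 and that the usage-parsing prelude (not shown in this hunk) tolerates an absent usage key, as the defaults above suggest:

    from autobyteus.agent.streaming.stream_event_payloads import create_assistant_chunk_data

    chunk = create_assistant_chunk_data({
        "content": "Here is the generated image.",
        "is_complete": True,
        "image_urls": ["https://example.com/generated.png"],
    })
    assert chunk.image_urls == ["https://example.com/generated.png"]
    assert chunk.audio_urls is None  # absent keys fall back to None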
autobyteus/agent/system_prompt_processor/tool_manifest_injector_processor.py

@@ -47,6 +47,9 @@ class ToolManifestInjectorProcessor(BaseSystemPromptProcessor):
         llm_provider = None
         if context.llm_instance and context.llm_instance.model:
             llm_provider = context.llm_instance.model.provider
+
+        # Retrieve the override flag from the agent's configuration.
+        use_xml_tool_format = context.config.use_xml_tool_format
 
         # Generate the manifest string for the 'tools' variable.
         tools_manifest: str
@@ -59,10 +62,11 @@ class ToolManifestInjectorProcessor(BaseSystemPromptProcessor):
         ]
 
         try:
-            # Delegate manifest generation to the provider, which now handles all format logic.
+            # Delegate manifest generation to the provider, passing the override flag.
             tools_manifest = self._manifest_provider.provide(
                 tool_definitions=tool_definitions,
-                provider=llm_provider
+                provider=llm_provider,
+                use_xml_tool_format=use_xml_tool_format
             )
         except Exception as e:
             logger.exception(f"An unexpected error occurred during tool manifest generation for agent '{agent_id}': {e}")
autobyteus/agent/tool_invocation.py

@@ -2,7 +2,14 @@
 import uuid
 import hashlib
 import json
-from typing import Optional, Dict, Any
+import logging
+from typing import Optional, Dict, Any, List, TYPE_CHECKING
+from dataclasses import dataclass, field
+
+if TYPE_CHECKING:
+    from autobyteus.agent.events import ToolResultEvent
+
+logger = logging.getLogger(__name__)
 
 class ToolInvocation:
     def __init__(self, name: Optional[str] = None, arguments: Optional[Dict[str, Any]] = None, id: Optional[str] = None):
@@ -33,11 +40,15 @@ class ToolInvocation:
         """
         # Create a canonical representation of the arguments
         # sort_keys=True ensures that the order of keys doesn't change the hash
-        canonical_args = json.dumps(arguments, sort_keys=True, separators=(',', ':'))
+        # ensure_ascii=False is critical for cross-language compatibility with JS
+        canonical_args = json.dumps(arguments, sort_keys=True, separators=(',', ':'), ensure_ascii=False)
 
         # Create a string to hash
         hash_string = f"{name}:{canonical_args}"
 
+        # --- ADDED LOGGING ---
+        logger.debug(f"Generating tool invocation ID from hash_string: '{hash_string}'")
+
         # Use SHA256 for a robust hash
         sha256_hash = hashlib.sha256(hash_string.encode('utf-8')).hexdigest()
 
@@ -54,3 +65,17 @@ class ToolInvocation:
     def __repr__(self) -> str:
         return (f"ToolInvocation(id='{self.id}', name='{self.name}', "
                 f"arguments={self.arguments})")
+
+
+@dataclass
+class ToolInvocationTurn:
+    """
+    A data class to encapsulate the state of a multi-tool invocation turn.
+    Its existence in the agent's state signifies that a multi-tool turn is active.
+    """
+    invocations: List[ToolInvocation]
+    results: List['ToolResultEvent'] = field(default_factory=list)
+
+    def is_complete(self) -> bool:
+        """Checks if all expected tool results have been collected."""
+        return len(self.results) >= len(self.invocations)
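
Editor's note: the ID scheme is worth seeing end to end. A standalone sketch of the canonicalization shown above, illustrating why sort_keys and ensure_ascii=False matter; only the hashing steps are taken from the diff, and the real class may post-process the digest:

    import hashlib
    import json

    def deterministic_invocation_id(name: str, arguments: dict) -> str:
        # sort_keys=True: key order no longer changes the hash.
        # ensure_ascii=False: non-ASCII arguments hash the same as in JS,
        # where JSON.stringify does not escape them.
        canonical_args = json.dumps(arguments, sort_keys=True,
                                    separators=(',', ':'), ensure_ascii=False)
        hash_string = f"{name}:{canonical_args}"
        return hashlib.sha256(hash_string.encode('utf-8')).hexdigest()

    assert deterministic_invocation_id("search", {"q": "caffè", "n": 3}) == \
           deterministic_invocation_id("search", {"n": 3, "q": "caffè"})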
autobyteus/agent_team/agent_team_builder.py

@@ -45,6 +45,7 @@ class AgentTeamBuilder:
         self._coordinator_config: Optional[AgentConfig] = None
         self._added_node_names: Set[str] = set()
         self._task_notification_mode: TaskNotificationMode = TaskNotificationMode.AGENT_MANUAL_NOTIFICATION
+        self._use_xml_tool_format: Optional[bool] = None
         logger.info(f"AgentTeamBuilder initialized for team: '{self._name}'.")
 
     def add_agent_node(self, agent_config: AgentConfig, dependencies: Optional[List[NodeDefinition]] = None) -> 'AgentTeamBuilder':
@@ -142,6 +143,25 @@ class AgentTeamBuilder:
         logger.debug(f"Task notification mode set to '{mode.value}'.")
         return self
 
+    def set_use_xml_tool_format(self, use_xml: bool) -> 'AgentTeamBuilder':
+        """
+        Sets the team-level override for using XML tool format.
+
+        If set, this will override the setting on all individual agents within the team.
+
+        Args:
+            use_xml: If True, forces the team to use XML format for tool
+                     definitions and parsing.
+
+        Returns:
+            The builder instance for fluent chaining.
+        """
+        if not isinstance(use_xml, bool):
+            raise TypeError("use_xml must be a boolean.")
+        self._use_xml_tool_format = use_xml
+        logger.debug(f"Team-level XML tool format override set to '{use_xml}'.")
+        return self
+
     def build(self) -> AgentTeam:
         """
         Constructs and returns the final AgentTeam instance using the
@@ -175,7 +195,8 @@ class AgentTeamBuilder:
             role=self._role,
             nodes=tuple(final_nodes),
             coordinator_node=coordinator_node_instance,
-            task_notification_mode=self._task_notification_mode
+            task_notification_mode=self._task_notification_mode,
+            use_xml_tool_format=self._use_xml_tool_format
         )
 
         logger.info(f"AgentTeamConfig created successfully. Name: '{team_config.name}'. Total nodes: {len(final_nodes)}. Coordinator: '{coordinator_node_instance.name}'.")
autobyteus/agent_team/bootstrap_steps/agent_configuration_preparation_step.py

@@ -15,8 +15,8 @@ logger = logging.getLogger(__name__)
 class AgentConfigurationPreparationStep(BaseAgentTeamBootstrapStep):
     """
     Bootstrap step to prepare the final, immutable configuration for every
-    agent in the team. It injects team-specific context and applies the final
-    coordinator prompt. It no longer injects tools.
+    agent in the team. It injects team-specific context, applies team-level
+    settings like tool format overrides, and prepares the final coordinator prompt.
     """
     async def execute(self, context: 'AgentTeamContext', phase_manager: 'AgentTeamPhaseManager') -> bool:
         team_id = context.team_id
@@ -44,6 +44,13 @@ class AgentConfigurationPreparationStep(BaseAgentTeamBootstrapStep):
 
             final_config = node_definition.copy()
 
+            # --- Team-level Setting Propagation ---
+            # If the team config specifies a tool format, it overrides any agent-level setting.
+            if context.config.use_xml_tool_format is not None:
+                final_config.use_xml_tool_format = context.config.use_xml_tool_format
+                logger.debug(f"Team '{team_id}': Applied team-level use_xml_tool_format={final_config.use_xml_tool_format} to agent '{unique_name}'.")
+
+
             # --- Shared Context Injection ---
             # The shared context is injected into the initial_custom_data dictionary,
             # which is then used by the AgentFactory to create the AgentRuntimeState.
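
Editor's note: the override is deliberately tri-state. A minimal sketch of the resolution rule applied above (the function name here is illustrative, not the library's):

    from typing import Optional

    def resolve_use_xml(team_override: Optional[bool], agent_setting: bool) -> bool:
        # None means "no team opinion": each agent keeps its own setting.
        return agent_setting if team_override is None else team_override

    assert resolve_use_xml(None, False) is False   # no override: agent wins
    assert resolve_use_xml(True, False) is True    # explicit override: team wins
    assert resolve_use_xml(False, True) is False   # False is an override too, not "unset"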
autobyteus/agent_team/context/agent_team_config.py

@@ -20,6 +20,7 @@ class AgentTeamConfig:
     coordinator_node: TeamNodeConfig
     role: Optional[str] = None
     task_notification_mode: TaskNotificationMode = TaskNotificationMode.AGENT_MANUAL_NOTIFICATION
+    use_xml_tool_format: Optional[bool] = None
 
     def __post_init__(self):
         if not self.name or not isinstance(self.name, str):
autobyteus/agent_team/context/agent_team_runtime_state.py

@@ -14,7 +14,6 @@ if TYPE_CHECKING:
     from autobyteus.agent_team.context.team_manager import TeamManager
     from autobyteus.agent_team.streaming.agent_event_multiplexer import AgentEventMultiplexer
     from autobyteus.task_management.base_task_board import BaseTaskBoard
-    from autobyteus.task_management.artifacts.artifact_manifest import ArtifactManifest
     from autobyteus.agent_team.task_notification.system_event_driven_agent_task_notifier import SystemEventDrivenAgentTaskNotifier
 
 logger = logging.getLogger(__name__)
@@ -40,7 +39,6 @@ class AgentTeamRuntimeState:
 
     # Dynamic planning and artifact state
     task_board: Optional['BaseTaskBoard'] = None
-    artifact_registry: Dict[str, 'ArtifactManifest'] = field(default_factory=dict)
 
     def __post_init__(self):
         if not self.team_id or not isinstance(self.team_id, str):
autobyteus/llm/api/autobyteus_llm.py

@@ -4,6 +4,7 @@ from autobyteus.llm.models import LLMModel
 from autobyteus.llm.utils.llm_config import LLMConfig
 from autobyteus.llm.utils.token_usage import TokenUsage
 from autobyteus.llm.utils.response_types import CompleteResponse, ChunkResponse
+from autobyteus.llm.user_message import LLMUserMessage
 from autobyteus_llm_client.client import AutobyteusClient
 import logging
 import uuid
@@ -12,36 +13,35 @@ logger = logging.getLogger(__name__)
 
 class AutobyteusLLM(BaseLLM):
     def __init__(self, model: LLMModel, llm_config: LLMConfig):
-        # The host URL is now passed via the model object.
         if not model.host_url:
             raise ValueError("AutobyteusLLM requires a host_url to be set in its LLMModel object.")
 
         super().__init__(model=model, llm_config=llm_config)
 
-        # Instantiate the client with the specific host for this model.
         self.client = AutobyteusClient(server_url=self.model.host_url)
         self.conversation_id = str(uuid.uuid4())
         logger.info(f"AutobyteusLLM initialized for model '{self.model.model_identifier}' with conversation ID: {self.conversation_id}")
 
     async def _send_user_message_to_llm(
         self,
-        user_message: str,
-        image_urls: Optional[List[str]] = None,
+        user_message: LLMUserMessage,
         **kwargs
     ) -> CompleteResponse:
         self.add_user_message(user_message)
         try:
             response = await self.client.send_message(
                 conversation_id=self.conversation_id,
-                model_name=self.model.name,  # Use `name` as it's the original model name for the API
-                user_message=user_message,
-                image_urls=image_urls
+                model_name=self.model.name,
+                user_message=user_message.content,
+                image_urls=user_message.image_urls,
+                audio_urls=user_message.audio_urls,
+                video_urls=user_message.video_urls
             )
 
             assistant_message = response['response']
             self.add_assistant_message(assistant_message)
 
-            token_usage_data = response.get('token_usage', {})
+            token_usage_data = response.get('token_usage') or {}
             token_usage = TokenUsage(
                 prompt_tokens=token_usage_data.get('prompt_tokens', 0),
                 completion_tokens=token_usage_data.get('completion_tokens', 0),
@@ -59,8 +59,7 @@ class AutobyteusLLM(BaseLLM):
 
     async def _stream_user_message_to_llm(
         self,
-        user_message: str,
-        image_urls: Optional[List[str]] = None,
+        user_message: LLMUserMessage,
         **kwargs
     ) -> AsyncGenerator[ChunkResponse, None]:
         self.add_user_message(user_message)
@@ -69,36 +68,38 @@ class AutobyteusLLM(BaseLLM):
         try:
             async for chunk in self.client.stream_message(
                 conversation_id=self.conversation_id,
-                model_name=self.model.name,  # Use `name` for the API call
-                user_message=user_message,
-                image_urls=image_urls
+                model_name=self.model.name,
+                user_message=user_message.content,
+                image_urls=user_message.image_urls,
+                audio_urls=user_message.audio_urls,
+                video_urls=user_message.video_urls
             ):
                 if 'error' in chunk:
                     raise RuntimeError(chunk['error'])
 
                 content = chunk.get('content', '')
-                complete_response += content
+                if content:
+                    complete_response += content
+
                 is_complete = chunk.get('is_complete', False)
-
-                # If this is the final chunk, include token usage
+                token_usage = None
                 if is_complete:
-                    token_usage = None
-                    if chunk.get('token_usage'):
-                        token_usage = TokenUsage(
-                            prompt_tokens=chunk['token_usage'].get('prompt_tokens', 0),
-                            completion_tokens=chunk['token_usage'].get('completion_tokens', 0),
-                            total_tokens=chunk['token_usage'].get('total_tokens', 0)
-                        )
-                    yield ChunkResponse(
-                        content=content,
-                        is_complete=True,
-                        usage=token_usage
-                    )
-                else:
-                    yield ChunkResponse(
-                        content=content,
-                        is_complete=False
+                    token_usage_data = chunk.get('token_usage') or {}
+                    token_usage = TokenUsage(
+                        prompt_tokens=token_usage_data.get('prompt_tokens', 0),
+                        completion_tokens=token_usage_data.get('completion_tokens', 0),
+                        total_tokens=token_usage_data.get('total_tokens', 0)
                     )
+
+                yield ChunkResponse(
+                    content=content,
+                    reasoning=chunk.get('reasoning'),
+                    is_complete=is_complete,
+                    image_urls=chunk.get('image_urls', []),
+                    audio_urls=chunk.get('audio_urls', []),
+                    video_urls=chunk.get('video_urls', []),
+                    usage=token_usage
+                )
 
             self.add_assistant_message(complete_response)
         except Exception as e:
@@ -116,7 +117,6 @@ class AutobyteusLLM(BaseLLM):
         await self.client.close()
 
     async def _handle_error_cleanup(self):
-        """Handle cleanup operations after errors"""
         try:
             await self.cleanup()
         except Exception as cleanup_error:
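
Editor's note: the token_usage change is subtle but load-bearing. dict.get(key, default) only falls back when the key is absent, not when its value is null/None, so a server response of {"token_usage": null} crashed the 1.1.5 code. A three-line demonstration:

    response = {"response": "hi", "token_usage": None}   # usage present but null
    assert response.get("token_usage", {}) is None       # 1.1.5 form: default not used
    assert (response.get("token_usage") or {}) == {}     # 1.1.7 form: safe to call .get() on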
autobyteus/llm/api/bedrock_llm.py

@@ -9,10 +9,10 @@ from autobyteus.llm.utils.llm_config import LLMConfig
 from autobyteus.llm.utils.messages import MessageRole, Message
 from autobyteus.llm.utils.token_usage import TokenUsage
 from autobyteus.llm.utils.response_types import CompleteResponse, ChunkResponse
+from autobyteus.llm.user_message import LLMUserMessage
 
 class BedrockLLM(BaseLLM):
     def __init__(self, model: LLMModel = None, llm_config: LLMConfig = None):
-        # Provide defaults if not specified
         if model is None:
             model = LLMModel.BEDROCK_CLAUDE_3_5_SONNET_API
         if llm_config is None:
@@ -43,14 +43,17 @@ class BedrockLLM(BaseLLM):
         except Exception as e:
             raise ValueError(f"Failed to initialize Bedrock client: {str(e)}")
 
-    async def _send_user_message_to_llm(self, user_message: str, image_urls: Optional[List[str]] = None, **kwargs) -> CompleteResponse:
+    async def _send_user_message_to_llm(self, user_message: LLMUserMessage, **kwargs) -> CompleteResponse:
         self.add_user_message(user_message)
 
+        # NOTE: This implementation does not yet support multimodal inputs for Bedrock.
+        # It will only send the text content.
+
         request_body = json.dumps({
             "anthropic_version": "bedrock-2023-05-31",
             "max_tokens": 1000,
             "temperature": 0,
-            "messages": [msg.to_dict() for msg in self.messages],
+            "messages": [msg.to_dict() for msg in self.messages if msg.role != MessageRole.SYSTEM],
             "system": self.system_message if self.system_message else ""
         })
 
@@ -79,6 +82,11 @@ class BedrockLLM(BaseLLM):
             raise ValueError(f"Bedrock API error: {error_code} - {error_message}")
         except Exception as e:
             raise ValueError(f"Error in Bedrock API call: {str(e)}")
-
+
+    async def _stream_user_message_to_llm(self, user_message: LLMUserMessage, **kwargs) -> AsyncGenerator[ChunkResponse, None]:
+        # Placeholder for future implementation
+        response = await self._send_user_message_to_llm(user_message, **kwargs)
+        yield ChunkResponse(content=response.content, is_complete=True, usage=response.usage)
+
     async def cleanup(self):
-        super().cleanup()
+        await super().cleanup()
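
Editor's note: the cleanup fix at the end is a classic async pitfall. Calling a coroutine method without await only creates a coroutine object, so the base class teardown never actually runs. A standalone sketch (it assumes BaseLLM.cleanup is async, which the fix itself implies):

    import asyncio

    class Base:
        async def cleanup(self):
            print("base cleanup ran")

    class Broken(Base):
        async def cleanup(self):
            super().cleanup()        # 1.1.5 bug: unawaited coroutine, prints nothing

    class Fixed(Base):
        async def cleanup(self):
            await super().cleanup()  # 1.1.7: base cleanup actually runs

    asyncio.run(Fixed().cleanup())   # -> "base cleanup ran"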