PyPI - autobyteus - Versions diffs - 1.1.5__py3-none-any.whl → 1.1.7__py3-none-any.whl - Mend

autobyteus 1.1.5__py3-none-any.whl → 1.1.7__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (103) hide show

autobyteus/agent/context/agent_config.py +6 -1
autobyteus/agent/context/agent_runtime_state.py +7 -1
autobyteus/agent/handlers/llm_user_message_ready_event_handler.py +30 -7
autobyteus/agent/handlers/tool_result_event_handler.py +100 -88
autobyteus/agent/handlers/user_input_message_event_handler.py +22 -25
autobyteus/agent/llm_response_processor/provider_aware_tool_usage_processor.py +7 -1
autobyteus/agent/message/__init__.py +7 -5
autobyteus/agent/message/agent_input_user_message.py +6 -16
autobyteus/agent/message/context_file.py +24 -24
autobyteus/agent/message/context_file_type.py +29 -8
autobyteus/agent/message/multimodal_message_builder.py +47 -0
autobyteus/agent/streaming/stream_event_payloads.py +23 -4
autobyteus/agent/system_prompt_processor/tool_manifest_injector_processor.py +6 -2
autobyteus/agent/tool_invocation.py +27 -2
autobyteus/agent_team/agent_team_builder.py +22 -1
autobyteus/agent_team/bootstrap_steps/agent_configuration_preparation_step.py +9 -2
autobyteus/agent_team/context/agent_team_config.py +1 -0
autobyteus/agent_team/context/agent_team_runtime_state.py +0 -2
autobyteus/llm/api/autobyteus_llm.py +33 -33
autobyteus/llm/api/bedrock_llm.py +13 -5
autobyteus/llm/api/claude_llm.py +13 -27
autobyteus/llm/api/gemini_llm.py +108 -42
autobyteus/llm/api/groq_llm.py +4 -3
autobyteus/llm/api/mistral_llm.py +97 -51
autobyteus/llm/api/nvidia_llm.py +6 -5
autobyteus/llm/api/ollama_llm.py +37 -12
autobyteus/llm/api/openai_compatible_llm.py +91 -91
autobyteus/llm/autobyteus_provider.py +1 -1
autobyteus/llm/base_llm.py +42 -139
autobyteus/llm/extensions/base_extension.py +6 -6
autobyteus/llm/extensions/token_usage_tracking_extension.py +3 -2
autobyteus/llm/llm_factory.py +131 -61
autobyteus/llm/ollama_provider_resolver.py +1 -0
autobyteus/llm/providers.py +1 -0
autobyteus/llm/token_counter/token_counter_factory.py +3 -1
autobyteus/llm/user_message.py +43 -35
autobyteus/llm/utils/llm_config.py +34 -18
autobyteus/llm/utils/media_payload_formatter.py +99 -0
autobyteus/llm/utils/messages.py +32 -25
autobyteus/llm/utils/response_types.py +9 -3
autobyteus/llm/utils/token_usage.py +6 -5
autobyteus/multimedia/__init__.py +31 -0
autobyteus/multimedia/audio/__init__.py +11 -0
autobyteus/multimedia/audio/api/__init__.py +4 -0
autobyteus/multimedia/audio/api/autobyteus_audio_client.py +59 -0
autobyteus/multimedia/audio/api/gemini_audio_client.py +219 -0
autobyteus/multimedia/audio/audio_client_factory.py +120 -0
autobyteus/multimedia/audio/audio_model.py +97 -0
autobyteus/multimedia/audio/autobyteus_audio_provider.py +108 -0
autobyteus/multimedia/audio/base_audio_client.py +40 -0
autobyteus/multimedia/image/__init__.py +11 -0
autobyteus/multimedia/image/api/__init__.py +9 -0
autobyteus/multimedia/image/api/autobyteus_image_client.py +97 -0
autobyteus/multimedia/image/api/gemini_image_client.py +188 -0
autobyteus/multimedia/image/api/openai_image_client.py +142 -0
autobyteus/multimedia/image/autobyteus_image_provider.py +109 -0
autobyteus/multimedia/image/base_image_client.py +67 -0
autobyteus/multimedia/image/image_client_factory.py +118 -0
autobyteus/multimedia/image/image_model.py +97 -0
autobyteus/multimedia/providers.py +5 -0
autobyteus/multimedia/runtimes.py +8 -0
autobyteus/multimedia/utils/__init__.py +10 -0
autobyteus/multimedia/utils/api_utils.py +19 -0
autobyteus/multimedia/utils/multimedia_config.py +29 -0
autobyteus/multimedia/utils/response_types.py +13 -0
autobyteus/task_management/tools/publish_task_plan.py +4 -16
autobyteus/task_management/tools/update_task_status.py +4 -19
autobyteus/tools/__init__.py +5 -4
autobyteus/tools/base_tool.py +98 -29
autobyteus/tools/browser/standalone/__init__.py +0 -1
autobyteus/tools/google_search.py +149 -0
autobyteus/tools/mcp/schema_mapper.py +29 -71
autobyteus/tools/multimedia/__init__.py +8 -0
autobyteus/tools/multimedia/audio_tools.py +116 -0
autobyteus/tools/multimedia/image_tools.py +186 -0
autobyteus/tools/parameter_schema.py +82 -89
autobyteus/tools/pydantic_schema_converter.py +81 -0
autobyteus/tools/tool_category.py +1 -0
autobyteus/tools/usage/formatters/default_json_example_formatter.py +89 -20
autobyteus/tools/usage/formatters/default_xml_example_formatter.py +115 -41
autobyteus/tools/usage/formatters/default_xml_schema_formatter.py +50 -20
autobyteus/tools/usage/formatters/gemini_json_example_formatter.py +55 -22
autobyteus/tools/usage/formatters/google_json_example_formatter.py +54 -21
autobyteus/tools/usage/formatters/openai_json_example_formatter.py +53 -23
autobyteus/tools/usage/parsers/default_xml_tool_usage_parser.py +270 -94
autobyteus/tools/usage/parsers/provider_aware_tool_usage_parser.py +5 -2
autobyteus/tools/usage/providers/tool_manifest_provider.py +43 -16
autobyteus/tools/usage/registries/tool_formatting_registry.py +9 -2
autobyteus/tools/usage/registries/tool_usage_parser_registry.py +9 -2
autobyteus-1.1.7.dist-info/METADATA +204 -0
{autobyteus-1.1.5.dist-info → autobyteus-1.1.7.dist-info}/RECORD +98 -71
examples/run_browser_agent.py +1 -1
examples/run_google_slides_agent.py +2 -2
examples/run_mcp_google_slides_client.py +1 -1
examples/run_sqlite_agent.py +1 -1
autobyteus/llm/utils/image_payload_formatter.py +0 -89
autobyteus/tools/ask_user_input.py +0 -40
autobyteus/tools/browser/standalone/factory/google_search_factory.py +0 -25
autobyteus/tools/browser/standalone/google_search_ui.py +0 -126
autobyteus-1.1.5.dist-info/METADATA +0 -161
{autobyteus-1.1.5.dist-info → autobyteus-1.1.7.dist-info}/WHEEL +0 -0
{autobyteus-1.1.5.dist-info → autobyteus-1.1.7.dist-info}/licenses/LICENSE +0 -0
{autobyteus-1.1.5.dist-info → autobyteus-1.1.7.dist-info}/top_level.txt +0 -0

autobyteus/tools/usage/formatters/google_json_example_formatter.py CHANGED Viewed

@@ -1,7 +1,8 @@
 # file: autobyteus/autobyteus/tools/usage/formatters/google_json_example_formatter.py
-from typing import Dict, Any, TYPE_CHECKING
+import json
+from typing import Dict, Any, TYPE_CHECKING, Optional
-from autobyteus.tools.parameter_schema import ParameterType, ParameterDefinition
+from autobyteus.tools.parameter_schema import ParameterSchema, ParameterDefinition
 from .base_formatter import BaseExampleFormatter
 # Import for reuse of the intelligent example generation logic
 from .default_json_example_formatter import DefaultJsonExampleFormatter
@@ -10,32 +11,64 @@ if TYPE_CHECKING:
     from autobyteus.tools.registry import ToolDefinition
 class GoogleJsonExampleFormatter(BaseExampleFormatter):
-    """Formats a tool usage example into the Google JSON tool_calls format."""
+    """
+    Formats a tool usage example into the Google JSON tool_calls format.
+    Provides both basic (required only) and advanced (all) examples if optional
+    parameters exist for the tool.
+    """
-    def provide(self, tool_definition: 'ToolDefinition') -> Dict:
+    def provide(self, tool_definition: 'ToolDefinition') -> str:
+        """
+        Generates a formatted string containing basic and optionally an advanced usage example for the tool.
+        """
+        basic_example_dict = self._create_example_structure(tool_definition, mode='basic')
+        basic_example_str = "### Example 1: Basic Call (Required Arguments)\n"
+        basic_example_str += "```json\n"
+        basic_example_str += json.dumps(basic_example_dict, indent=2)
+        basic_example_str += "\n```"
+        if not self._schema_has_advanced_params(tool_definition.argument_schema):
+            return basic_example_str
+        advanced_example_dict = self._create_example_structure(tool_definition, mode='advanced')
+        advanced_example_str = "### Example 2: Advanced Call (With Optional Arguments)\n"
+        advanced_example_str += "```json\n"
+        advanced_example_str += json.dumps(advanced_example_dict, indent=2)
+        advanced_example_str += "\n```"
+        return f"{basic_example_str}\n\n{advanced_example_str}"
+    def _create_example_structure(self, tool_definition: 'ToolDefinition', mode: str) -> Dict:
+        """Helper to create a single Google tool call example for a given mode."""
         tool_name = tool_definition.name
         arg_schema = tool_definition.argument_schema
         arguments = {}
         if arg_schema and arg_schema.parameters:
-            for param_def in arg_schema.parameters:
-                if param_def.required or param_def.default_value is not None:
-                    arguments[param_def.name] = self._generate_placeholder_value(param_def)
+            params_to_render = arg_schema.parameters
+            if mode == 'basic':
+                params_to_render = [p for p in arg_schema.parameters if p.required]
+            for param_def in params_to_render:
+                # Use the intelligent placeholder generator from the default formatter
+                arguments[param_def.name] = DefaultJsonExampleFormatter._generate_example_from_schema(
+                    param_def.object_schema or param_def.array_item_schema or param_def.param_type,
+                    param_def.object_schema or arg_schema,
+                    mode=mode
+                ) if param_def.object_schema or param_def.array_item_schema else self._generate_simple_placeholder(param_def)
         return {"name": tool_name, "args": arguments}
-    def _generate_placeholder_value(self, param_def: ParameterDefinition) -> Any:
-        # REUSE the intelligent generator for complex objects
-        if param_def.param_type == ParameterType.OBJECT and param_def.object_schema:
-            return DefaultJsonExampleFormatter._generate_example_from_schema(param_def.object_schema, param_def.object_schema)
+    def _schema_has_advanced_params(self, schema: Optional[ParameterSchema]) -> bool:
+        """Recursively checks if a schema or any of its sub-schemas have non-required parameters."""
+        if not schema: return False
+        for param in schema.parameters:
+            if not param.required: return True
+            if param.object_schema and self._schema_has_advanced_params(param.object_schema): return True
+            if isinstance(param.array_item_schema, ParameterSchema) and self._schema_has_advanced_params(param.array_item_schema): return True
+        return False
-        # Fallback for primitives
+    def _generate_simple_placeholder(self, param_def: ParameterDefinition) -> Any:
+        """Generates a simple placeholder for primitive types."""
         if param_def.default_value is not None: return param_def.default_value
-        if param_def.param_type == ParameterType.STRING: return f"example_{param_def.name}"
-        if param_def.param_type == ParameterType.INTEGER: return 123
-        if param_def.param_type == ParameterType.FLOAT: return 123.45
-        if param_def.param_type == ParameterType.BOOLEAN: return True
-        if param_def.param_type == ParameterType.ENUM: return param_def.enum_values[0] if param_def.enum_values else "enum_val"
-        if param_def.param_type == ParameterType.OBJECT: return {"key": "value"}
-        if param_def.param_type == ParameterType.ARRAY: return ["item1", "item2"]
-        return "placeholder"
+        return DefaultJsonExampleFormatter._generate_example_from_schema(param_def.param_type, param_def.param_type, mode='basic')

autobyteus/tools/usage/formatters/openai_json_example_formatter.py CHANGED Viewed

@@ -1,8 +1,8 @@
 # file: autobyteus/autobyteus/tools/usage/formatters/openai_json_example_formatter.py
 import json
-from typing import Dict, Any, TYPE_CHECKING
+from typing import Dict, Any, TYPE_CHECKING, Optional
-from autobyteus.tools.parameter_schema import ParameterType, ParameterDefinition
+from autobyteus.tools.parameter_schema import ParameterSchema, ParameterDefinition
 from .base_formatter import BaseExampleFormatter
 from .default_json_example_formatter import DefaultJsonExampleFormatter # Import for reuse
@@ -11,41 +11,71 @@ if TYPE_CHECKING:
 class OpenAiJsonExampleFormatter(BaseExampleFormatter):
     """
-    Formats a tool usage example into a format resembling an entry in the
-    OpenAI JSON 'tool_calls' array, intended for prompting a model.
+    Formats a tool usage example into the OpenAI JSON 'tool_calls' format.
+    Provides both basic (required only) and advanced (all) examples if optional
+    parameters exist for the tool.
     """
+    def provide(self, tool_definition: 'ToolDefinition') -> str:
+        """
+        Generates a formatted string containing basic and optionally an advanced usage example for the tool.
+        """
+        basic_example_dict = self._create_example_structure(tool_definition, mode='basic')
+        basic_example_str = "### Example 1: Basic Call (Required Arguments)\n"
+        basic_example_str += "```json\n"
+        basic_example_str += json.dumps(basic_example_dict, indent=2)
+        basic_example_str += "\n```"
+        if not self._schema_has_advanced_params(tool_definition.argument_schema):
+            return basic_example_str
-    def provide(self, tool_definition: 'ToolDefinition') -> Dict:
+        advanced_example_dict = self._create_example_structure(tool_definition, mode='advanced')
+        advanced_example_str = "### Example 2: Advanced Call (With Optional Arguments)\n"
+        advanced_example_str += "```json\n"
+        advanced_example_str += json.dumps(advanced_example_dict, indent=2)
+        advanced_example_str += "\n```"
+        return f"{basic_example_str}\n\n{advanced_example_str}"
+    def _create_example_structure(self, tool_definition: 'ToolDefinition', mode: str) -> Dict:
+        """Helper to create a single OpenAI tool call example for a given mode."""
         tool_name = tool_definition.name
         arg_schema = tool_definition.argument_schema
         arguments = {}
         if arg_schema and arg_schema.parameters:
-            for param_def in arg_schema.parameters:
-                if param_def.required or param_def.default_value is not None:
-                    arguments[param_def.name] = self._generate_placeholder_value(param_def)
+            params_to_render = arg_schema.parameters
+            if mode == 'basic':
+                params_to_render = [p for p in arg_schema.parameters if p.required]
+            for param_def in params_to_render:
+                # Use the intelligent placeholder generator from the default formatter
+                arguments[param_def.name] = DefaultJsonExampleFormatter._generate_example_from_schema(
+                    param_def.object_schema or param_def.array_item_schema or param_def.param_type,
+                    param_def.object_schema or arg_schema,
+                    mode=mode
+                ) if param_def.object_schema or param_def.array_item_schema else self._generate_simple_placeholder(param_def)
         function_call = {
             "function": {
                 "name": tool_name,
-                "arguments": json.dumps(arguments),
+                # FIX: Keep arguments as a dictionary for clear examples in the prompt.
+                # Do NOT stringify it here.
+                "arguments": arguments,
             },
         }
         return {"tool": function_call}
-    def _generate_placeholder_value(self, param_def: ParameterDefinition) -> Any:
-        # REUSE a more intelligent generator for complex objects
-        if param_def.param_type == ParameterType.OBJECT and param_def.object_schema:
-            return DefaultJsonExampleFormatter._generate_example_from_schema(param_def.object_schema, param_def.object_schema)
+    def _schema_has_advanced_params(self, schema: Optional[ParameterSchema]) -> bool:
+        """Recursively checks if a schema or any of its sub-schemas have non-required parameters."""
+        if not schema: return False
+        for param in schema.parameters:
+            if not param.required: return True
+            if param.object_schema and self._schema_has_advanced_params(param.object_schema): return True
+            if isinstance(param.array_item_schema, ParameterSchema) and self._schema_has_advanced_params(param.array_item_schema): return True
+        return False
-        # Fallback for primitives
+    def _generate_simple_placeholder(self, param_def: ParameterDefinition) -> Any:
+        """Generates a simple placeholder for primitive types."""
         if param_def.default_value is not None: return param_def.default_value
-        if param_def.param_type == ParameterType.STRING: return f"example_{param_def.name}"
-        if param_def.param_type == ParameterType.INTEGER: return 123
-        if param_def.param_type == ParameterType.FLOAT: return 123.45
-        if param_def.param_type == ParameterType.BOOLEAN: return True
-        if param_def.param_type == ParameterType.ENUM: return param_def.enum_values[0] if param_def.enum_values else "enum_val"
-        if param_def.param_type == ParameterType.OBJECT: return {"key": "value"}
-        if param_def.param_type == ParameterType.ARRAY: return ["item1", "item2"]
-        return "placeholder"
+        return DefaultJsonExampleFormatter._generate_example_from_schema(param_def.param_type, param_def.param_type, mode='basic')

autobyteus/tools/usage/parsers/default_xml_tool_usage_parser.py CHANGED Viewed

@@ -1,126 +1,302 @@
-import xml.etree.ElementTree as ET
-import re
-import uuid
-import html
-from xml.sax.saxutils import escape
-import xml.parsers.expat
 import logging
+import re
 from typing import TYPE_CHECKING, Dict, Any, List
+from dataclasses import dataclass, field
 from autobyteus.agent.tool_invocation import ToolInvocation
 from .base_parser import BaseToolUsageParser
-from .exceptions import ToolUsageParseException
 if TYPE_CHECKING:
     from autobyteus.llm.utils.response_types import CompleteResponse
 logger = logging.getLogger(__name__)
+# A unique UUID to use as an internal key for storing text content.
+# This prevents any potential collision with user-provided argument names.
+_INTERNAL_TEXT_KEY_UUID = "4e1a3b1e-3b2a-4d3c-9a8b-2a1c2b3d4e5f"
+# --- Internal Arguments Parser with State Machine ---
+# This entire section is now encapsulated in its own class for clarity.
+class _XmlArgumentsParser:
+    """
+    A dedicated parser for the XML content within an <arguments> tag.
+    It encapsulates the state machine and all related logic, separating it
+    from the higher-level tool-finding logic.
+    """
+    # --- Nested State Machine Components ---
+    @dataclass
+    class _ParsingContext:
+        """Holds the shared state for the parsing process."""
+        parser: '_XmlArgumentsParser'
+        input_string: str
+        cursor: int = 0
+        stack: List[Any] = field(default_factory=list)
+        content_buffer: str = ""
+        def __post_init__(self):
+            self.stack.append({}) # Root of arguments is a dictionary
+        def is_eof(self) -> bool:
+            return self.cursor >= len(self.input_string)
+        def append_to_buffer(self, text: str):
+            self.content_buffer += text
+        def commit_content_buffer(self):
+            if self.content_buffer:
+                self.parser._commit_content(self.stack, self.content_buffer)
+                self.content_buffer = ""
+    class _ParserState:
+        """Abstract base class for a state in our parser's state machine."""
+        def handle(self, context: '_XmlArgumentsParser._ParsingContext') -> '_XmlArgumentsParser._ParserState':
+            raise NotImplementedError
+    class _ParsingContentState(_ParserState):
+        """Handles accumulation of character data between tags."""
+        def handle(self, context: '_XmlArgumentsParser._ParsingContext') -> '_XmlArgumentsParser._ParserState':
+            if context.is_eof():
+                return None
+            next_tag_start = context.input_string.find('<', context.cursor)
+            if next_tag_start == -1:
+                context.append_to_buffer(context.input_string[context.cursor:])
+                context.cursor = len(context.input_string)
+                return self
+            is_valid_tag = False
+            if next_tag_start + 1 < len(context.input_string):
+                next_char = context.input_string[next_tag_start + 1]
+                if next_char.isalpha() or next_char == '/':
+                    is_valid_tag = True
+            if is_valid_tag:
+                content_before_tag = context.input_string[context.cursor:next_tag_start]
+                context.append_to_buffer(content_before_tag)
+                context.commit_content_buffer()
+                context.cursor = next_tag_start
+                return self.parser._ParsingTagState(self.parser)
+            else:
+                content_with_char = context.input_string[context.cursor : next_tag_start + 1]
+                context.append_to_buffer(content_with_char)
+                context.cursor = next_tag_start + 1
+                return self
+        def __init__(self, parser: '_XmlArgumentsParser'):
+            self.parser = parser
+    class _ParsingTagState(_ParserState):
+        """Handles parsing of a tag, from '<' to '>'."""
+        def handle(self, context: '_XmlArgumentsParser._ParsingContext') -> '_XmlArgumentsParser._ParserState':
+            tag_content_end = context.input_string.find('>', context.cursor)
+            if tag_content_end == -1:
+                context.append_to_buffer(context.input_string[context.cursor:])
+                context.cursor = len(context.input_string)
+                return self.parser._ParsingContentState(self.parser)
+            tag_content = context.input_string[context.cursor + 1 : tag_content_end]
+            context.parser.process_tag(tag_content, context)
+            context.cursor = tag_content_end + 1
+            return self.parser._ParsingContentState(self.parser)
+        def __init__(self, parser: '_XmlArgumentsParser'):
+            self.parser = parser
+    # --- Parser Implementation ---
+    def __init__(self, xml_string: str):
+        self.xml_string = xml_string
+    def parse(self) -> Dict[str, Any]:
+        """Drives the state machine to parse the XML string."""
+        context = self._ParsingContext(parser=self, input_string=self.xml_string)
+        state = self._ParsingContentState(self)
+        while state and not context.is_eof():
+            state = state.handle(context)
+        context.commit_content_buffer()
+        final_args = context.stack[0]
+        self._cleanup_internal_keys(final_args)
+        return final_args
+    def process_tag(self, tag_content: str, context: '_ParsingContext'):
+        STRUCTURAL_TAGS = {'arg', 'item'}
+        stripped_content = tag_content.strip()
+        if not stripped_content:
+            context.append_to_buffer(f"<{tag_content}>")
+            return
+        is_closing = stripped_content.startswith('/')
+        tag_name = (stripped_content[1:] if is_closing else stripped_content).split(' ')[0]
+        if tag_name in STRUCTURAL_TAGS:
+            if is_closing:
+                self._handle_closing_tag(context.stack)
+            else:
+                self._handle_opening_tag(context.stack, tag_content)
+        else:
+            context.append_to_buffer(f"<{tag_content}>")
+    def _commit_content(self, stack: List[Any], content: str):
+        trimmed_content = content.strip()
+        if not trimmed_content and '<' not in content and '>' not in content:
+            return
+        top = stack[-1]
+        if isinstance(top, dict):
+            top[_INTERNAL_TEXT_KEY_UUID] = top.get(_INTERNAL_TEXT_KEY_UUID, '') + content
+    def _handle_opening_tag(self, stack: List[Any], tag_content: str):
+        parent = stack[-1]
+        if tag_content.strip().startswith('arg'):
+            name_match = re.search(r'name="([^"]+)"', tag_content)
+            if name_match and isinstance(parent, dict):
+                arg_name = name_match.group(1)
+                new_container = {}
+                parent[arg_name] = new_container
+                stack.append(new_container)
+        elif tag_content.strip().startswith('item'):
+            if isinstance(parent, dict):
+                grandparent = stack[-2]
+                parent_key = next((k for k, v in grandparent.items() if v is parent), None)
+                if parent_key:
+                    new_list = []
+                    grandparent[parent_key] = new_list
+                    stack[-1] = new_list
+                    parent = new_list
+            if isinstance(parent, list):
+                new_item_container = {}
+                parent.append(new_item_container)
+                stack.append(new_item_container)
+    def _handle_closing_tag(self, stack: List[Any]):
+        if len(stack) > 1:
+            top = stack.pop()
+            parent = stack[-1]
+            is_primitive = False
+            if isinstance(top, dict):
+                keys = top.keys()
+                if not keys or (len(keys) == 1 and _INTERNAL_TEXT_KEY_UUID in keys):
+                    is_primitive = True
+            if is_primitive:
+                value = top.get(_INTERNAL_TEXT_KEY_UUID, '')
+                if isinstance(parent, list):
+                    try:
+                        idx = parent.index(top)
+                        parent[idx] = value
+                    except ValueError:
+                        logger.warning("Could not find item to collapse in parent list.")
+                elif isinstance(parent, dict):
+                    parent_key = next((k for k, v in parent.items() if v is top), None)
+                    if parent_key:
+                        parent[parent_key] = value
+    def _cleanup_internal_keys(self, data: Any):
+        if isinstance(data, dict):
+            if _INTERNAL_TEXT_KEY_UUID in data and len(data) > 1:
+                del data[_INTERNAL_TEXT_KEY_UUID]
+            for value in data.values():
+                self._cleanup_internal_keys(value)
+        elif isinstance(data, list):
+            for item in data:
+                self._cleanup_internal_keys(item)
+# --- Main Parser Class ---
 class DefaultXmlToolUsageParser(BaseToolUsageParser):
     """
-    Parses LLM responses for tool usage commands formatted as XML using a robust,
-    stateful, character-by-character scanning approach. This parser can correctly
-    identify and extract valid <tool>...</tool> blocks even when they are mixed with
-    conversational text, malformed XML, or other noise.
+    Parses LLM responses for tool usage commands formatted as XML.
+    This class is responsible for finding <tool> blocks and delegating the
+    parsing of their arguments to the specialized _XmlArgumentsParser.
     """
     def get_name(self) -> str:
         return "default_xml_tool_usage_parser"
     def parse(self, response: 'CompleteResponse') -> List[ToolInvocation]:
         text = response.content
         invocations: List[ToolInvocation] = []
-        cursor = 0
-        while cursor < len(text):
-            # Find the start of the next potential tool tag from the current cursor position
-            tool_start_index = text.find('<tool', cursor)
-            if tool_start_index == -1:
-                break # No more tool tags in the rest of the string
-            # Find the end of that opening <tool ...> tag. This is a potential end.
-            tool_start_tag_end = text.find('>', tool_start_index)
-            if tool_start_tag_end == -1:
-                # Incomplete tag at the end of the file, break
+        i = 0
+        while i < len(text):
+            try:
+                i = text.index('<tool', i)
+            except ValueError:
                 break
-            # Check if another '<' appears before the '>', which would indicate a malformed/aborted tag.
-            # Example: <tool name="abc" ... <tool name="xyz">
-            next_opening_bracket = text.find('<', tool_start_index + 1)
-            if next_opening_bracket != -1 and next_opening_bracket < tool_start_tag_end:
-                # The tag was not closed properly before another one started.
-                # Advance the cursor to this new tag and restart the loop.
-                cursor = next_opening_bracket
-                continue
+            open_tag_end = text.find('>', i)
+            if open_tag_end == -1: break
-            # Find the corresponding </tool> closing tag
-            tool_end_index = text.find('</tool>', tool_start_tag_end)
-            if tool_end_index == -1:
-                # Found a start tag but no end tag, treat as fragment and advance
-                cursor = tool_start_tag_end + 1
+            open_tag_content = text[i:open_tag_end+1]
+            name_match = re.search(r'name="([^"]+)"', open_tag_content)
+            if not name_match:
+                i = open_tag_end + 1
                 continue
+            tool_name = name_match.group(1)
+            logger.debug(f"--- Found tool '{tool_name}' at index {i} ---")
-            # Extract the full content of this potential tool block
-            block_end_pos = tool_end_index + len('</tool>')
-            tool_block = text[tool_start_index:block_end_pos]
+            cursor = open_tag_end + 1
+            nesting_level = 1
+            content_end = -1
-            # CRITICAL NESTING CHECK:
-            # Check if there is another '<tool' start tag within this block.
-            # If so, it means this is a malformed, nested block. We must skip it
-            # and let the loop find the inner tag on the next iteration.
-            # This check is now more of a safeguard, as the logic above should handle most cases.
-            if '<tool' in tool_block[1:]:
-                # Advance cursor past the opening tag of this malformed block to continue scanning
-                cursor = tool_start_tag_end + 1
-                continue
+            while cursor < len(text):
+                next_open = text.find('<tool', cursor)
+                next_close = text.find('</tool>', cursor)
-            # This is a valid, non-nested block. Attempt to parse it.
-            try:
-                # Preprocessing and parsing
-                processed_block = self._preprocess_xml_for_parsing(tool_block)
-                root = ET.fromstring(processed_block)
-                tool_name = root.attrib.get("name")
-                if not tool_name:
-                    logger.warning(f"Skipping a <tool> block with no name attribute: {processed_block[:100]}")
+                if next_close == -1: break
+                if next_open != -1 and next_open < next_close:
+                    nesting_level += 1
+                    end_of_nested_open = text.find('>', next_open)
+                    if end_of_nested_open == -1: break
+                    cursor = end_of_nested_open + 1
                 else:
-                    arguments = self._parse_arguments_from_xml(root)
-                    tool_id_attr = root.attrib.get('id')
-                    invocation = ToolInvocation(
-                        name=tool_name,
-                        arguments=arguments,
-                        id=tool_id_attr
-                    )
-                    invocations.append(invocation)
-                    logger.info(f"Successfully parsed XML tool invocation for '{tool_name}'.")
-            except (ET.ParseError, xml.parsers.expat.ExpatError) as e:
-                # The self-contained block was still malformed. Log and ignore it.
-                logger.warning(f"Skipping malformed XML tool block: {e}")
+                    nesting_level -= 1
+                    if nesting_level == 0:
+                        content_end = next_close
+                        break
+                    cursor = next_close + len('</tool>')
+            if content_end == -1:
+                logger.warning(f"Malformed XML for tool '{tool_name}': could not find matching </tool> tag.")
+                i = open_tag_end + 1
+                continue
+            tool_content = text[open_tag_end+1:content_end]
+            args_match = re.search(r'<arguments>(.*)</arguments>', tool_content, re.DOTALL)
-            # CRITICAL: Advance cursor past the entire block we just processed
-            cursor = block_end_pos
+            arguments = {}
+            if args_match:
+                arguments_xml = args_match.group(1)
+                try:
+                    # Delegate parsing to the specialized class
+                    arguments = self._parse_arguments(arguments_xml)
+                except Exception as e:
+                    logger.error(f"Arguments parser failed for tool '{tool_name}': {e}", exc_info=True)
+            invocations.append(ToolInvocation(name=tool_name, arguments=arguments))
+            i = content_end + len('</tool>')
         return invocations
-    def _preprocess_xml_for_parsing(self, xml_content: str) -> str:
-        # This function remains the same as it's not part of the core logic error.
-        # It's a helper for cleaning up minor syntax issues before parsing.
-        return xml_content
-    def _parse_arguments_from_xml(self, command_element: ET.Element) -> Dict[str, Any]:
-        """Helper to extract arguments from a parsed <tool> element."""
-        arguments: Dict[str, Any] = {}
-        arguments_container = command_element.find('arguments')
-        if arguments_container is None:
-            return arguments
-        for arg_element in arguments_container.findall('arg'):
-            arg_name = arg_element.attrib.get('name')
-            if arg_name:
-                # Use .text to get only the direct text content of the tag.
-                # This is safer than itertext() if the LLM hallucinates nested tags.
-                # The XML parser already handles unescaping of standard entities.
-                raw_text = arg_element.text or ""
-                arguments[arg_name] = raw_text
-        return arguments
+    def _parse_arguments(self, xml_string: str) -> Dict[str, Any]:
+        """
+        Delegates parsing of an arguments XML string to the dedicated parser class.
+        """
+        parser = _XmlArgumentsParser(xml_string)
+        return parser.parse()

autobyteus/tools/usage/parsers/provider_aware_tool_usage_parser.py CHANGED Viewed

@@ -44,8 +44,11 @@ class ProviderAwareToolUsageParser:
         else:
             logger.warning(f"Agent '{context.agent_id}': LLM instance or model not available. Cannot determine provider for tool response parsing.")
-        # Get the correct parser directly from the new central registry.
-        parser = self._parser_registry.get_parser(llm_provider)
+        # Retrieve the override flag from the agent's configuration.
+        use_xml_tool_format = context.config.use_xml_tool_format
+        # Get the correct parser from the registry, passing the override flag.
+        parser = self._parser_registry.get_parser(llm_provider, use_xml_tool_format=use_xml_tool_format)
         logger.debug(f"ProviderAwareToolUsageParser selected delegate parser '{parser.get_name()}' for LLM provider '{llm_provider.name if llm_provider else 'Unknown'}'.")

autobyteus 1.1.5__py3-none-any.whl → 1.1.7__py3-none-any.whl

autobyteus 1.1.5__py3-none-any.whl → 1.1.7__py3-none-any.whl