PyPI - autobyteus - Versions diffs - 1.1.6__py3-none-any.whl → 1.1.7__py3-none-any.whl - Mend

autobyteus 1.1.6__py3-none-any.whl → 1.1.7__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (43) hide show

autobyteus/agent/context/agent_runtime_state.py +7 -1
autobyteus/agent/handlers/tool_result_event_handler.py +100 -88
autobyteus/agent/llm_response_processor/provider_aware_tool_usage_processor.py +7 -1
autobyteus/agent/tool_invocation.py +25 -1
autobyteus/agent_team/agent_team_builder.py +22 -1
autobyteus/agent_team/context/agent_team_runtime_state.py +0 -2
autobyteus/llm/llm_factory.py +25 -57
autobyteus/llm/ollama_provider_resolver.py +1 -0
autobyteus/llm/providers.py +1 -0
autobyteus/llm/token_counter/token_counter_factory.py +2 -0
autobyteus/multimedia/audio/audio_model.py +2 -1
autobyteus/multimedia/image/image_model.py +2 -1
autobyteus/task_management/tools/publish_task_plan.py +4 -16
autobyteus/task_management/tools/update_task_status.py +4 -19
autobyteus/tools/__init__.py +2 -4
autobyteus/tools/base_tool.py +98 -29
autobyteus/tools/browser/standalone/__init__.py +0 -1
autobyteus/tools/google_search.py +149 -0
autobyteus/tools/mcp/schema_mapper.py +29 -71
autobyteus/tools/multimedia/audio_tools.py +3 -3
autobyteus/tools/multimedia/image_tools.py +5 -5
autobyteus/tools/parameter_schema.py +82 -89
autobyteus/tools/pydantic_schema_converter.py +81 -0
autobyteus/tools/usage/formatters/default_json_example_formatter.py +89 -20
autobyteus/tools/usage/formatters/default_xml_example_formatter.py +115 -41
autobyteus/tools/usage/formatters/default_xml_schema_formatter.py +50 -20
autobyteus/tools/usage/formatters/gemini_json_example_formatter.py +55 -22
autobyteus/tools/usage/formatters/google_json_example_formatter.py +54 -21
autobyteus/tools/usage/formatters/openai_json_example_formatter.py +53 -23
autobyteus/tools/usage/parsers/default_xml_tool_usage_parser.py +270 -94
autobyteus/tools/usage/providers/tool_manifest_provider.py +39 -14
autobyteus-1.1.7.dist-info/METADATA +204 -0
{autobyteus-1.1.6.dist-info → autobyteus-1.1.7.dist-info}/RECORD +39 -40
examples/run_google_slides_agent.py +2 -2
examples/run_mcp_google_slides_client.py +1 -1
examples/run_sqlite_agent.py +1 -1
autobyteus/tools/ask_user_input.py +0 -40
autobyteus/tools/browser/standalone/factory/google_search_factory.py +0 -25
autobyteus/tools/browser/standalone/google_search_ui.py +0 -126
autobyteus-1.1.6.dist-info/METADATA +0 -161
{autobyteus-1.1.6.dist-info → autobyteus-1.1.7.dist-info}/WHEEL +0 -0
{autobyteus-1.1.6.dist-info → autobyteus-1.1.7.dist-info}/licenses/LICENSE +0 -0
{autobyteus-1.1.6.dist-info → autobyteus-1.1.7.dist-info}/top_level.txt +0 -0

autobyteus/tools/usage/parsers/default_xml_tool_usage_parser.py CHANGED Viewed

@@ -1,126 +1,302 @@
-import xml.etree.ElementTree as ET
-import re
-import uuid
-import html
-from xml.sax.saxutils import escape
-import xml.parsers.expat
 import logging
+import re
 from typing import TYPE_CHECKING, Dict, Any, List
+from dataclasses import dataclass, field
 from autobyteus.agent.tool_invocation import ToolInvocation
 from .base_parser import BaseToolUsageParser
-from .exceptions import ToolUsageParseException
 if TYPE_CHECKING:
     from autobyteus.llm.utils.response_types import CompleteResponse
 logger = logging.getLogger(__name__)
+# A unique UUID to use as an internal key for storing text content.
+# This prevents any potential collision with user-provided argument names.
+_INTERNAL_TEXT_KEY_UUID = "4e1a3b1e-3b2a-4d3c-9a8b-2a1c2b3d4e5f"
+# --- Internal Arguments Parser with State Machine ---
+# This entire section is now encapsulated in its own class for clarity.
+class _XmlArgumentsParser:
+    """
+    A dedicated parser for the XML content within an <arguments> tag.
+    It encapsulates the state machine and all related logic, separating it
+    from the higher-level tool-finding logic.
+    """
+    # --- Nested State Machine Components ---
+    @dataclass
+    class _ParsingContext:
+        """Holds the shared state for the parsing process."""
+        parser: '_XmlArgumentsParser'
+        input_string: str
+        cursor: int = 0
+        stack: List[Any] = field(default_factory=list)
+        content_buffer: str = ""
+        def __post_init__(self):
+            self.stack.append({}) # Root of arguments is a dictionary
+        def is_eof(self) -> bool:
+            return self.cursor >= len(self.input_string)
+        def append_to_buffer(self, text: str):
+            self.content_buffer += text
+        def commit_content_buffer(self):
+            if self.content_buffer:
+                self.parser._commit_content(self.stack, self.content_buffer)
+                self.content_buffer = ""
+    class _ParserState:
+        """Abstract base class for a state in our parser's state machine."""
+        def handle(self, context: '_XmlArgumentsParser._ParsingContext') -> '_XmlArgumentsParser._ParserState':
+            raise NotImplementedError
+    class _ParsingContentState(_ParserState):
+        """Handles accumulation of character data between tags."""
+        def handle(self, context: '_XmlArgumentsParser._ParsingContext') -> '_XmlArgumentsParser._ParserState':
+            if context.is_eof():
+                return None
+            next_tag_start = context.input_string.find('<', context.cursor)
+            if next_tag_start == -1:
+                context.append_to_buffer(context.input_string[context.cursor:])
+                context.cursor = len(context.input_string)
+                return self
+            is_valid_tag = False
+            if next_tag_start + 1 < len(context.input_string):
+                next_char = context.input_string[next_tag_start + 1]
+                if next_char.isalpha() or next_char == '/':
+                    is_valid_tag = True
+            if is_valid_tag:
+                content_before_tag = context.input_string[context.cursor:next_tag_start]
+                context.append_to_buffer(content_before_tag)
+                context.commit_content_buffer()
+                context.cursor = next_tag_start
+                return self.parser._ParsingTagState(self.parser)
+            else:
+                content_with_char = context.input_string[context.cursor : next_tag_start + 1]
+                context.append_to_buffer(content_with_char)
+                context.cursor = next_tag_start + 1
+                return self
+        def __init__(self, parser: '_XmlArgumentsParser'):
+            self.parser = parser
+    class _ParsingTagState(_ParserState):
+        """Handles parsing of a tag, from '<' to '>'."""
+        def handle(self, context: '_XmlArgumentsParser._ParsingContext') -> '_XmlArgumentsParser._ParserState':
+            tag_content_end = context.input_string.find('>', context.cursor)
+            if tag_content_end == -1:
+                context.append_to_buffer(context.input_string[context.cursor:])
+                context.cursor = len(context.input_string)
+                return self.parser._ParsingContentState(self.parser)
+            tag_content = context.input_string[context.cursor + 1 : tag_content_end]
+            context.parser.process_tag(tag_content, context)
+            context.cursor = tag_content_end + 1
+            return self.parser._ParsingContentState(self.parser)
+        def __init__(self, parser: '_XmlArgumentsParser'):
+            self.parser = parser
+    # --- Parser Implementation ---
+    def __init__(self, xml_string: str):
+        self.xml_string = xml_string
+    def parse(self) -> Dict[str, Any]:
+        """Drives the state machine to parse the XML string."""
+        context = self._ParsingContext(parser=self, input_string=self.xml_string)
+        state = self._ParsingContentState(self)
+        while state and not context.is_eof():
+            state = state.handle(context)
+        context.commit_content_buffer()
+        final_args = context.stack[0]
+        self._cleanup_internal_keys(final_args)
+        return final_args
+    def process_tag(self, tag_content: str, context: '_ParsingContext'):
+        STRUCTURAL_TAGS = {'arg', 'item'}
+        stripped_content = tag_content.strip()
+        if not stripped_content:
+            context.append_to_buffer(f"<{tag_content}>")
+            return
+        is_closing = stripped_content.startswith('/')
+        tag_name = (stripped_content[1:] if is_closing else stripped_content).split(' ')[0]
+        if tag_name in STRUCTURAL_TAGS:
+            if is_closing:
+                self._handle_closing_tag(context.stack)
+            else:
+                self._handle_opening_tag(context.stack, tag_content)
+        else:
+            context.append_to_buffer(f"<{tag_content}>")
+    def _commit_content(self, stack: List[Any], content: str):
+        trimmed_content = content.strip()
+        if not trimmed_content and '<' not in content and '>' not in content:
+            return
+        top = stack[-1]
+        if isinstance(top, dict):
+            top[_INTERNAL_TEXT_KEY_UUID] = top.get(_INTERNAL_TEXT_KEY_UUID, '') + content
+    def _handle_opening_tag(self, stack: List[Any], tag_content: str):
+        parent = stack[-1]
+        if tag_content.strip().startswith('arg'):
+            name_match = re.search(r'name="([^"]+)"', tag_content)
+            if name_match and isinstance(parent, dict):
+                arg_name = name_match.group(1)
+                new_container = {}
+                parent[arg_name] = new_container
+                stack.append(new_container)
+        elif tag_content.strip().startswith('item'):
+            if isinstance(parent, dict):
+                grandparent = stack[-2]
+                parent_key = next((k for k, v in grandparent.items() if v is parent), None)
+                if parent_key:
+                    new_list = []
+                    grandparent[parent_key] = new_list
+                    stack[-1] = new_list
+                    parent = new_list
+            if isinstance(parent, list):
+                new_item_container = {}
+                parent.append(new_item_container)
+                stack.append(new_item_container)
+    def _handle_closing_tag(self, stack: List[Any]):
+        if len(stack) > 1:
+            top = stack.pop()
+            parent = stack[-1]
+            is_primitive = False
+            if isinstance(top, dict):
+                keys = top.keys()
+                if not keys or (len(keys) == 1 and _INTERNAL_TEXT_KEY_UUID in keys):
+                    is_primitive = True
+            if is_primitive:
+                value = top.get(_INTERNAL_TEXT_KEY_UUID, '')
+                if isinstance(parent, list):
+                    try:
+                        idx = parent.index(top)
+                        parent[idx] = value
+                    except ValueError:
+                        logger.warning("Could not find item to collapse in parent list.")
+                elif isinstance(parent, dict):
+                    parent_key = next((k for k, v in parent.items() if v is top), None)
+                    if parent_key:
+                        parent[parent_key] = value
+    def _cleanup_internal_keys(self, data: Any):
+        if isinstance(data, dict):
+            if _INTERNAL_TEXT_KEY_UUID in data and len(data) > 1:
+                del data[_INTERNAL_TEXT_KEY_UUID]
+            for value in data.values():
+                self._cleanup_internal_keys(value)
+        elif isinstance(data, list):
+            for item in data:
+                self._cleanup_internal_keys(item)
+# --- Main Parser Class ---
 class DefaultXmlToolUsageParser(BaseToolUsageParser):
     """
-    Parses LLM responses for tool usage commands formatted as XML using a robust,
-    stateful, character-by-character scanning approach. This parser can correctly
-    identify and extract valid <tool>...</tool> blocks even when they are mixed with
-    conversational text, malformed XML, or other noise.
+    Parses LLM responses for tool usage commands formatted as XML.
+    This class is responsible for finding <tool> blocks and delegating the
+    parsing of their arguments to the specialized _XmlArgumentsParser.
     """
     def get_name(self) -> str:
         return "default_xml_tool_usage_parser"
     def parse(self, response: 'CompleteResponse') -> List[ToolInvocation]:
         text = response.content
         invocations: List[ToolInvocation] = []
-        cursor = 0
-        while cursor < len(text):
-            # Find the start of the next potential tool tag from the current cursor position
-            tool_start_index = text.find('<tool', cursor)
-            if tool_start_index == -1:
-                break # No more tool tags in the rest of the string
-            # Find the end of that opening <tool ...> tag. This is a potential end.
-            tool_start_tag_end = text.find('>', tool_start_index)
-            if tool_start_tag_end == -1:
-                # Incomplete tag at the end of the file, break
+        i = 0
+        while i < len(text):
+            try:
+                i = text.index('<tool', i)
+            except ValueError:
                 break
-            # Check if another '<' appears before the '>', which would indicate a malformed/aborted tag.
-            # Example: <tool name="abc" ... <tool name="xyz">
-            next_opening_bracket = text.find('<', tool_start_index + 1)
-            if next_opening_bracket != -1 and next_opening_bracket < tool_start_tag_end:
-                # The tag was not closed properly before another one started.
-                # Advance the cursor to this new tag and restart the loop.
-                cursor = next_opening_bracket
-                continue
+            open_tag_end = text.find('>', i)
+            if open_tag_end == -1: break
-            # Find the corresponding </tool> closing tag
-            tool_end_index = text.find('</tool>', tool_start_tag_end)
-            if tool_end_index == -1:
-                # Found a start tag but no end tag, treat as fragment and advance
-                cursor = tool_start_tag_end + 1
+            open_tag_content = text[i:open_tag_end+1]
+            name_match = re.search(r'name="([^"]+)"', open_tag_content)
+            if not name_match:
+                i = open_tag_end + 1
                 continue
+            tool_name = name_match.group(1)
+            logger.debug(f"--- Found tool '{tool_name}' at index {i} ---")
-            # Extract the full content of this potential tool block
-            block_end_pos = tool_end_index + len('</tool>')
-            tool_block = text[tool_start_index:block_end_pos]
+            cursor = open_tag_end + 1
+            nesting_level = 1
+            content_end = -1
-            # CRITICAL NESTING CHECK:
-            # Check if there is another '<tool' start tag within this block.
-            # If so, it means this is a malformed, nested block. We must skip it
-            # and let the loop find the inner tag on the next iteration.
-            # This check is now more of a safeguard, as the logic above should handle most cases.
-            if '<tool' in tool_block[1:]:
-                # Advance cursor past the opening tag of this malformed block to continue scanning
-                cursor = tool_start_tag_end + 1
-                continue
+            while cursor < len(text):
+                next_open = text.find('<tool', cursor)
+                next_close = text.find('</tool>', cursor)
-            # This is a valid, non-nested block. Attempt to parse it.
-            try:
-                # Preprocessing and parsing
-                processed_block = self._preprocess_xml_for_parsing(tool_block)
-                root = ET.fromstring(processed_block)
-                tool_name = root.attrib.get("name")
-                if not tool_name:
-                    logger.warning(f"Skipping a <tool> block with no name attribute: {processed_block[:100]}")
+                if next_close == -1: break
+                if next_open != -1 and next_open < next_close:
+                    nesting_level += 1
+                    end_of_nested_open = text.find('>', next_open)
+                    if end_of_nested_open == -1: break
+                    cursor = end_of_nested_open + 1
                 else:
-                    arguments = self._parse_arguments_from_xml(root)
-                    tool_id_attr = root.attrib.get('id')
-                    invocation = ToolInvocation(
-                        name=tool_name,
-                        arguments=arguments,
-                        id=tool_id_attr
-                    )
-                    invocations.append(invocation)
-                    logger.info(f"Successfully parsed XML tool invocation for '{tool_name}'.")
-            except (ET.ParseError, xml.parsers.expat.ExpatError) as e:
-                # The self-contained block was still malformed. Log and ignore it.
-                logger.warning(f"Skipping malformed XML tool block: {e}")
+                    nesting_level -= 1
+                    if nesting_level == 0:
+                        content_end = next_close
+                        break
+                    cursor = next_close + len('</tool>')
+            if content_end == -1:
+                logger.warning(f"Malformed XML for tool '{tool_name}': could not find matching </tool> tag.")
+                i = open_tag_end + 1
+                continue
+            tool_content = text[open_tag_end+1:content_end]
+            args_match = re.search(r'<arguments>(.*)</arguments>', tool_content, re.DOTALL)
-            # CRITICAL: Advance cursor past the entire block we just processed
-            cursor = block_end_pos
+            arguments = {}
+            if args_match:
+                arguments_xml = args_match.group(1)
+                try:
+                    # Delegate parsing to the specialized class
+                    arguments = self._parse_arguments(arguments_xml)
+                except Exception as e:
+                    logger.error(f"Arguments parser failed for tool '{tool_name}': {e}", exc_info=True)
+            invocations.append(ToolInvocation(name=tool_name, arguments=arguments))
+            i = content_end + len('</tool>')
         return invocations
-    def _preprocess_xml_for_parsing(self, xml_content: str) -> str:
-        # This function remains the same as it's not part of the core logic error.
-        # It's a helper for cleaning up minor syntax issues before parsing.
-        return xml_content
-    def _parse_arguments_from_xml(self, command_element: ET.Element) -> Dict[str, Any]:
-        """Helper to extract arguments from a parsed <tool> element."""
-        arguments: Dict[str, Any] = {}
-        arguments_container = command_element.find('arguments')
-        if arguments_container is None:
-            return arguments
-        for arg_element in arguments_container.findall('arg'):
-            arg_name = arg_element.attrib.get('name')
-            if arg_name:
-                # Use .text to get only the direct text content of the tag.
-                # This is safer than itertext() if the LLM hallucinates nested tags.
-                # The XML parser already handles unescaping of standard entities.
-                raw_text = arg_element.text or ""
-                arguments[arg_name] = raw_text
-        return arguments
+    def _parse_arguments(self, xml_string: str) -> Dict[str, Any]:
+        """
+        Delegates parsing of an arguments XML string to the dedicated parser class.
+        """
+        parser = _XmlArgumentsParser(xml_string)
+        return parser.parse()

autobyteus/tools/usage/providers/tool_manifest_provider.py CHANGED Viewed

@@ -16,14 +16,36 @@ class ToolManifestProvider:
     """
     Generates a complete tool manifest string, which includes the schema
     and an example for each provided tool. This is suitable for injection
     into a system prompt. It uses the central ToolFormattingRegistry to get
     the correct formatters for the specified provider.
     """
-    SCHEMA_HEADER = "## Tool Definition:"
-    EXAMPLE_HEADER = "## Example Usage:"
-    # UPDATED: Changed the header to be more descriptive as requested.
+    # --- XML Specific Headers and Guidelines ---
+    XML_SCHEMA_HEADER = "## Tool Definition:"
+    XML_EXAMPLE_HEADER = "## Tool Usage Examples and Guidelines:"
+    XML_GENERAL_GUIDELINES = (
+        "To use this tool, you must construct an XML block exactly like the examples below. "
+        "Ensure all tags are correctly named and nested. Pay close attention to how arguments, "
+        "especially complex ones like lists and objects, are formatted."
+    )
+    XML_ARRAY_GUIDELINES = (
+        "Formatting Lists/Arrays: For any argument that is a list (an array), you MUST wrap each "
+        "individual value in its own `<item>` tag. Do not use comma-separated strings or JSON-style `[...]` arrays within a single tag.\n\n"
+        "Correct:\n"
+        '<arg name="dependencies">\n'
+        '    <item>task_1</item>\n'
+        '    <item>task_2</item>\n'
+        '</arg>\n\n'
+        "Incorrect:\n"
+        '<arg name="dependencies">[task_1, task_2]</arg>\n'
+        '<arg name="dependencies">task_1, task_2</arg>'
+    )
+    # --- JSON Specific Headers ---
+    JSON_SCHEMA_HEADER = "## Tool Definition:"
     JSON_EXAMPLE_HEADER = "Example: To use this tool, you could provide the following JSON object as a tool call:"
     def __init__(self):
         self._formatting_registry = ToolFormattingRegistry()
         logger.debug("ToolManifestProvider initialized.")
@@ -45,33 +67,36 @@ class ToolManifestProvider:
         """
         tool_blocks = []
-        # Get the correct formatting pair from the registry, passing the override flag.
         formatter_pair = self._formatting_registry.get_formatter_pair(provider, use_xml_tool_format=use_xml_tool_format)
         schema_formatter = formatter_pair.schema_formatter
         example_formatter = formatter_pair.example_formatter
-        # Determine if the chosen formatter is XML-based. This determines the final assembly format.
         is_xml_format = isinstance(schema_formatter, DefaultXmlSchemaFormatter)
         for td in tool_definitions:
             try:
                 schema = schema_formatter.provide(td)
-                example = example_formatter.provide(td)
+                example = example_formatter.provide(td) # This is now a pre-formatted string for both XML and JSON
                 if schema and example:
                     if is_xml_format:
-                        tool_blocks.append(f"{self.SCHEMA_HEADER}\n{schema}\n\n{self.EXAMPLE_HEADER}\n{example}")
-                    else:  # JSON format
-                        # UPDATED: Removed the redundant {"tool": schema} wrapper.
+                        tool_blocks.append(f"{self.XML_SCHEMA_HEADER}\n{schema}\n\n{self.XML_EXAMPLE_HEADER}\n{example}")
+                    else:
+                        # For JSON, the schema is a dict, but the example is now a pre-formatted string.
                         schema_str = json.dumps(schema, indent=2)
-                        example_str = json.dumps(example, indent=2)
-                        tool_blocks.append(f"{self.SCHEMA_HEADER}\n{schema_str}\n\n{self.JSON_EXAMPLE_HEADER}\n{example_str}")
+                        # FIX: Do NOT call json.dumps() on the 'example' variable, as it is already a string.
+                        tool_blocks.append(f"{self.JSON_SCHEMA_HEADER}\n{schema_str}\n\n{self.JSON_EXAMPLE_HEADER}\n{example}")
                 else:
                     logger.warning(f"Could not generate schema or example for tool '{td.name}' using format {'XML' if is_xml_format else 'JSON'}.")
             except Exception as e:
                 logger.error(f"Failed to generate manifest block for tool '{td.name}': {e}", exc_info=True)
-        # UPDATED: Unify the return for all formats to provide a consistent structure
-        # without the incorrect '[]' wrapper for JSON.
-        return "\n\n---\n\n".join(tool_blocks)
+        # Assemble the final manifest string
+        manifest_content = "\n\n---\n\n".join(tool_blocks)
+        if is_xml_format and manifest_content:
+            # Prepend the general guidelines for XML format
+            return f"{self.XML_GENERAL_GUIDELINES}\n\n{self.XML_ARRAY_GUIDELINES}\n\n---\n\n{manifest_content}"
+        return manifest_content

autobyteus 1.1.6__py3-none-any.whl → 1.1.7__py3-none-any.whl

autobyteus 1.1.6__py3-none-any.whl → 1.1.7__py3-none-any.whl