chuk-tool-processor 0.1.6__py3-none-any.whl → 0.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

This version of chuk-tool-processor has been flagged as potentially problematic.

Files changed (46)
  1. chuk_tool_processor/core/processor.py +345 -132
  2. chuk_tool_processor/execution/strategies/inprocess_strategy.py +522 -71
  3. chuk_tool_processor/execution/strategies/subprocess_strategy.py +559 -64
  4. chuk_tool_processor/execution/tool_executor.py +282 -24
  5. chuk_tool_processor/execution/wrappers/caching.py +465 -123
  6. chuk_tool_processor/execution/wrappers/rate_limiting.py +199 -86
  7. chuk_tool_processor/execution/wrappers/retry.py +133 -23
  8. chuk_tool_processor/logging/__init__.py +83 -10
  9. chuk_tool_processor/logging/context.py +218 -22
  10. chuk_tool_processor/logging/formatter.py +56 -13
  11. chuk_tool_processor/logging/helpers.py +91 -16
  12. chuk_tool_processor/logging/metrics.py +75 -6
  13. chuk_tool_processor/mcp/mcp_tool.py +80 -35
  14. chuk_tool_processor/mcp/register_mcp_tools.py +74 -56
  15. chuk_tool_processor/mcp/setup_mcp_sse.py +41 -36
  16. chuk_tool_processor/mcp/setup_mcp_stdio.py +39 -37
  17. chuk_tool_processor/mcp/transport/sse_transport.py +351 -105
  18. chuk_tool_processor/models/execution_strategy.py +52 -3
  19. chuk_tool_processor/models/streaming_tool.py +110 -0
  20. chuk_tool_processor/models/tool_call.py +56 -4
  21. chuk_tool_processor/models/tool_result.py +115 -9
  22. chuk_tool_processor/models/validated_tool.py +15 -13
  23. chuk_tool_processor/plugins/discovery.py +115 -70
  24. chuk_tool_processor/plugins/parsers/base.py +13 -5
  25. chuk_tool_processor/plugins/parsers/{function_call_tool_plugin.py → function_call_tool.py} +39 -20
  26. chuk_tool_processor/plugins/parsers/json_tool.py +50 -0
  27. chuk_tool_processor/plugins/parsers/openai_tool.py +88 -0
  28. chuk_tool_processor/plugins/parsers/xml_tool.py +74 -20
  29. chuk_tool_processor/registry/__init__.py +46 -7
  30. chuk_tool_processor/registry/auto_register.py +92 -28
  31. chuk_tool_processor/registry/decorators.py +134 -11
  32. chuk_tool_processor/registry/interface.py +48 -14
  33. chuk_tool_processor/registry/metadata.py +52 -6
  34. chuk_tool_processor/registry/provider.py +75 -36
  35. chuk_tool_processor/registry/providers/__init__.py +49 -10
  36. chuk_tool_processor/registry/providers/memory.py +59 -48
  37. chuk_tool_processor/registry/tool_export.py +208 -39
  38. chuk_tool_processor/utils/validation.py +18 -13
  39. chuk_tool_processor-0.2.dist-info/METADATA +401 -0
  40. chuk_tool_processor-0.2.dist-info/RECORD +58 -0
  41. {chuk_tool_processor-0.1.6.dist-info → chuk_tool_processor-0.2.dist-info}/WHEEL +1 -1
  42. chuk_tool_processor/plugins/parsers/json_tool_plugin.py +0 -38
  43. chuk_tool_processor/plugins/parsers/openai_tool_plugin.py +0 -76
  44. chuk_tool_processor-0.1.6.dist-info/METADATA +0 -462
  45. chuk_tool_processor-0.1.6.dist-info/RECORD +0 -57
  46. {chuk_tool_processor-0.1.6.dist-info → chuk_tool_processor-0.2.dist-info}/top_level.txt +0 -0
@@ -1,15 +1,23 @@
 # chuk_tool_processor/core/processor.py
+"""
+Async-native core processor for tool execution.
+
+This module provides the central ToolProcessor class which handles:
+- Tool call parsing from various input formats
+- Tool execution using configurable strategies
+- Application of execution wrappers (caching, retries, etc.)
+"""
+from __future__ import annotations
+
 import asyncio
 import time
 import json
 import hashlib
-from typing import Any, Dict, List, Optional, Type, Union
+from typing import Any, Dict, List, Optional, Type, Union, Set
 
-# imports
 from chuk_tool_processor.models.tool_call import ToolCall
 from chuk_tool_processor.models.tool_result import ToolResult
 from chuk_tool_processor.registry import ToolRegistryInterface, ToolRegistryProvider
-from chuk_tool_processor.execution.tool_executor import ToolExecutor
 from chuk_tool_processor.execution.strategies.inprocess_strategy import InProcessStrategy
 from chuk_tool_processor.execution.wrappers.caching import CacheInterface, InMemoryCache, CachingToolExecutor
 from chuk_tool_processor.execution.wrappers.rate_limiting import RateLimiter, RateLimitedToolExecutor
@@ -21,12 +29,13 @@ from chuk_tool_processor.logging import get_logger, log_context_span, request_logging
 class ToolProcessor:
     """
     Main class for processing tool calls from LLM responses.
-    Combines parsing, execution, and result handling.
+    Combines parsing, execution, and result handling with full async support.
     """
 
     def __init__(
         self,
         registry: Optional[ToolRegistryInterface] = None,
+        strategy = None,
         default_timeout: float = 10.0,
         max_concurrency: Optional[int] = None,
         enable_caching: bool = True,
@@ -43,6 +52,7 @@ class ToolProcessor:
 
         Args:
             registry: Tool registry to use. If None, uses the global registry.
+            strategy: Optional execution strategy (default: InProcessStrategy)
             default_timeout: Default timeout for tool execution in seconds.
             max_concurrency: Maximum number of concurrent tool executions.
             enable_caching: Whether to enable result caching.
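Editor's note: the new `strategy` keyword lets a caller inject the execution backend instead of always receiving an `InProcessStrategy`. A minimal usage sketch, assuming an async entry point and a hypothetical already-registered tool named "echo"; only the `strategy` keyword and the constructor arguments shown in this diff are confirmed:

```python
import asyncio

from chuk_tool_processor.core.processor import ToolProcessor
from chuk_tool_processor.execution.strategies.inprocess_strategy import InProcessStrategy
from chuk_tool_processor.models.tool_call import ToolCall
from chuk_tool_processor.registry import ToolRegistryProvider

async def main() -> None:
    # The 0.2 registry accessor is async (see the initialize() hunk below).
    registry = await ToolRegistryProvider.get_registry()

    # Inject an explicitly configured strategy instead of the one
    # that initialize() would otherwise build by default.
    strategy = InProcessStrategy(
        registry=registry,
        default_timeout=5.0,
        max_concurrency=4,
    )
    processor = ToolProcessor(registry=registry, strategy=strategy)

    # "echo" is a hypothetical tool assumed to be registered already.
    results = await processor.execute([ToolCall(tool="echo", arguments={"msg": "hi"})])
    print(results)

asyncio.run(main())
```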
@@ -56,121 +66,211 @@ class ToolProcessor:
                 If None, uses all available parsers.
         """
         self.logger = get_logger("chuk_tool_processor.processor")
-
-        # Use provided registry or global registry
-        self.registry = registry or ToolRegistryProvider.get_registry()
-
-        # Create base executor with in-process strategy
-        self.strategy = InProcessStrategy(
-            registry=self.registry,
-            default_timeout=default_timeout,
-            max_concurrency=max_concurrency,
-        )
-
-        self.executor = ToolExecutor(
-            registry=self.registry,
-            default_timeout=default_timeout,
-            strategy=self.strategy,
-        )
-
-        # Apply optional wrappers
-        if enable_retries:
-            self.logger.debug("Enabling retry logic")
-            self.executor = RetryableToolExecutor(
-                executor=self.executor,
-                default_config=RetryConfig(max_retries=max_retries),
-            )
-
-        if enable_rate_limiting:
-            self.logger.debug("Enabling rate limiting")
-            rate_limiter = RateLimiter(
-                global_limit=global_rate_limit,
-                tool_limits=tool_rate_limits,
-            )
-            self.executor = RateLimitedToolExecutor(
-                executor=self.executor,
-                rate_limiter=rate_limiter,
-            )
-
-        if enable_caching:
-            self.logger.debug("Enabling result caching")
-            cache = InMemoryCache(default_ttl=cache_ttl)
-            self.executor = CachingToolExecutor(
-                executor=self.executor,
-                cache=cache,
-                default_ttl=cache_ttl,
-            )
-
-        # Discover plugins if not already done
-        if not plugin_registry.list_plugins().get("parser", []):
-            discover_default_plugins()
-
-        # Get parser plugins
-        if parser_plugins:
-            self.parsers = [
-                plugin_registry.get_plugin("parser", name)
-                for name in parser_plugins
-                if plugin_registry.get_plugin("parser", name)
-            ]
-        else:
-            parser_names = plugin_registry.list_plugins().get("parser", [])
-            self.parsers = [
-                plugin_registry.get_plugin("parser", name) for name in parser_names
-            ]
-
-        self.logger.debug(f"Initialized with {len(self.parsers)} parser plugins")
-
-    async def process_text(
+
+        # Store initialization parameters for lazy initialization
+        self._registry = registry
+        self._strategy = strategy
+        self.default_timeout = default_timeout
+        self.max_concurrency = max_concurrency
+        self.enable_caching = enable_caching
+        self.cache_ttl = cache_ttl
+        self.enable_rate_limiting = enable_rate_limiting
+        self.global_rate_limit = global_rate_limit
+        self.tool_rate_limits = tool_rate_limits
+        self.enable_retries = enable_retries
+        self.max_retries = max_retries
+        self.parser_plugin_names = parser_plugins
+
+        # Placeholder for initialized components
+        self.registry = None
+        self.strategy = None
+        self.executor = None
+        self.parsers = []
+
+        # Flag for tracking initialization state
+        self._initialized = False
+        self._init_lock = asyncio.Lock()
+
+    async def initialize(self) -> None:
+        """
+        Initialize the processor asynchronously.
+
+        This method ensures all components are properly initialized before use.
+        It is called automatically by other methods if needed.
+        """
+        # Fast path if already initialized
+        if self._initialized:
+            return
+
+        # Ensure only one initialization happens at a time
+        async with self._init_lock:
+            # Double-check pattern after acquiring lock
+            if self._initialized:
+                return
+
+            self.logger.debug("Initializing tool processor")
+
+            # Get the registry
+            if self._registry is not None:
+                self.registry = self._registry
+            else:
+                self.registry = await ToolRegistryProvider.get_registry()
+
+            # Create execution strategy if needed
+            if self._strategy is not None:
+                self.strategy = self._strategy
+            else:
+                self.strategy = InProcessStrategy(
+                    registry=self.registry,
+                    default_timeout=self.default_timeout,
+                    max_concurrency=self.max_concurrency,
+                )
+
+            # Set up the executor chain with optional wrappers
+            executor = self.strategy
+
+            # Apply wrappers in reverse order (innermost first)
+            if self.enable_retries:
+                self.logger.debug("Enabling retry logic")
+                executor = RetryableToolExecutor(
+                    executor=executor,
+                    default_config=RetryConfig(max_retries=self.max_retries),
+                )
+
+            if self.enable_rate_limiting:
+                self.logger.debug("Enabling rate limiting")
+                rate_limiter = RateLimiter(
+                    global_limit=self.global_rate_limit,
+                    tool_limits=self.tool_rate_limits,
+                )
+                executor = RateLimitedToolExecutor(
+                    executor=executor,
+                    limiter=rate_limiter,
+                )
+
+            if self.enable_caching:
+                self.logger.debug("Enabling result caching")
+                cache = InMemoryCache(default_ttl=self.cache_ttl)
+                executor = CachingToolExecutor(
+                    executor=executor,
+                    cache=cache,
+                    default_ttl=self.cache_ttl,
+                )
+
+            self.executor = executor
+
+            # Initialize parser plugins
+            # Discover plugins if not already done
+            plugins = plugin_registry.list_plugins().get("parser", [])
+            if not plugins:
+                discover_default_plugins()
+                plugins = plugin_registry.list_plugins().get("parser", [])
+
+            # Get parser plugins
+            if self.parser_plugin_names:
+                self.parsers = [
+                    plugin_registry.get_plugin("parser", name)
+                    for name in self.parser_plugin_names
+                    if plugin_registry.get_plugin("parser", name)
+                ]
+            else:
+                self.parsers = [
+                    plugin_registry.get_plugin("parser", name) for name in plugins
+                ]
+
+            self.logger.debug(f"Initialized with {len(self.parsers)} parser plugins")
+            self._initialized = True
+
+    async def process(
         self,
-        text: str,
+        data: Union[str, Dict[str, Any], List[Dict[str, Any]]],
         timeout: Optional[float] = None,
         use_cache: bool = True,
         request_id: Optional[str] = None,
     ) -> List[ToolResult]:
         """
-        Process text to extract and execute tool calls.
-
+        Process tool calls from various input formats.
+
+        This method handles different input types:
+        - String: Parses tool calls from text using registered parsers
+        - Dict: Processes an OpenAI-style tool_calls object
+        - List[Dict]: Processes a list of individual tool calls
+
         Args:
-            text: Text to process.
-            timeout: Optional timeout for execution.
-            use_cache: Whether to use cached results.
-            request_id: Optional request ID for logging.
-
+            data: Input data containing tool calls
+            timeout: Optional timeout for execution
+            use_cache: Whether to use cached results
+            request_id: Optional request ID for logging
+
         Returns:
-            List of tool results.
+            List of tool results
         """
+        # Ensure initialization
+        await self.initialize()
+
         # Create request context
-        with request_logging(request_id) as req_id:
-            self.logger.debug(f"Processing text ({len(text)} chars)")
-
-            # Extract tool calls
-            calls = await self._extract_tool_calls(text)
-
+        async with request_logging(request_id) as req_id:
+            # Handle different input types
+            if isinstance(data, str):
+                # Text processing
+                self.logger.debug(f"Processing text ({len(data)} chars)")
+                calls = await self._extract_tool_calls(data)
+            elif isinstance(data, dict):
+                # Handle OpenAI format with tool_calls array
+                if "tool_calls" in data and isinstance(data["tool_calls"], list):
+                    calls = []
+                    for tc in data["tool_calls"]:
+                        if "function" in tc and isinstance(tc["function"], dict):
+                            function = tc["function"]
+                            name = function.get("name")
+                            args_str = function.get("arguments", "{}")
+
+                            # Parse arguments
+                            try:
+                                args = json.loads(args_str) if isinstance(args_str, str) else args_str
+                            except json.JSONDecodeError:
+                                args = {"raw": args_str}
+
+                            if name:
+                                calls.append(ToolCall(tool=name, arguments=args, id=tc.get("id")))
+                else:
+                    # Assume it's a single tool call
+                    calls = [ToolCall(**data)]
+            elif isinstance(data, list):
+                # List of tool calls
+                calls = [ToolCall(**tc) for tc in data]
+            else:
+                self.logger.warning(f"Unsupported input type: {type(data)}")
+                return []
+
             if not calls:
                 self.logger.debug("No tool calls found")
                 return []
-
+
             self.logger.debug(f"Found {len(calls)} tool calls")
-
+
             # Execute tool calls
-            with log_context_span("tool_execution", {"num_calls": len(calls)}):
+            async with log_context_span("tool_execution", {"num_calls": len(calls)}):
                 # Check if any tools are unknown
-                tool_names = {call.tool for call in calls}
-                unknown_tools = [name for name in tool_names if not self.registry.get_tool(name)]
-
+                unknown_tools = []
+                for call in calls:
+                    tool = await self.registry.get_tool(call.tool)
+                    if not tool:
+                        unknown_tools.append(call.tool)
+
                 if unknown_tools:
                     self.logger.warning(f"Unknown tools: {unknown_tools}")
-
+
                 # Execute tools
                 results = await self.executor.execute(calls, timeout=timeout)
-
+
                 # Log metrics for each tool call
                 for call, result in zip(calls, results):
-                    log_tool_call(call, result)
-
+                    await log_tool_call(call, result)
+
                     # Record metrics
                     duration = (result.end_time - result.start_time).total_seconds()
-                    metrics.log_tool_execution(
+                    await metrics.log_tool_execution(
                         tool=call.tool,
                         success=result.error is None,
                         duration=duration,
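Editor's note: the reworked process() is the heart of this hunk. It dispatches on input type, unpacks OpenAI-style function payloads (falling back to {"raw": ...} when the arguments string is not valid JSON), and awaits the registry, logging, and metrics calls that were synchronous in 0.1.6. A sketch of the three accepted input shapes, taken from the branches above; "search" is a hypothetical tool name:

```python
import asyncio

from chuk_tool_processor.core.processor import ToolProcessor

async def main() -> None:
    processor = ToolProcessor()  # initialize() runs lazily on first use

    # OpenAI chat-completion shape: "arguments" arrives as a JSON string
    # and is json.loads()-ed; invalid JSON falls back to {"raw": ...}.
    openai_style = {
        "tool_calls": [
            {"id": "call_1",
             "function": {"name": "search", "arguments": '{"query": "weather"}'}},
        ]
    }
    results = await processor.process(openai_style)

    # List shape: each dict is passed straight to ToolCall(**tc).
    results = await processor.process(
        [{"tool": "search", "arguments": {"query": "weather"}}]
    )

    # String shape: handed to the installed parser plugins; the exact text
    # formats they accept live in chuk_tool_processor/plugins/parsers/.
    results = await processor.process("...model output containing tool calls...")
    print(results)

asyncio.run(main())
```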
@@ -178,9 +278,64 @@ class ToolProcessor:
                         cached=getattr(result, "cached", False),
                         attempts=getattr(result, "attempts", 1),
                     )
-
+
             return results
 
+    async def process_text(
+        self,
+        text: str,
+        timeout: Optional[float] = None,
+        use_cache: bool = True,
+        request_id: Optional[str] = None,
+    ) -> List[ToolResult]:
+        """
+        Process text to extract and execute tool calls.
+
+        Legacy alias for process() with string input.
+
+        Args:
+            text: Text to process.
+            timeout: Optional timeout for execution.
+            use_cache: Whether to use cached results.
+            request_id: Optional request ID for logging.
+
+        Returns:
+            List of tool results.
+        """
+        return await self.process(
+            data=text,
+            timeout=timeout,
+            use_cache=use_cache,
+            request_id=request_id,
+        )
+
+    async def execute(
+        self,
+        calls: List[ToolCall],
+        timeout: Optional[float] = None,
+        use_cache: bool = True,
+    ) -> List[ToolResult]:
+        """
+        Execute a list of ToolCall objects directly.
+
+        Args:
+            calls: List of tool calls to execute
+            timeout: Optional execution timeout
+            use_cache: Whether to use cached results
+
+        Returns:
+            List of tool results
+        """
+        # Ensure initialization
+        await self.initialize()
+
+        # Execute with the configured executor
+        return await self.executor.execute(
+            calls=calls,
+            timeout=timeout,
+            use_cache=use_cache if hasattr(self.executor, "use_cache") else True
+        )
+
     async def _extract_tool_calls(self, text: str) -> List[ToolCall]:
         """
         Extract tool calls from text using all available parsers.
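Editor's note: the new execute() entry point skips parsing entirely for callers that already hold structured calls, and like process() it self-initializes on first use. A minimal sketch, with a hypothetical registered tool named "add":

```python
import asyncio

from chuk_tool_processor.core.processor import ToolProcessor
from chuk_tool_processor.models.tool_call import ToolCall

async def main() -> None:
    processor = ToolProcessor()

    # No text parsing involved: the calls are already structured.
    # "add" is a hypothetical tool assumed to be registered.
    calls = [ToolCall(tool="add", arguments={"a": 1, "b": 2})]
    results = await processor.execute(calls, timeout=5.0)

    for result in results:
        # ToolResult carries an `error` field (None on success), per this diff.
        print(result.error or result)

asyncio.run(main())
```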
@@ -194,39 +349,22 @@ class ToolProcessor:
         all_calls: List[ToolCall] = []
 
         # Try each parser
-        with log_context_span("parsing", {"text_length": len(text)}):
+        async with log_context_span("parsing", {"text_length": len(text)}):
+            parse_tasks = []
+
+            # Create parsing tasks
             for parser in self.parsers:
-                parser_name = parser.__class__.__name__
-
-                with log_context_span(f"parser.{parser_name}", log_duration=True):
-                    start_time = time.time()
-
-                    try:
-                        # Try to parse
-                        calls = parser.try_parse(text)
-
-                        # Log success
-                        duration = time.time() - start_time
-                        metrics.log_parser_metric(
-                            parser=parser_name,
-                            success=True,
-                            duration=duration,
-                            num_calls=len(calls),
-                        )
-
-                        # Add calls to result
-                        all_calls.extend(calls)
-
-                    except Exception as e:
-                        # Log failure
-                        duration = time.time() - start_time
-                        metrics.log_parser_metric(
-                            parser=parser_name,
-                            success=False,
-                            duration=duration,
-                            num_calls=0,
-                        )
-                        self.logger.error(f"Parser {parser_name} failed: {str(e)}")
+                parse_tasks.append(self._try_parser(parser, text))
+
+            # Execute all parsers concurrently
+            parser_results = await asyncio.gather(*parse_tasks, return_exceptions=True)
+
+            # Collect successful results
+            for result in parser_results:
+                if isinstance(result, Exception):
+                    continue
+                if result:
+                    all_calls.extend(result)
 
         # ------------------------------------------------------------------ #
         # Remove duplicates – use a stable digest instead of hashing a
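Editor's note: the sequential per-parser loop from 0.1.6 moves into _try_parser() (next hunk) and is fanned out with asyncio.gather; return_exceptions=True turns a raised exception into a return value, so one failing parser cannot cancel its siblings. A standalone sketch of that pattern, independent of this package:

```python
import asyncio

async def try_parse(name: str, text: str) -> list[str]:
    # Stand-in for a parser plugin's try_parse(); "bad" simulates a failure.
    if name == "bad":
        raise ValueError("unparseable")
    return [f"{name}:{text}"]

async def main() -> None:
    tasks = [try_parse(n, "hello") for n in ("xml", "json", "bad")]

    # Exceptions come back as values instead of propagating,
    # so every parser gets a chance to run to completion.
    results = await asyncio.gather(*tasks, return_exceptions=True)

    all_calls = [call for r in results if not isinstance(r, Exception) for call in r]
    print(all_calls)  # ['xml:hello', 'json:hello']

asyncio.run(main())
```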
@@ -243,11 +381,83 @@ class ToolProcessor:
             unique_calls[key] = call
 
         return list(unique_calls.values())
+
+    async def _try_parser(self, parser, text: str) -> List[ToolCall]:
+        """Try a single parser with metrics and logging."""
+        parser_name = parser.__class__.__name__
+
+        async with log_context_span(f"parser.{parser_name}", log_duration=True):
+            start_time = time.time()
+
+            try:
+                # Try to parse
+                calls = await parser.try_parse(text)
+
+                # Log success
+                duration = time.time() - start_time
+                await metrics.log_parser_metric(
+                    parser=parser_name,
+                    success=True,
+                    duration=duration,
+                    num_calls=len(calls),
+                )
+
+                return calls
+
+            except Exception as e:
+                # Log failure
+                duration = time.time() - start_time
+                await metrics.log_parser_metric(
+                    parser=parser_name,
+                    success=False,
+                    duration=duration,
+                    num_calls=0,
+                )
+                self.logger.error(f"Parser {parser_name} failed: {str(e)}")
+                return []
 
 
-# Create a global processor with default settings
-default_processor = ToolProcessor()
-
+# Create a global processor instance
+_global_processor: Optional[ToolProcessor] = None
+_processor_lock = asyncio.Lock()
+
+async def get_default_processor() -> ToolProcessor:
+    """Get or initialize the default global processor."""
+    global _global_processor
+
+    if _global_processor is None:
+        async with _processor_lock:
+            if _global_processor is None:
+                _global_processor = ToolProcessor()
+                await _global_processor.initialize()
+
+    return _global_processor
+
+async def process(
+    data: Union[str, Dict[str, Any], List[Dict[str, Any]]],
+    timeout: Optional[float] = None,
+    use_cache: bool = True,
+    request_id: Optional[str] = None,
+) -> List[ToolResult]:
+    """
+    Process tool calls with the default processor.
+
+    Args:
+        data: Input data (text, dict, or list of dicts)
+        timeout: Optional timeout for execution
+        use_cache: Whether to use cached results
+        request_id: Optional request ID for logging
+
+    Returns:
+        List of tool results
+    """
+    processor = await get_default_processor()
+    return await processor.process(
+        data=data,
+        timeout=timeout,
+        use_cache=use_cache,
+        request_id=request_id,
+    )
 
 async def process_text(
     text: str,
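Editor's note: get_default_processor() replaces the eagerly constructed default_processor of 0.1.6 with a lazily built singleton, guarded by the same double-checked locking as ToolProcessor.initialize(): the cheap None check runs without the lock, then is repeated under the lock before construction. Typical use of the module-level helper; the tool name is hypothetical:

```python
import asyncio

from chuk_tool_processor.core.processor import process

async def main() -> None:
    # First call builds and initializes the shared ToolProcessor;
    # every later call reuses the same instance.
    results = await process(
        [{"tool": "search", "arguments": {"query": "weather"}}],  # hypothetical tool
        timeout=10.0,
        request_id="req-42",
    )
    for result in results:
        print(result)

asyncio.run(main())
```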
@@ -257,6 +467,8 @@ async def process_text(
 ) -> List[ToolResult]:
     """
     Process text with the default processor.
+
+    Legacy alias for backward compatibility.
 
     Args:
         text: Text to process.
@@ -267,7 +479,8 @@ async def process_text(
     Returns:
         List of tool results.
     """
-    return await default_processor.process_text(
+    processor = await get_default_processor()
+    return await processor.process_text(
         text=text,
         timeout=timeout,
         use_cache=use_cache,