PyPI - chuk-tool-processor - Versions diffs - 0.6.4__py3-none-any.whl → 0.9.7__py3-none-any.whl - Mend

chuk-tool-processor 0.6.4__py3-none-any.whl → 0.9.7__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of chuk-tool-processor might be problematic. Click here for more details.

Files changed (66)

chuk_tool_processor/core/__init__.py +32 -1
chuk_tool_processor/core/exceptions.py +225 -13
chuk_tool_processor/core/processor.py +135 -104
chuk_tool_processor/execution/strategies/__init__.py +6 -0
chuk_tool_processor/execution/strategies/inprocess_strategy.py +142 -150
chuk_tool_processor/execution/strategies/subprocess_strategy.py +202 -206
chuk_tool_processor/execution/tool_executor.py +82 -84
chuk_tool_processor/execution/wrappers/__init__.py +42 -0
chuk_tool_processor/execution/wrappers/caching.py +150 -116
chuk_tool_processor/execution/wrappers/circuit_breaker.py +370 -0
chuk_tool_processor/execution/wrappers/rate_limiting.py +76 -43
chuk_tool_processor/execution/wrappers/retry.py +116 -78
chuk_tool_processor/logging/__init__.py +23 -17
chuk_tool_processor/logging/context.py +40 -45
chuk_tool_processor/logging/formatter.py +22 -21
chuk_tool_processor/logging/helpers.py +28 -42
chuk_tool_processor/logging/metrics.py +13 -15
chuk_tool_processor/mcp/__init__.py +8 -12
chuk_tool_processor/mcp/mcp_tool.py +158 -114
chuk_tool_processor/mcp/register_mcp_tools.py +22 -22
chuk_tool_processor/mcp/setup_mcp_http_streamable.py +57 -17
chuk_tool_processor/mcp/setup_mcp_sse.py +57 -17
chuk_tool_processor/mcp/setup_mcp_stdio.py +11 -11
chuk_tool_processor/mcp/stream_manager.py +333 -276
chuk_tool_processor/mcp/transport/__init__.py +22 -29
chuk_tool_processor/mcp/transport/base_transport.py +180 -44
chuk_tool_processor/mcp/transport/http_streamable_transport.py +505 -325
chuk_tool_processor/mcp/transport/models.py +100 -0
chuk_tool_processor/mcp/transport/sse_transport.py +607 -276
chuk_tool_processor/mcp/transport/stdio_transport.py +597 -116
chuk_tool_processor/models/__init__.py +21 -1
chuk_tool_processor/models/execution_strategy.py +16 -21
chuk_tool_processor/models/streaming_tool.py +28 -25
chuk_tool_processor/models/tool_call.py +49 -31
chuk_tool_processor/models/tool_export_mixin.py +22 -8
chuk_tool_processor/models/tool_result.py +40 -77
chuk_tool_processor/models/tool_spec.py +350 -0
chuk_tool_processor/models/validated_tool.py +36 -18
chuk_tool_processor/observability/__init__.py +30 -0
chuk_tool_processor/observability/metrics.py +312 -0
chuk_tool_processor/observability/setup.py +105 -0
chuk_tool_processor/observability/tracing.py +345 -0
chuk_tool_processor/plugins/__init__.py +1 -1
chuk_tool_processor/plugins/discovery.py +11 -11
chuk_tool_processor/plugins/parsers/__init__.py +1 -1
chuk_tool_processor/plugins/parsers/base.py +1 -2
chuk_tool_processor/plugins/parsers/function_call_tool.py +13 -8
chuk_tool_processor/plugins/parsers/json_tool.py +4 -3
chuk_tool_processor/plugins/parsers/openai_tool.py +12 -7
chuk_tool_processor/plugins/parsers/xml_tool.py +4 -4
chuk_tool_processor/registry/__init__.py +12 -12
chuk_tool_processor/registry/auto_register.py +22 -30
chuk_tool_processor/registry/decorators.py +127 -129
chuk_tool_processor/registry/interface.py +26 -23
chuk_tool_processor/registry/metadata.py +27 -22
chuk_tool_processor/registry/provider.py +17 -18
chuk_tool_processor/registry/providers/__init__.py +16 -19
chuk_tool_processor/registry/providers/memory.py +18 -25
chuk_tool_processor/registry/tool_export.py +42 -51
chuk_tool_processor/utils/validation.py +15 -16
chuk_tool_processor-0.9.7.dist-info/METADATA +1813 -0
chuk_tool_processor-0.9.7.dist-info/RECORD +67 -0
chuk_tool_processor-0.6.4.dist-info/METADATA +0 -697
chuk_tool_processor-0.6.4.dist-info/RECORD +0 -60
{chuk_tool_processor-0.6.4.dist-info → chuk_tool_processor-0.9.7.dist-info}/WHEEL +0 -0
{chuk_tool_processor-0.6.4.dist-info → chuk_tool_processor-0.9.7.dist-info}/top_level.txt +0 -0

chuk_tool_processor/core/processor.py CHANGED Viewed

@@ -7,23 +7,28 @@ This module provides the central ToolProcessor class which handles:
 - Tool execution using configurable strategies
 - Application of execution wrappers (caching, retries, etc.)
 """
 from __future__ import annotations
 import asyncio
-import time
-import json
 import hashlib
-from typing import Any, Dict, List, Optional, Type, Union, Set
+import json
+import time
+from typing import Any
+from chuk_tool_processor.execution.strategies.inprocess_strategy import InProcessStrategy
+from chuk_tool_processor.execution.wrappers.caching import CachingToolExecutor, InMemoryCache
+from chuk_tool_processor.execution.wrappers.circuit_breaker import (
+    CircuitBreakerConfig,
+    CircuitBreakerExecutor,
+)
+from chuk_tool_processor.execution.wrappers.rate_limiting import RateLimitedToolExecutor, RateLimiter
+from chuk_tool_processor.execution.wrappers.retry import RetryableToolExecutor, RetryConfig
+from chuk_tool_processor.logging import get_logger, log_context_span, log_tool_call, metrics, request_logging
 from chuk_tool_processor.models.tool_call import ToolCall
 from chuk_tool_processor.models.tool_result import ToolResult
+from chuk_tool_processor.plugins.discovery import discover_default_plugins, plugin_registry
 from chuk_tool_processor.registry import ToolRegistryInterface, ToolRegistryProvider
-from chuk_tool_processor.execution.strategies.inprocess_strategy import InProcessStrategy
-from chuk_tool_processor.execution.wrappers.caching import CacheInterface, InMemoryCache, CachingToolExecutor
-from chuk_tool_processor.execution.wrappers.rate_limiting import RateLimiter, RateLimitedToolExecutor
-from chuk_tool_processor.execution.wrappers.retry import RetryConfig, RetryableToolExecutor
-from chuk_tool_processor.plugins.discovery import plugin_registry, discover_default_plugins
-from chuk_tool_processor.logging import get_logger, log_context_span, request_logging, log_tool_call, metrics
 class ToolProcessor:
@@ -34,18 +39,22 @@ class ToolProcessor:
     def __init__(
         self,
-        registry: Optional[ToolRegistryInterface] = None,
-        strategy = None,
+        registry: ToolRegistryInterface | None = None,
+        strategy=None,
         default_timeout: float = 10.0,
-        max_concurrency: Optional[int] = None,
+        max_concurrency: int | None = None,
         enable_caching: bool = True,
         cache_ttl: int = 300,
         enable_rate_limiting: bool = False,
-        global_rate_limit: Optional[int] = None,
-        tool_rate_limits: Optional[Dict[str, tuple]] = None,
+        global_rate_limit: int | None = None,
+        tool_rate_limits: dict[str, tuple] | None = None,
         enable_retries: bool = True,
         max_retries: int = 3,
-        parser_plugins: Optional[List[str]] = None,
+        retry_config: RetryConfig | None = None,
+        enable_circuit_breaker: bool = False,
+        circuit_breaker_threshold: int = 5,
+        circuit_breaker_timeout: float = 60.0,
+        parser_plugins: list[str] | None = None,
     ):
         """
         Initialize the tool processor.
@@ -62,11 +71,14 @@ class ToolProcessor:
             tool_rate_limits: Dict mapping tool names to (limit, period) tuples.
             enable_retries: Whether to enable automatic retries.
             max_retries: Maximum number of retry attempts.
+            enable_circuit_breaker: Whether to enable circuit breaker pattern.
+            circuit_breaker_threshold: Number of failures before opening circuit.
+            circuit_breaker_timeout: Seconds to wait before testing recovery.
             parser_plugins: List of parser plugin names to use.
                 If None, uses all available parsers.
         """
         self.logger = get_logger("chuk_tool_processor.processor")
         # Store initialization parameters for lazy initialization
         self._registry = registry
         self._strategy = strategy
@@ -79,14 +91,18 @@ class ToolProcessor:
         self.tool_rate_limits = tool_rate_limits
         self.enable_retries = enable_retries
         self.max_retries = max_retries
+        self.retry_config = retry_config
+        self.enable_circuit_breaker = enable_circuit_breaker
+        self.circuit_breaker_threshold = circuit_breaker_threshold
+        self.circuit_breaker_timeout = circuit_breaker_timeout
         self.parser_plugin_names = parser_plugins
         # Placeholder for initialized components
         self.registry = None
         self.strategy = None
         self.executor = None
         self.parsers = []
         # Flag for tracking initialization state
         self._initialized = False
         self._init_lock = asyncio.Lock()
@@ -94,28 +110,28 @@ class ToolProcessor:
     async def initialize(self) -> None:
         """
         Initialize the processor asynchronously.
         This method ensures all components are properly initialized before use.
         It is called automatically by other methods if needed.
         """
         # Fast path if already initialized
         if self._initialized:
             return
         # Ensure only one initialization happens at a time
         async with self._init_lock:
             # Double-check pattern after acquiring lock
             if self._initialized:
                 return
             self.logger.debug("Initializing tool processor")
             # Get the registry
             if self._registry is not None:
                 self.registry = self._registry
             else:
                 self.registry = await ToolRegistryProvider.get_registry()
             # Create execution strategy if needed
             if self._strategy is not None:
                 self.strategy = self._strategy
@@ -125,18 +141,32 @@ class ToolProcessor:
                     default_timeout=self.default_timeout,
                     max_concurrency=self.max_concurrency,
                 )
             # Set up the executor chain with optional wrappers
             executor = self.strategy
             # Apply wrappers in reverse order (innermost first)
+            # Circuit breaker goes innermost (closest to actual execution)
+            if self.enable_circuit_breaker:
+                self.logger.debug("Enabling circuit breaker")
+                circuit_config = CircuitBreakerConfig(
+                    failure_threshold=self.circuit_breaker_threshold,
+                    reset_timeout=self.circuit_breaker_timeout,
+                )
+                executor = CircuitBreakerExecutor(
+                    executor=executor,
+                    default_config=circuit_config,
+                )
             if self.enable_retries:
                 self.logger.debug("Enabling retry logic")
+                # Use custom retry config if provided, otherwise create default
+                retry_cfg = self.retry_config or RetryConfig(max_retries=self.max_retries)
                 executor = RetryableToolExecutor(
                     executor=executor,
-                    default_config=RetryConfig(max_retries=self.max_retries),
+                    default_config=retry_cfg,
                 )
             if self.enable_rate_limiting:
                 self.logger.debug("Enabling rate limiting")
                 rate_limiter = RateLimiter(
@@ -147,7 +177,7 @@ class ToolProcessor:
                     executor=executor,
                     limiter=rate_limiter,
                 )
             if self.enable_caching:
                 self.logger.debug("Enabling result caching")
                 cache = InMemoryCache(default_ttl=self.cache_ttl)
@@ -156,16 +186,16 @@ class ToolProcessor:
                     cache=cache,
                     default_ttl=self.cache_ttl,
                 )
             self.executor = executor
             # Initialize parser plugins
             # Discover plugins if not already done
             plugins = plugin_registry.list_plugins().get("parser", [])
             if not plugins:
                 discover_default_plugins()
                 plugins = plugin_registry.list_plugins().get("parser", [])
             # Get parser plugins
             if self.parser_plugin_names:
                 self.parsers = [
@@ -174,42 +204,40 @@ class ToolProcessor:
                     if plugin_registry.get_plugin("parser", name)
                 ]
             else:
-                self.parsers = [
-                    plugin_registry.get_plugin("parser", name) for name in plugins
-                ]
+                self.parsers = [plugin_registry.get_plugin("parser", name) for name in plugins]
             self.logger.debug(f"Initialized with {len(self.parsers)} parser plugins")
             self._initialized = True
     async def process(
         self,
-        data: Union[str, Dict[str, Any], List[Dict[str, Any]]],
-        timeout: Optional[float] = None,
-        use_cache: bool = True,
-        request_id: Optional[str] = None,
-    ) -> List[ToolResult]:
+        data: str | dict[str, Any] | list[dict[str, Any]],
+        timeout: float | None = None,
+        use_cache: bool = True,  # noqa: ARG002
+        request_id: str | None = None,
+    ) -> list[ToolResult]:
         """
         Process tool calls from various input formats.
         This method handles different input types:
         - String: Parses tool calls from text using registered parsers
         - Dict: Processes an OpenAI-style tool_calls object
         - List[Dict]: Processes a list of individual tool calls
         Args:
             data: Input data containing tool calls
             timeout: Optional timeout for execution
             use_cache: Whether to use cached results
             request_id: Optional request ID for logging
         Returns:
             List of tool results
         """
         # Ensure initialization
         await self.initialize()
         # Create request context
-        async with request_logging(request_id) as req_id:
+        async with request_logging(request_id):
             # Handle different input types
             if isinstance(data, str):
                 # Text processing
@@ -224,13 +252,13 @@ class ToolProcessor:
                             function = tc["function"]
                             name = function.get("name")
                             args_str = function.get("arguments", "{}")
                             # Parse arguments
                             try:
                                 args = json.loads(args_str) if isinstance(args_str, str) else args_str
                             except json.JSONDecodeError:
                                 args = {"raw": args_str}
                             if name:
                                 calls.append(ToolCall(tool=name, arguments=args, id=tc.get("id")))
                 else:
@@ -242,32 +270,34 @@ class ToolProcessor:
             else:
                 self.logger.warning(f"Unsupported input type: {type(data)}")
                 return []
             if not calls:
                 self.logger.debug("No tool calls found")
                 return []
             self.logger.debug(f"Found {len(calls)} tool calls")
             # Execute tool calls
             async with log_context_span("tool_execution", {"num_calls": len(calls)}):
-                # Check if any tools are unknown
+                # Check if any tools are unknown - search across all namespaces
                 unknown_tools = []
+                all_tools = await self.registry.list_tools()  # Returns list of (namespace, name) tuples
+                tool_names_in_registry = {name for ns, name in all_tools}
                 for call in calls:
-                    tool = await self.registry.get_tool(call.tool)
-                    if not tool:
+                    if call.tool not in tool_names_in_registry:
                         unknown_tools.append(call.tool)
                 if unknown_tools:
-                    self.logger.warning(f"Unknown tools: {unknown_tools}")
+                    self.logger.debug(f"Unknown tools: {unknown_tools}")
                 # Execute tools
                 results = await self.executor.execute(calls, timeout=timeout)
                 # Log metrics for each tool call
-                for call, result in zip(calls, results):
+                for call, result in zip(calls, results, strict=False):
                     await log_tool_call(call, result)
                     # Record metrics
                     duration = (result.end_time - result.start_time).total_seconds()
                     await metrics.log_tool_execution(
@@ -278,19 +308,19 @@ class ToolProcessor:
                         cached=getattr(result, "cached", False),
                         attempts=getattr(result, "attempts", 1),
                     )
                 return results
     async def process_text(
         self,
         text: str,
-        timeout: Optional[float] = None,
+        timeout: float | None = None,
         use_cache: bool = True,
-        request_id: Optional[str] = None,
-    ) -> List[ToolResult]:
+        request_id: str | None = None,
+    ) -> list[ToolResult]:
         """
         Process text to extract and execute tool calls.
         Legacy alias for process() with string input.
         Args:
@@ -308,35 +338,33 @@ class ToolProcessor:
             use_cache=use_cache,
             request_id=request_id,
         )
     async def execute(
         self,
-        calls: List[ToolCall],
-        timeout: Optional[float] = None,
+        calls: list[ToolCall],
+        timeout: float | None = None,
         use_cache: bool = True,
-    ) -> List[ToolResult]:
+    ) -> list[ToolResult]:
         """
         Execute a list of ToolCall objects directly.
         Args:
             calls: List of tool calls to execute
             timeout: Optional execution timeout
             use_cache: Whether to use cached results
         Returns:
             List of tool results
         """
         # Ensure initialization
         await self.initialize()
         # Execute with the configured executor
         return await self.executor.execute(
-            calls=calls,
-            timeout=timeout,
-            use_cache=use_cache if hasattr(self.executor, "use_cache") else True
+            calls=calls, timeout=timeout, use_cache=use_cache if hasattr(self.executor, "use_cache") else True
         )
-    async def _extract_tool_calls(self, text: str) -> List[ToolCall]:
+    async def _extract_tool_calls(self, text: str) -> list[ToolCall]:
         """
         Extract tool calls from text using all available parsers.
@@ -346,19 +374,19 @@ class ToolProcessor:
         Returns:
             List of tool calls.
         """
-        all_calls: List[ToolCall] = []
+        all_calls: list[ToolCall] = []
         # Try each parser
         async with log_context_span("parsing", {"text_length": len(text)}):
             parse_tasks = []
             # Create parsing tasks
             for parser in self.parsers:
                 parse_tasks.append(self._try_parser(parser, text))
             # Execute all parsers concurrently
             parser_results = await asyncio.gather(*parse_tasks, return_exceptions=True)
             # Collect successful results
             for result in parser_results:
                 if isinstance(result, Exception):
@@ -370,29 +398,29 @@ class ToolProcessor:
         # Remove duplicates - use a stable digest instead of hashing a
         # frozenset of argument items (which breaks on unhashable types).
         # ------------------------------------------------------------------ #
-        def _args_digest(args: Dict[str, Any]) -> str:
+        def _args_digest(args: dict[str, Any]) -> str:
             """Return a stable hash for any JSON-serialisable payload."""
             blob = json.dumps(args, sort_keys=True, default=str)
-            return hashlib.md5(blob.encode()).hexdigest()
+            return hashlib.md5(blob.encode(), usedforsecurity=False).hexdigest()  # nosec B324
-        unique_calls: Dict[str, ToolCall] = {}
+        unique_calls: dict[str, ToolCall] = {}
         for call in all_calls:
             key = f"{call.tool}:{_args_digest(call.arguments)}"
             unique_calls[key] = call
         return list(unique_calls.values())
-    async def _try_parser(self, parser, text: str) -> List[ToolCall]:
+    async def _try_parser(self, parser, text: str) -> list[ToolCall]:
         """Try a single parser with metrics and logging."""
         parser_name = parser.__class__.__name__
         async with log_context_span(f"parser.{parser_name}", log_duration=True):
             start_time = time.time()
             try:
                 # Try to parse
                 calls = await parser.try_parse(text)
                 # Log success
                 duration = time.time() - start_time
                 await metrics.log_parser_metric(
@@ -401,9 +429,9 @@ class ToolProcessor:
                     duration=duration,
                     num_calls=len(calls),
                 )
                 return calls
             except Exception as e:
                 # Log failure
                 duration = time.time() - start_time
@@ -413,41 +441,43 @@ class ToolProcessor:
                     duration=duration,
                     num_calls=0,
                 )
-                self.logger.error(f"Parser {parser_name} failed: {str(e)}")
+                self.logger.debug(f"Parser {parser_name} failed: {str(e)}")
                 return []
 # Create a global processor instance
-_global_processor: Optional[ToolProcessor] = None
+_global_processor: ToolProcessor | None = None
 _processor_lock = asyncio.Lock()
 async def get_default_processor() -> ToolProcessor:
     """Get or initialize the default global processor."""
     global _global_processor
     if _global_processor is None:
         async with _processor_lock:
             if _global_processor is None:
                 _global_processor = ToolProcessor()
                 await _global_processor.initialize()
     return _global_processor
 async def process(
-    data: Union[str, Dict[str, Any], List[Dict[str, Any]]],
-    timeout: Optional[float] = None,
+    data: str | dict[str, Any] | list[dict[str, Any]],
+    timeout: float | None = None,
     use_cache: bool = True,
-    request_id: Optional[str] = None,
-) -> List[ToolResult]:
+    request_id: str | None = None,
+) -> list[ToolResult]:
     """
     Process tool calls with the default processor.
     Args:
         data: Input data (text, dict, or list of dicts)
         timeout: Optional timeout for execution
         use_cache: Whether to use cached results
         request_id: Optional request ID for logging
     Returns:
         List of tool results
     """
@@ -459,15 +489,16 @@ async def process(
         request_id=request_id,
     )
 async def process_text(
     text: str,
-    timeout: Optional[float] = None,
+    timeout: float | None = None,
     use_cache: bool = True,
-    request_id: Optional[str] = None,
-) -> List[ToolResult]:
+    request_id: str | None = None,
+) -> list[ToolResult]:
     """
     Process text with the default processor.
     Legacy alias for backward compatibility.
     Args:
@@ -485,4 +516,4 @@ async def process_text(
         timeout=timeout,
         use_cache=use_cache,
         request_id=request_id,
-    )
+    )

chuk_tool_processor/execution/strategies/__init__.py CHANGED Viewed

@@ -0,0 +1,6 @@
+"""Execution strategies for tool processing."""
+from chuk_tool_processor.execution.strategies.inprocess_strategy import InProcessStrategy
+from chuk_tool_processor.execution.strategies.subprocess_strategy import SubprocessStrategy
+__all__ = ["InProcessStrategy", "SubprocessStrategy"]

chuk-tool-processor 0.6.4__py3-none-any.whl → 0.9.7__py3-none-any.whl

Potentially problematic release.

chuk-tool-processor 0.6.4__py3-none-any.whl → 0.9.7__py3-none-any.whl