PyPI - asap-protocol - Versions diffs - 0.1.0__py3-none-any.whl → 0.3.0__py3-none-any.whl - Mend

asap-protocol 0.1.0__py3-none-any.whl → 0.3.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (15) hide show

asap/__init__.py +1 -1
asap/errors.py +42 -0
asap/examples/coordinator.py +1 -1
asap/examples/echo_agent.py +1 -1
asap/models/constants.py +1 -0
asap/observability/metrics.py +1 -0
asap/transport/executors.py +156 -0
asap/transport/handlers.py +17 -5
asap/transport/middleware.py +298 -3
asap/transport/server.py +668 -274
{asap_protocol-0.1.0.dist-info → asap_protocol-0.3.0.dist-info}/METADATA +49 -73
{asap_protocol-0.1.0.dist-info → asap_protocol-0.3.0.dist-info}/RECORD +15 -14
{asap_protocol-0.1.0.dist-info → asap_protocol-0.3.0.dist-info}/WHEEL +0 -0
{asap_protocol-0.1.0.dist-info → asap_protocol-0.3.0.dist-info}/entry_points.txt +0 -0
{asap_protocol-0.1.0.dist-info → asap_protocol-0.3.0.dist-info}/licenses/LICENSE +0 -0

asap/__init__.py CHANGED Viewed

@@ -4,4 +4,4 @@ A streamlined, scalable, asynchronous protocol for agent-to-agent communication
 and task coordination.
 """
-__version__ = "0.1.0"
+__version__ = "0.3.0"

asap/errors.py CHANGED Viewed

@@ -148,3 +148,45 @@ class TaskAlreadyCompletedError(ASAPError):
         )
         self.task_id = task_id
         self.current_status = current_status
+class ThreadPoolExhaustedError(ASAPError):
+    """Signal that the bounded thread pool has no capacity for another task.
+    Raised when a synchronous handler is submitted to a bounded thread pool
+    that is already at its maximum capacity. Rejecting the task instead of
+    accepting it caps resource consumption (DoS mitigation).
+    Attributes:
+        max_threads: Maximum number of threads in the pool
+        active_threads: Number of threads in use when the error was raised
+    """
+    def __init__(
+        self,
+        max_threads: int,
+        active_threads: int,
+        details: dict[str, Any] | None = None,
+    ) -> None:
+        """Build the error with a fixed code, a readable message and details.
+        Args:
+            max_threads: Maximum number of threads in the pool
+            active_threads: Current number of active threads
+            details: Optional extra context merged into the error details
+        """
+        # Start from the two canonical fields; caller-supplied keys are merged
+        # afterwards, so they take precedence if a key is repeated.
+        merged_details: dict[str, Any] = {
+            "max_threads": max_threads,
+            "active_threads": active_threads,
+        }
+        if details:
+            merged_details.update(details)
+        super().__init__(
+            code="asap:transport/thread_pool_exhausted",
+            message=(
+                f"Thread pool exhausted: {active_threads}/{max_threads} threads in use. "
+                "Service temporarily unavailable."
+            ),
+            details=merged_details,
+        )
+        self.max_threads = max_threads
+        self.active_threads = active_threads

asap/examples/coordinator.py CHANGED Viewed

@@ -21,7 +21,7 @@ from asap.transport.server import create_app
 DEFAULT_AGENT_ID = "urn:asap:agent:coordinator"
 DEFAULT_AGENT_NAME = "Coordinator Agent"
-DEFAULT_AGENT_VERSION = "0.1.0"
+DEFAULT_AGENT_VERSION = "0.3.0"
 DEFAULT_AGENT_DESCRIPTION = "Coordinates tasks across agents"
 DEFAULT_ASAP_ENDPOINT = "http://localhost:8000/asap"
 DEFAULT_ECHO_AGENT_ID = "urn:asap:agent:echo-agent"

asap/examples/echo_agent.py CHANGED Viewed

@@ -16,7 +16,7 @@ from asap.transport.server import create_app
 DEFAULT_AGENT_ID = "urn:asap:agent:echo-agent"
 DEFAULT_AGENT_NAME = "Echo Agent"
-DEFAULT_AGENT_VERSION = "0.1.0"
+DEFAULT_AGENT_VERSION = "0.3.0"
 DEFAULT_AGENT_DESCRIPTION = "Echoes task input as output"
 DEFAULT_ASAP_HOST = "127.0.0.1"
 DEFAULT_ASAP_PORT = 8001

asap/models/constants.py CHANGED Viewed

@@ -9,6 +9,7 @@ ASAP_PROTOCOL_VERSION = "0.1"
 # Default configuration values
 DEFAULT_TIMEOUT_SECONDS = 600
 MAX_TASK_DEPTH = 10  # Maximum nesting level for subtasks
+MAX_REQUEST_SIZE = 10 * 1024 * 1024  # 10MB maximum request size
 # URN patterns
 AGENT_URN_PATTERN = r"^urn:asap:agent:[a-z0-9-]+(?::[a-z0-9-]+)?$"

asap/observability/metrics.py CHANGED Viewed

@@ -155,6 +155,7 @@ class MetricsCollector:
         "asap_requests_total": "Total number of ASAP requests received",
         "asap_requests_success_total": "Total number of successful ASAP requests",
         "asap_requests_error_total": "Total number of failed ASAP requests",
+        "asap_thread_pool_exhausted_total": "Total number of thread pool exhaustion events",
     }
     DEFAULT_HISTOGRAMS: ClassVar[dict[str, str]] = {

asap/transport/executors.py ADDED Viewed

@@ -0,0 +1,156 @@
+"""Bounded thread pool executor for DoS prevention.
+This module provides a bounded executor that limits the number of concurrent
+threads used for executing synchronous handlers. This prevents resource
+exhaustion attacks by rejecting requests when the thread pool is full.
+Example:
+    >>> from asap.transport.executors import BoundedExecutor
+    >>> executor = BoundedExecutor(max_threads=10)
+    >>> result = await loop.run_in_executor(executor, sync_handler, arg1, arg2)
+"""
+import os
+from concurrent.futures import Executor, Future, ThreadPoolExecutor
+from threading import Semaphore
+from typing import Callable, TypeVar
+from asap.errors import ThreadPoolExhaustedError
+from asap.observability import get_logger, get_metrics
+# Module logger
+logger = get_logger(__name__)
+# Type variable for function return type
+T = TypeVar("T")
+class BoundedExecutor(Executor):
+    """Thread pool executor with a hard cap on in-flight tasks.
+    Wraps a ThreadPoolExecutor and guards it with a semaphore holding
+    ``max_threads`` permits. ``submit`` takes a permit without blocking; when
+    none is free it raises ThreadPoolExhaustedError instead of queuing, so
+    callers fail fast under load. Each rejection increments the
+    ``asap_thread_pool_exhausted_total`` counter.
+    Attributes:
+        _executor: Underlying ThreadPoolExecutor
+        _semaphore: Semaphore holding one permit per allowed in-flight task
+        max_threads: Maximum number of concurrent threads
+    Example:
+        >>> executor = BoundedExecutor(max_threads=10)
+        >>> result = await loop.run_in_executor(executor, my_sync_function, arg1)
+    """
+    def __init__(self, max_threads: int | None = None) -> None:
+        """Initialize bounded executor.
+        Args:
+            max_threads: Maximum number of concurrent threads.
+                Defaults to min(32, os.cpu_count() + 4) if None.
+        Raises:
+            ValueError: If max_threads is less than 1
+        """
+        # Query once: the value feeds both the default size and the log record.
+        cpu_count = os.cpu_count()
+        if max_threads is None:
+            # os.cpu_count() may return None; treat that as a single CPU.
+            max_threads = min(32, (cpu_count or 1) + 4)
+        if max_threads < 1:
+            raise ValueError(f"max_threads must be >= 1, got {max_threads}")
+        self.max_threads = max_threads
+        self._executor = ThreadPoolExecutor(max_workers=max_threads)
+        self._semaphore = Semaphore(max_threads)
+        logger.info(
+            "asap.executor.created",
+            max_threads=max_threads,
+            cpu_count=cpu_count,
+        )
+    def _release_permit(self, _future: Future[T]) -> None:
+        """Done-callback: hand the permit back once a submitted future finishes."""
+        self._semaphore.release()
+    def submit(self, fn: Callable[..., T], /, *args: object, **kwargs: object) -> Future[T]:
+        """Submit a function to be executed in the thread pool.
+        A semaphore permit is taken (non-blocking) before the task is handed
+        to the underlying executor. The permit is returned by a done-callback
+        on the Future, i.e. when the task finishes, fails or is cancelled.
+        If the underlying executor refuses the task, the permit is returned
+        immediately so that the pool's capacity is not reduced permanently.
+        Args:
+            fn: Function to execute
+            *args: Positional arguments for the function
+            **kwargs: Keyword arguments for the function
+        Returns:
+            Future representing the execution of the function
+        Raises:
+            ThreadPoolExhaustedError: If no permit is available
+            RuntimeError: Propagated from the underlying executor, e.g. when
+                it has already been shut down
+        """
+        if not self._semaphore.acquire(blocking=False):
+            # acquire() failed, so every permit is taken: report the pool as full.
+            active_threads = self.max_threads
+            metrics = get_metrics()
+            metrics.increment_counter(
+                "asap_thread_pool_exhausted_total",
+                labels={},
+                value=1.0,
+            )
+            logger.warning(
+                "asap.executor.exhausted",
+                max_threads=self.max_threads,
+                active_threads=active_threads,
+            )
+            raise ThreadPoolExhaustedError(
+                max_threads=self.max_threads,
+                active_threads=active_threads,
+            )
+        try:
+            future = self._executor.submit(fn, *args, **kwargs)
+        except BaseException:
+            # No Future was created, so no done-callback will ever run;
+            # release here or the permit would leak on every failed submit.
+            self._semaphore.release()
+            raise
+        # If the future is already done, the callback fires immediately.
+        future.add_done_callback(self._release_permit)
+        return future
+    def shutdown(self, wait: bool = True, *, cancel_futures: bool = False) -> None:
+        """Shutdown the executor and release resources.
+        Args:
+            wait: If True, wait for all pending tasks to complete
+            cancel_futures: If True, cancel pending futures (Python 3.9+)
+        """
+        self._executor.shutdown(wait=wait, cancel_futures=cancel_futures)
+        logger.info("asap.executor.shutdown", max_threads=self.max_threads)
+    def __enter__(self) -> "BoundedExecutor":
+        """Context manager entry; returns the executor itself."""
+        return self
+    def __exit__(self, exc_type: object, exc_val: object, exc_tb: object) -> None:
+        """Context manager exit: shut down and wait for running tasks."""
+        self.shutdown(wait=True)

asap/transport/handlers.py CHANGED Viewed

@@ -30,8 +30,9 @@ import asyncio
 import inspect
 import time
 from collections.abc import Awaitable
+from concurrent.futures import Executor
 from threading import RLock
-from typing import Protocol
+from typing import Protocol, cast
 from asap.errors import ASAPError
 from asap.models.entities import Manifest
@@ -142,6 +143,7 @@ class HandlerRegistry:
     Attributes:
         _handlers: Internal mapping of payload_type to handler function
         _lock: Reentrant lock for thread-safe operations
+        _executor: Optional executor for running sync handlers (for DoS prevention)
     Example:
         >>> registry = HandlerRegistry()
@@ -151,10 +153,17 @@ class HandlerRegistry:
         >>> response = registry.dispatch(envelope, manifest)
     """
-    def __init__(self) -> None:
-        """Initialize empty handler registry with thread-safe lock."""
+    def __init__(self, executor: Executor | None = None) -> None:
+        """Initialize empty handler registry with thread-safe lock.
+        Args:
+            executor: Optional executor for running sync handlers.
+                If None, uses default asyncio executor (unbounded).
+                Should be a BoundedExecutor instance for DoS prevention.
+        """
         self._handlers: dict[str, Handler] = {}
         self._lock = RLock()
+        self._executor: Executor | None = executor
     def register(self, payload_type: str, handler: Handler) -> None:
         """Register a handler for a payload type.
@@ -333,13 +342,16 @@ class HandlerRegistry:
                 # Sync handler - run in thread pool to avoid blocking event loop
                 # Also handle async callable objects that return awaitables
                 loop = asyncio.get_event_loop()
-                result: object = await loop.run_in_executor(None, handler, envelope, manifest)
+                # Use bounded executor if provided, otherwise use default (unbounded)
+                executor = self._executor if self._executor is not None else None
+                result: object = await loop.run_in_executor(executor, handler, envelope, manifest)
                 # Check if result is awaitable (handles async __call__ methods)
                 if inspect.isawaitable(result):
                     response = await result
                 else:
                     # Type narrowing: result is Envelope for sync handlers
-                    response = result  # type: ignore[assignment]
+                    # After checking it's not awaitable, we know it's Envelope
+                    response = cast(Envelope, result)
             duration_ms = (time.perf_counter() - start_time) * 1000
             logger.debug(

asap/transport/middleware.py CHANGED Viewed

@@ -1,10 +1,11 @@
-"""Authentication middleware for ASAP protocol server.
+"""Authentication and rate limiting middleware for ASAP protocol server.
-This module provides authentication middleware that:
+This module provides middleware that:
 - Validates Bearer tokens based on manifest configuration
 - Verifies sender identity matches authenticated agent
 - Supports custom token validation logic
 - Returns proper JSON-RPC error responses for auth failures
+- Implements IP-based rate limiting to prevent DoS attacks
 Example:
     >>> from asap.transport.middleware import AuthenticationMiddleware, BearerTokenValidator
@@ -32,10 +33,17 @@ Example:
 """
 import hashlib
-from typing import Callable, Protocol
+import uuid
+from typing import Any, Awaitable, Callable, Protocol
+from collections.abc import Sequence
 from fastapi import HTTPException, Request
+from fastapi.responses import JSONResponse
 from fastapi.security import HTTPAuthorizationCredentials, HTTPBearer
+from slowapi import Limiter
+from slowapi.errors import RateLimitExceeded
+from slowapi.util import get_remote_address
+from starlette.middleware.base import BaseHTTPMiddleware
 from asap.models.entities import Manifest
 from asap.observability import get_logger
@@ -45,14 +53,215 @@ logger = get_logger(__name__)
 # Authentication header scheme
 AUTH_SCHEME_BEARER = "bearer"
+# Rate limiting default configuration
+DEFAULT_RATE_LIMIT = "100/minute"
+def _get_sender_from_envelope(request: Request) -> str:
+    """Return the key used to bucket a request for rate limiting.
+    Lookup order:
+    1. ``request.state.envelope.sender`` when an envelope object is attached
+       to the request state and its sender is a string.
+    2. ``request.state.rpc_request.params["envelope"]["sender"]`` when a
+       parsed JSON-RPC request is attached and that value is a string.
+    3. The client address reported by ``get_remote_address``.
+    NOTE(review): the comments in this module state that the limiter runs
+    before the body is parsed, so step 3 is presumably the usual path;
+    confirm against the server code that populates ``request.state``.
+    Args:
+        request: FastAPI request object
+    Returns:
+        Sender identifier if one is already available, otherwise the client
+        address as a string
+    Example:
+        >>> key = _get_sender_from_envelope(request)
+        >>> # e.g. "192.168.1.1" when nothing has been parsed yet
+    """
+    try:
+        state = request.state
+        # Case 1: an already-parsed envelope object on the request state.
+        parsed_envelope = getattr(state, "envelope", None)
+        if parsed_envelope:
+            candidate = getattr(parsed_envelope, "sender", None)
+            if isinstance(candidate, str):
+                return candidate
+        # Case 2: a parsed JSON-RPC request whose params carry the envelope dict.
+        if hasattr(state, "rpc_request"):
+            params = getattr(state.rpc_request, "params", None)
+            if isinstance(params, dict):
+                envelope_data = params.get("envelope")
+                if isinstance(envelope_data, dict):
+                    candidate = envelope_data.get("sender")
+                    if isinstance(candidate, str):
+                        return candidate
+    except (AttributeError, KeyError, TypeError):
+        # Best effort only: any lookup problem means "use the address".
+        pass
+    # Case 3: key on the client address.
+    remote_addr = get_remote_address(request)
+    return remote_addr if isinstance(remote_addr, str) else str(remote_addr)
+# Module-level rate limiter shared by importers of this module.
+# The key function returns the sender when one is already attached to
+# request.state and otherwise the client address. NOTE(review): rate limiting
+# is said to run before request body parsing, so the address is presumably
+# the key in practice — confirm against the server code.
+limiter = Limiter(
+    key_func=_get_sender_from_envelope,
+    default_limits=[DEFAULT_RATE_LIMIT],
+    storage_uri="memory://",
+)
+def create_test_limiter(limits: Sequence[str] | None = None) -> Limiter:
+    """Build a fresh Limiter for use in tests.
+    Each call returns a new instance configured with a unique in-memory
+    storage URI, so that test cases do not share rate-limit counters.
+    Args:
+        limits: Optional rate limit strings. When omitted, a very high limit
+            ("100000/minute") is used so tests are not throttled.
+    Returns:
+        New Limiter instance keyed by ``_get_sender_from_envelope``
+    Example:
+        >>> test_limiter = create_test_limiter(["100000/minute"])
+        >>> app.state.limiter = test_limiter
+    """
+    effective_limits = ["100000/minute"] if limits is None else list(limits)
+    # A random URI suffix per instance keeps storages apart between tests.
+    return Limiter(
+        key_func=_get_sender_from_envelope,
+        default_limits=effective_limits,
+        storage_uri=f"memory://{uuid.uuid4()}",
+    )
+def create_limiter(limits: Sequence[str] | None = None) -> Limiter:
+    """Build a fresh Limiter for a production app instance.
+    Each call returns a new instance configured with a unique in-memory
+    storage URI, so several FastAPI apps in one process can keep
+    independent rate-limit counters.
+    Args:
+        limits: Optional rate limit strings (e.g., ["100/minute"]).
+            Defaults to DEFAULT_RATE_LIMIT if not provided.
+    Returns:
+        New Limiter instance keyed by ``_get_sender_from_envelope``
+    Example:
+        >>> limiter = create_limiter(["100/minute"])
+        >>> app.state.limiter = limiter
+    """
+    effective_limits = [DEFAULT_RATE_LIMIT] if limits is None else list(limits)
+    # A random URI suffix per instance keeps app instances apart.
+    return Limiter(
+        key_func=_get_sender_from_envelope,
+        default_limits=effective_limits,
+        storage_uri=f"memory://{uuid.uuid4()}",
+    )
+def rate_limit_handler(request: Request, exc: Exception) -> JSONResponse:
+    """Turn a rate-limit violation into a JSON-RPC 2.0 error response.
+    The response always has HTTP status 429. For a RateLimitExceeded
+    exception it also carries ``retry_after`` and ``limit`` in the error
+    data and a Retry-After header; for any other exception type a bare
+    error object is returned and the unexpected type is logged.
+    Args:
+        request: FastAPI request object
+        exc: RateLimitExceeded exception (typed as Exception for FastAPI compatibility)
+    Returns:
+        JSONResponse with JSON-RPC error format and 429 status code
+    Example:
+        >>> response = rate_limit_handler(request, exc)
+        >>> # Returns JSONResponse with status_code=429 and JSON-RPC error
+    """
+    if isinstance(exc, RateLimitExceeded):
+        # Use the exception's retry hint when it has a usable one, else 60 seconds.
+        retry_after = 60
+        raw_retry_after = getattr(exc, "retry_after", None)
+        if raw_retry_after is not None:
+            try:
+                retry_after = int(raw_retry_after)
+            except (ValueError, TypeError):
+                retry_after = 60
+        # Report the violated limit when the exception exposes it.
+        raw_limit = getattr(exc, "limit", None)
+        limit_str = DEFAULT_RATE_LIMIT if raw_limit is None else str(raw_limit)
+        logger.warning(
+            "asap.rate_limit.exceeded",
+            sender=_get_sender_from_envelope(request),
+            retry_after=retry_after,
+            limit=limit_str,
+        )
+        return JSONResponse(
+            status_code=HTTP_TOO_MANY_REQUESTS,
+            content={
+                "jsonrpc": "2.0",
+                "id": getattr(request.state, "request_id", None),
+                "error": {
+                    "code": HTTP_TOO_MANY_REQUESTS,
+                    "message": ERROR_RATE_LIMIT_EXCEEDED,
+                    "data": {
+                        "retry_after": retry_after,
+                        "limit": limit_str,
+                    },
+                },
+            },
+            headers={"Retry-After": str(retry_after)},
+        )
+    # The handler signature accepts any Exception; answer with 429 anyway,
+    # but without retry data, and record what was actually received.
+    logger.warning("asap.rate_limit.unexpected_exception", exc_type=type(exc).__name__)
+    return JSONResponse(
+        status_code=HTTP_TOO_MANY_REQUESTS,
+        content={
+            "jsonrpc": "2.0",
+            "id": getattr(request.state, "request_id", None),
+            "error": {
+                "code": HTTP_TOO_MANY_REQUESTS,
+                "message": ERROR_RATE_LIMIT_EXCEEDED,
+            },
+        },
+    )
 # HTTP status codes
 HTTP_UNAUTHORIZED = 401
 HTTP_FORBIDDEN = 403
+HTTP_TOO_MANY_REQUESTS = 429
 # Error messages
 ERROR_AUTH_REQUIRED = "Authentication required"
 ERROR_INVALID_TOKEN = "Invalid authentication token"
 ERROR_SENDER_MISMATCH = "Sender does not match authenticated identity"
+ERROR_RATE_LIMIT_EXCEEDED = "Rate limit exceeded"
 class TokenValidator(Protocol):
@@ -357,3 +566,89 @@ class AuthenticationMiddleware:
             "asap.auth.sender_verified",
             authenticated_agent=authenticated_agent_id,
         )
+class SizeLimitMiddleware(BaseHTTPMiddleware):
+    """Reject requests whose declared size exceeds a configured maximum.
+    Only the Content-Length header is inspected: a request declaring more
+    than ``max_size`` bytes is answered with HTTP 413 before the next
+    handler is called. Requests with a missing or non-numeric
+    Content-Length are passed through unchanged; validating the actual
+    body size is left to the route handler.
+    Attributes:
+        max_size: Maximum allowed request size in bytes
+    Example:
+        >>> from asap.transport.middleware import SizeLimitMiddleware
+        >>> app.add_middleware(SizeLimitMiddleware, max_size=10 * 1024 * 1024)
+    """
+    def __init__(self, app: Any, max_size: int) -> None:
+        """Store the size limit after validating it.
+        Args:
+            app: The ASGI application
+            max_size: Maximum allowed request size in bytes
+        Raises:
+            ValueError: If max_size is less than 1
+        """
+        if max_size < 1:
+            raise ValueError(f"max_size must be >= 1, got {max_size}")
+        super().__init__(app)
+        self.max_size = max_size
+    async def dispatch(
+        self, request: Request, call_next: Callable[[Request], Awaitable[Any]]
+    ) -> Any:
+        """Check the declared request size, then continue or answer 413.
+        Args:
+            request: FastAPI request object
+            call_next: Next middleware or route handler
+        Returns:
+            Response from next handler or error response if size exceeded
+        """
+        size: int | None = None
+        header_value = request.headers.get("content-length")
+        if header_value:
+            try:
+                size = int(header_value)
+            except ValueError:
+                # Unparseable header: defer to the route handler's body check.
+                size = None
+        if size is not None and size > self.max_size:
+            logger.warning(
+                "asap.request.size_exceeded",
+                content_length=size,
+                max_size=self.max_size,
+            )
+            # Answer here: no route handler has run yet at this point.
+            return JSONResponse(
+                status_code=413,
+                content={
+                    "detail": f"Request size ({size} bytes) exceeds maximum ({self.max_size} bytes)"
+                },
+            )
+        return await call_next(request)
+# Public names of this module: authentication, request-size and
+# rate-limiting components. The underscore-prefixed key function is
+# listed here as well.
+__all__ = [
+    "AuthenticationMiddleware",
+    "BearerTokenValidator",
+    "TokenValidator",
+    "SizeLimitMiddleware",
+    "limiter",
+    "rate_limit_handler",
+    "create_limiter",
+    "create_test_limiter",
+    "_get_sender_from_envelope",
+]

asap-protocol 0.1.0__py3-none-any.whl → 0.3.0__py3-none-any.whl

asap-protocol 0.1.0py3-none-any.whl → 0.3.0py3-none-any.whl