sandboxy-0.0.1-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (60)
  1. sandboxy/__init__.py +3 -0
  2. sandboxy/agents/__init__.py +21 -0
  3. sandboxy/agents/base.py +66 -0
  4. sandboxy/agents/llm_prompt.py +308 -0
  5. sandboxy/agents/loader.py +222 -0
  6. sandboxy/api/__init__.py +5 -0
  7. sandboxy/api/app.py +76 -0
  8. sandboxy/api/routes/__init__.py +1 -0
  9. sandboxy/api/routes/agents.py +92 -0
  10. sandboxy/api/routes/local.py +1388 -0
  11. sandboxy/api/routes/tools.py +106 -0
  12. sandboxy/cli/__init__.py +1 -0
  13. sandboxy/cli/main.py +1196 -0
  14. sandboxy/cli/type_detector.py +48 -0
  15. sandboxy/config.py +49 -0
  16. sandboxy/core/__init__.py +1 -0
  17. sandboxy/core/async_runner.py +824 -0
  18. sandboxy/core/mdl_parser.py +441 -0
  19. sandboxy/core/runner.py +599 -0
  20. sandboxy/core/safe_eval.py +165 -0
  21. sandboxy/core/state.py +234 -0
  22. sandboxy/datasets/__init__.py +20 -0
  23. sandboxy/datasets/loader.py +193 -0
  24. sandboxy/datasets/runner.py +442 -0
  25. sandboxy/errors.py +166 -0
  26. sandboxy/local/context.py +235 -0
  27. sandboxy/local/results.py +173 -0
  28. sandboxy/logging.py +31 -0
  29. sandboxy/mcp/__init__.py +25 -0
  30. sandboxy/mcp/client.py +360 -0
  31. sandboxy/mcp/wrapper.py +99 -0
  32. sandboxy/providers/__init__.py +34 -0
  33. sandboxy/providers/anthropic_provider.py +271 -0
  34. sandboxy/providers/base.py +123 -0
  35. sandboxy/providers/http_client.py +101 -0
  36. sandboxy/providers/openai_provider.py +282 -0
  37. sandboxy/providers/openrouter.py +958 -0
  38. sandboxy/providers/registry.py +199 -0
  39. sandboxy/scenarios/__init__.py +11 -0
  40. sandboxy/scenarios/comparison.py +491 -0
  41. sandboxy/scenarios/loader.py +262 -0
  42. sandboxy/scenarios/runner.py +468 -0
  43. sandboxy/scenarios/unified.py +1434 -0
  44. sandboxy/session/__init__.py +21 -0
  45. sandboxy/session/manager.py +278 -0
  46. sandboxy/tools/__init__.py +34 -0
  47. sandboxy/tools/base.py +127 -0
  48. sandboxy/tools/loader.py +270 -0
  49. sandboxy/tools/yaml_tools.py +708 -0
  50. sandboxy/ui/__init__.py +27 -0
  51. sandboxy/ui/dist/assets/index-CgAkYWrJ.css +1 -0
  52. sandboxy/ui/dist/assets/index-D4zoGFcr.js +347 -0
  53. sandboxy/ui/dist/index.html +14 -0
  54. sandboxy/utils/__init__.py +3 -0
  55. sandboxy/utils/time.py +20 -0
  56. sandboxy-0.0.1.dist-info/METADATA +241 -0
  57. sandboxy-0.0.1.dist-info/RECORD +60 -0
  58. sandboxy-0.0.1.dist-info/WHEEL +4 -0
  59. sandboxy-0.0.1.dist-info/entry_points.txt +3 -0
  60. sandboxy-0.0.1.dist-info/licenses/LICENSE +201 -0
sandboxy/providers/anthropic_provider.py
@@ -0,0 +1,271 @@
+"""Direct Anthropic provider."""
+
+import os
+import time
+from collections.abc import AsyncIterator
+from typing import Any
+
+from sandboxy.providers.base import BaseProvider, ModelInfo, ModelResponse, ProviderError
+
+ANTHROPIC_MODELS = {
+    # Claude 4.5 Series (latest)
+    "claude-opus-4-5-20251101": ModelInfo(
+        id="claude-opus-4-5-20251101",
+        name="Claude Opus 4.5",
+        provider="anthropic",
+        context_length=200000,
+        input_cost_per_million=15.00,
+        output_cost_per_million=75.00,
+        supports_vision=True,
+    ),
+    "claude-haiku-4-5-20251101": ModelInfo(
+        id="claude-haiku-4-5-20251101",
+        name="Claude Haiku 4.5",
+        provider="anthropic",
+        context_length=200000,
+        input_cost_per_million=0.80,
+        output_cost_per_million=4.00,
+        supports_vision=True,
+    ),
+    # Claude 4 Series
+    "claude-sonnet-4-20250514": ModelInfo(
+        id="claude-sonnet-4-20250514",
+        name="Claude Sonnet 4",
+        provider="anthropic",
+        context_length=200000,
+        input_cost_per_million=3.00,
+        output_cost_per_million=15.00,
+        supports_vision=True,
+    ),
+    "claude-opus-4-20250514": ModelInfo(
+        id="claude-opus-4-20250514",
+        name="Claude Opus 4",
+        provider="anthropic",
+        context_length=200000,
+        input_cost_per_million=15.00,
+        output_cost_per_million=75.00,
+        supports_vision=True,
+    ),
+    # Claude 3.5 Series
+    "claude-3-5-sonnet-20241022": ModelInfo(
+        id="claude-3-5-sonnet-20241022",
+        name="Claude 3.5 Sonnet",
+        provider="anthropic",
+        context_length=200000,
+        input_cost_per_million=3.00,
+        output_cost_per_million=15.00,
+        supports_vision=True,
+    ),
+    "claude-3-5-haiku-20241022": ModelInfo(
+        id="claude-3-5-haiku-20241022",
+        name="Claude 3.5 Haiku",
+        provider="anthropic",
+        context_length=200000,
+        input_cost_per_million=0.80,
+        output_cost_per_million=4.00,
+        supports_vision=True,
+    ),
+    # Claude 3 Series (legacy)
+    "claude-3-opus-20240229": ModelInfo(
+        id="claude-3-opus-20240229",
+        name="Claude 3 Opus",
+        provider="anthropic",
+        context_length=200000,
+        input_cost_per_million=15.00,
+        output_cost_per_million=75.00,
+        supports_vision=True,
+    ),
+    "claude-3-haiku-20240307": ModelInfo(
+        id="claude-3-haiku-20240307",
+        name="Claude 3 Haiku",
+        provider="anthropic",
+        context_length=200000,
+        input_cost_per_million=0.25,
+        output_cost_per_million=1.25,
+        supports_vision=True,
+    ),
+}
+
+# Aliases for common model names
+MODEL_ALIASES = {
+    # Claude 4.5
+    "claude-opus-4.5": "claude-opus-4-5-20251101",
+    "claude-opus-4-5": "claude-opus-4-5-20251101",
+    "claude-haiku-4.5": "claude-haiku-4-5-20251101",
+    "claude-haiku-4-5": "claude-haiku-4-5-20251101",
+    # Claude 4
+    "claude-sonnet-4": "claude-sonnet-4-20250514",
+    "claude-opus-4": "claude-opus-4-20250514",
+    # Claude 3.5
+    "claude-3.5-sonnet": "claude-3-5-sonnet-20241022",
+    "claude-3-5-sonnet": "claude-3-5-sonnet-20241022",
+    "claude-3.5-haiku": "claude-3-5-haiku-20241022",
+    "claude-3-5-haiku": "claude-3-5-haiku-20241022",
+    # Claude 3
+    "claude-3-opus": "claude-3-opus-20240229",
+    "claude-3-haiku": "claude-3-haiku-20240307",
+}
+
+
+class AnthropicProvider(BaseProvider):
+    """Direct Anthropic API provider.
+
+    Use this when you have an Anthropic API key and want to call
+    Claude models directly.
+    """
+
+    provider_name = "anthropic"
+
+    def __init__(self, api_key: str | None = None):
+        """Initialize Anthropic provider.
+
+        Args:
+            api_key: Anthropic API key. If not provided, reads from
+                ANTHROPIC_API_KEY environment variable.
+
+        """
+        self.api_key = api_key or os.getenv("ANTHROPIC_API_KEY")
+        if not self.api_key:
+            raise ProviderError(
+                "API key required. Set ANTHROPIC_API_KEY or pass api_key.",
+                provider=self.provider_name,
+            )
+
+        # Lazy import to avoid requiring anthropic package if not used
+        try:
+            from anthropic import AsyncAnthropic
+
+            self.client = AsyncAnthropic(api_key=self.api_key)
+        except ImportError as e:
+            raise ProviderError(
+                "anthropic package required. Install with: pip install anthropic",
+                provider=self.provider_name,
+            ) from e
+
+    def _resolve_model(self, model: str) -> str:
+        """Resolve model alias to full model ID."""
+        return MODEL_ALIASES.get(model, model)
+
+    async def complete(
+        self,
+        model: str,
+        messages: list[dict[str, Any]],
+        temperature: float = 0.7,
+        max_tokens: int = 1024,
+        **kwargs: Any,
+    ) -> ModelResponse:
+        """Send completion request to Anthropic."""
+        start_time = time.time()
+        resolved_model = self._resolve_model(model)
+
+        # Convert from OpenAI format to Anthropic format
+        system_prompt = None
+        anthropic_messages = []
+
+        for msg in messages:
+            if msg["role"] == "system":
+                system_prompt = msg["content"]
+            else:
+                anthropic_messages.append(
+                    {
+                        "role": msg["role"],
+                        "content": msg["content"],
+                    }
+                )
+
+        try:
+            response = await self.client.messages.create(
+                model=resolved_model,
+                messages=anthropic_messages,
+                system=system_prompt or "",
+                temperature=temperature,
+                max_tokens=max_tokens,
+                **kwargs,
+            )
+        except Exception as e:
+            raise ProviderError(
+                str(e),
+                provider=self.provider_name,
+                model=model,
+            ) from e
+
+        latency_ms = int((time.time() - start_time) * 1000)
+
+        # Extract content from response
+        content = ""
+        for block in response.content:
+            if block.type == "text":
+                content += block.text
+
+        input_tokens = response.usage.input_tokens
+        output_tokens = response.usage.output_tokens
+        cost = self._calculate_cost(resolved_model, input_tokens, output_tokens)
+
+        return ModelResponse(
+            content=content,
+            model_id=response.model,
+            latency_ms=latency_ms,
+            input_tokens=input_tokens,
+            output_tokens=output_tokens,
+            cost_usd=cost,
+            finish_reason=response.stop_reason,
+            raw_response=response.model_dump(),
+        )
+
+    async def stream(
+        self,
+        model: str,
+        messages: list[dict[str, Any]],
+        temperature: float = 0.7,
+        max_tokens: int = 1024,
+        **kwargs: Any,
+    ) -> AsyncIterator[str]:
+        """Stream completion response from Anthropic."""
+        resolved_model = self._resolve_model(model)
+
+        # Convert from OpenAI format to Anthropic format
+        system_prompt = None
+        anthropic_messages = []
+
+        for msg in messages:
+            if msg["role"] == "system":
+                system_prompt = msg["content"]
+            else:
+                anthropic_messages.append(
+                    {
+                        "role": msg["role"],
+                        "content": msg["content"],
+                    }
+                )
+
+        try:
+            async with self.client.messages.stream(
+                model=resolved_model,
+                messages=anthropic_messages,
+                system=system_prompt or "",
+                temperature=temperature,
+                max_tokens=max_tokens,
+                **kwargs,
+            ) as stream:
+                async for text in stream.text_stream:
+                    yield text
+        except Exception as e:
+            raise ProviderError(
+                str(e),
+                provider=self.provider_name,
+                model=model,
+            ) from e
+
+    def list_models(self) -> list[ModelInfo]:
+        """List available Anthropic models."""
+        return list(ANTHROPIC_MODELS.values())
+
+    def _calculate_cost(self, model: str, input_tokens: int, output_tokens: int) -> float | None:
+        """Calculate cost in USD for a request."""
+        model_info = ANTHROPIC_MODELS.get(model)
+        if not model_info or not model_info.input_cost_per_million:
+            return None
+
+        input_cost = (input_tokens / 1_000_000) * model_info.input_cost_per_million
+        output_cost = (output_tokens / 1_000_000) * (model_info.output_cost_per_million or 0)
+        return round(input_cost + output_cost, 6)
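For orientation, a minimal usage sketch of the provider above (not part of the package): it assumes the optional anthropic dependency is installed and ANTHROPIC_API_KEY is set in the environment; the model alias and message contents are illustrative.

# Illustrative only -- not shipped in the wheel. Assumes `pip install anthropic`
# and ANTHROPIC_API_KEY in the environment.
import asyncio

from sandboxy.providers.anthropic_provider import AnthropicProvider


async def main() -> None:
    provider = AnthropicProvider()  # reads ANTHROPIC_API_KEY when no key is passed

    # Aliases such as "claude-3-5-haiku" resolve via MODEL_ALIASES to dated IDs.
    response = await provider.complete(
        model="claude-3-5-haiku",
        messages=[
            {"role": "system", "content": "You are terse."},
            {"role": "user", "content": "Say hello."},
        ],
        max_tokens=64,
    )
    print(response.content, response.cost_usd, response.latency_ms)

    # Streaming variant yields text chunks as they arrive.
    async for chunk in provider.stream(
        model="claude-3-5-haiku",
        messages=[{"role": "user", "content": "Count to three."}],
    ):
        print(chunk, end="", flush=True)


asyncio.run(main())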
sandboxy/providers/base.py
@@ -0,0 +1,123 @@
+"""Base provider interface and common types."""
+
+from abc import ABC, abstractmethod
+from collections.abc import AsyncIterator
+from dataclasses import dataclass, field
+from typing import Any
+
+
+class ProviderError(Exception):
+    """Error from an LLM provider."""
+
+    def __init__(self, message: str, provider: str, model: str | None = None):
+        """Initialize provider error.
+
+        Args:
+            message: Error description
+            provider: Provider name that raised the error
+            model: Model ID if applicable
+
+        """
+        self.provider = provider
+        self.model = model
+        super().__init__(f"[{provider}] {message}")
+
+
+@dataclass
+class ModelResponse:
+    """Response from a model completion."""
+
+    content: str
+    model_id: str
+    latency_ms: int
+    input_tokens: int
+    output_tokens: int
+    cost_usd: float | None = None
+    finish_reason: str | None = None
+    raw_response: dict[str, Any] | None = field(default=None, repr=False)
+
+
+@dataclass
+class ModelInfo:
+    """Information about an available model."""
+
+    id: str
+    name: str
+    provider: str
+    context_length: int
+    input_cost_per_million: float | None = None
+    output_cost_per_million: float | None = None
+    supports_tools: bool = True
+    supports_vision: bool = False
+    supports_streaming: bool = True
+
+
+class BaseProvider(ABC):
+    """Abstract base class for LLM providers."""
+
+    provider_name: str = "base"
+
+    @abstractmethod
+    async def complete(
+        self,
+        model: str,
+        messages: list[dict[str, Any]],
+        temperature: float = 0.7,
+        max_tokens: int = 1024,
+        **kwargs: Any,
+    ) -> ModelResponse:
+        """Send a completion request to the model.
+
+        Args:
+            model: Model identifier (e.g., "gpt-4o", "claude-3-opus")
+            messages: List of message dicts with 'role' and 'content'
+            temperature: Sampling temperature (0-2)
+            max_tokens: Maximum tokens in response
+            **kwargs: Provider-specific options
+
+        Returns:
+            ModelResponse with content and metadata
+
+        Raises:
+            ProviderError: If the request fails
+
+        """
+        pass
+
+    async def stream(
+        self,
+        model: str,
+        messages: list[dict[str, Any]],
+        temperature: float = 0.7,
+        max_tokens: int = 1024,
+        **kwargs: Any,
+    ) -> AsyncIterator[str]:
+        """Stream a completion response.
+
+        Default implementation falls back to non-streaming.
+        Override in subclasses for true streaming support.
+        """
+        response = await self.complete(model, messages, temperature, max_tokens, **kwargs)
+        yield response.content
+
+    @abstractmethod
+    def list_models(self) -> list[ModelInfo]:
+        """List available models from this provider.
+
+        Returns:
+            List of ModelInfo objects
+
+        """
+        pass
+
+    def supports_model(self, model_id: str) -> bool:
+        """Check if this provider supports a given model.
+
+        Args:
+            model_id: Model identifier to check
+
+        Returns:
+            True if the model is supported
+
+        """
+        return any(m.id == model_id for m in self.list_models())
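As a reading aid for the interface above, here is a hypothetical minimal subclass; the EchoProvider name and its canned model are inventions for this sketch, not part of the package. It shows the two abstract methods a provider must implement and inherits the non-streaming fallback stream().

# Hypothetical provider used only to illustrate the BaseProvider contract.
import time
from typing import Any

from sandboxy.providers.base import BaseProvider, ModelInfo, ModelResponse


class EchoProvider(BaseProvider):
    """Toy provider that echoes the last user message back."""

    provider_name = "echo"

    async def complete(
        self,
        model: str,
        messages: list[dict[str, Any]],
        temperature: float = 0.7,
        max_tokens: int = 1024,
        **kwargs: Any,
    ) -> ModelResponse:
        start = time.time()
        text = messages[-1]["content"] if messages else ""
        return ModelResponse(
            content=text,
            model_id=model,
            latency_ms=int((time.time() - start) * 1000),
            input_tokens=0,
            output_tokens=0,
        )

    def list_models(self) -> list[ModelInfo]:
        return [ModelInfo(id="echo-1", name="Echo", provider="echo", context_length=8192)]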
sandboxy/providers/http_client.py
@@ -0,0 +1,101 @@
+"""Shared HTTP client with connection pooling.
+
+Provides a singleton httpx.AsyncClient that reuses connections across requests,
+significantly improving performance for repeated API calls.
+
+Configuration via environment:
+    SANDBOXY_HTTP_TIMEOUT: Request timeout in seconds (default: 120)
+    SANDBOXY_HTTP_CONNECT_TIMEOUT: Connection timeout in seconds (default: 10)
+    SANDBOXY_HTTP_POOL_CONNECTIONS: Max keepalive connections (default: 20)
+    SANDBOXY_HTTP_POOL_MAXSIZE: Max total connections (default: 100)
+"""
+
+import logging
+import os
+from collections.abc import AsyncIterator
+from contextlib import asynccontextmanager
+
+import httpx
+
+logger = logging.getLogger(__name__)
+
+# Global client instance
+_client: httpx.AsyncClient | None = None
+
+# Configuration from environment
+_TIMEOUT = float(os.environ.get("SANDBOXY_HTTP_TIMEOUT", "120"))
+_CONNECT_TIMEOUT = float(os.environ.get("SANDBOXY_HTTP_CONNECT_TIMEOUT", "10"))
+_POOL_CONNECTIONS = int(os.environ.get("SANDBOXY_HTTP_POOL_CONNECTIONS", "20"))
+_POOL_MAXSIZE = int(os.environ.get("SANDBOXY_HTTP_POOL_MAXSIZE", "100"))
+
+
+def _create_client() -> httpx.AsyncClient:
+    """Create a new HTTP client with connection pooling."""
+    return httpx.AsyncClient(
+        timeout=httpx.Timeout(
+            _TIMEOUT,
+            connect=_CONNECT_TIMEOUT,
+        ),
+        limits=httpx.Limits(
+            max_keepalive_connections=_POOL_CONNECTIONS,
+            max_connections=_POOL_MAXSIZE,
+            keepalive_expiry=30.0,  # Keep idle connections for 30 seconds
+        ),
+        # HTTP/2 disabled - requires h2 package (pip install httpx[http2])
+        # HTTP/1.1 works fine for API calls
+        http2=False,
+    )
+
+
+def get_http_client() -> httpx.AsyncClient:
+    """Get the shared HTTP client with connection pooling.
+
+    The client is created lazily on first access and reused for all subsequent
+    requests. This provides significant performance benefits for repeated API calls.
+
+    Returns:
+        Shared httpx.AsyncClient instance.
+
+    Usage:
+        client = get_http_client()
+        response = await client.post(url, json=data)
+
+    """
+    global _client
+    if _client is None:
+        _client = _create_client()
+        logger.debug(
+            f"HTTP client created: pool_connections={_POOL_CONNECTIONS}, "
+            f"pool_maxsize={_POOL_MAXSIZE}, timeout={_TIMEOUT}s"
+        )
+    return _client
+
+
+async def close_http_client() -> None:
+    """Close the shared HTTP client.
+
+    Should be called during application shutdown to cleanly close connections.
+    """
+    global _client
+    if _client is not None:
+        await _client.aclose()
+        _client = None
+        logger.debug("HTTP client closed")
+
+
+@asynccontextmanager
+async def http_client_lifespan() -> AsyncIterator[httpx.AsyncClient]:
+    """Context manager for HTTP client lifecycle.
+
+    Use this in application lifespan to ensure proper cleanup:
+
+        async with http_client_lifespan() as client:
+            # Application runs here
+            pass
+        # Client is automatically closed on exit
+    """
+    client = get_http_client()
+    try:
+        yield client
+    finally:
+        await close_http_client()
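A short usage sketch for the pooled client above (illustrative, not part of the package); the health-check URL is a placeholder.

# Illustrative only: reuse the shared pooled client, then close it on shutdown.
import asyncio

from sandboxy.providers.http_client import get_http_client, http_client_lifespan


async def main() -> None:
    async with http_client_lifespan() as client:
        # get_http_client() returns the same pooled instance for every caller.
        assert client is get_http_client()
        response = await client.get("https://example.com/health")  # placeholder URL
        print(response.status_code)
    # Exiting the context calls close_http_client() and drops the pool.


asyncio.run(main())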