PyPI - sandboxy - Versions diffs - 0.0.1__py3-none-any.whl - Mend

sandboxy 0.0.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (60) hide show

sandboxy/__init__.py +3 -0
sandboxy/agents/__init__.py +21 -0
sandboxy/agents/base.py +66 -0
sandboxy/agents/llm_prompt.py +308 -0
sandboxy/agents/loader.py +222 -0
sandboxy/api/__init__.py +5 -0
sandboxy/api/app.py +76 -0
sandboxy/api/routes/__init__.py +1 -0
sandboxy/api/routes/agents.py +92 -0
sandboxy/api/routes/local.py +1388 -0
sandboxy/api/routes/tools.py +106 -0
sandboxy/cli/__init__.py +1 -0
sandboxy/cli/main.py +1196 -0
sandboxy/cli/type_detector.py +48 -0
sandboxy/config.py +49 -0
sandboxy/core/__init__.py +1 -0
sandboxy/core/async_runner.py +824 -0
sandboxy/core/mdl_parser.py +441 -0
sandboxy/core/runner.py +599 -0
sandboxy/core/safe_eval.py +165 -0
sandboxy/core/state.py +234 -0
sandboxy/datasets/__init__.py +20 -0
sandboxy/datasets/loader.py +193 -0
sandboxy/datasets/runner.py +442 -0
sandboxy/errors.py +166 -0
sandboxy/local/context.py +235 -0
sandboxy/local/results.py +173 -0
sandboxy/logging.py +31 -0
sandboxy/mcp/__init__.py +25 -0
sandboxy/mcp/client.py +360 -0
sandboxy/mcp/wrapper.py +99 -0
sandboxy/providers/__init__.py +34 -0
sandboxy/providers/anthropic_provider.py +271 -0
sandboxy/providers/base.py +123 -0
sandboxy/providers/http_client.py +101 -0
sandboxy/providers/openai_provider.py +282 -0
sandboxy/providers/openrouter.py +958 -0
sandboxy/providers/registry.py +199 -0
sandboxy/scenarios/__init__.py +11 -0
sandboxy/scenarios/comparison.py +491 -0
sandboxy/scenarios/loader.py +262 -0
sandboxy/scenarios/runner.py +468 -0
sandboxy/scenarios/unified.py +1434 -0
sandboxy/session/__init__.py +21 -0
sandboxy/session/manager.py +278 -0
sandboxy/tools/__init__.py +34 -0
sandboxy/tools/base.py +127 -0
sandboxy/tools/loader.py +270 -0
sandboxy/tools/yaml_tools.py +708 -0
sandboxy/ui/__init__.py +27 -0
sandboxy/ui/dist/assets/index-CgAkYWrJ.css +1 -0
sandboxy/ui/dist/assets/index-D4zoGFcr.js +347 -0
sandboxy/ui/dist/index.html +14 -0
sandboxy/utils/__init__.py +3 -0
sandboxy/utils/time.py +20 -0
sandboxy-0.0.1.dist-info/METADATA +241 -0
sandboxy-0.0.1.dist-info/RECORD +60 -0
sandboxy-0.0.1.dist-info/WHEEL +4 -0
sandboxy-0.0.1.dist-info/entry_points.txt +3 -0
sandboxy-0.0.1.dist-info/licenses/LICENSE +201 -0

sandboxy/session/__init__.py ADDED Viewed

@@ -0,0 +1,21 @@
+"""Session management for interactive Sandboxy sessions.
+This module provides session management for coordinating interactive sessions
+between WebSocket connections and the AsyncRunner. It maintains in-memory
+session state for local development and testing.
+Typical usage:
+    from sandboxy.session import SessionManager, Session
+    manager = SessionManager()
+    session = manager.create_session(module, agent)
+    event_queue = await manager.start_session(session.id)
+"""
+from sandboxy.session.manager import Session, SessionManager, session_manager
+# Public API of the sandboxy.session package: the Session and SessionManager
+# classes plus the session_manager object, all imported from
+# sandboxy.session.manager above.
+__all__ = [
+    "Session",
+    "SessionManager",
+    "session_manager",
+]

sandboxy/session/manager.py ADDED Viewed

@@ -0,0 +1,278 @@
+"""Session Manager - coordinates interactive sessions between WebSocket and AsyncRunner."""
+import asyncio
+import logging
+from dataclasses import dataclass, field
+from typing import Any
+from uuid import uuid4
+from sandboxy.agents.base import Agent
+from sandboxy.core.async_runner import AsyncRunner, RunEvent
+from sandboxy.core.state import ModuleSpec, SessionState
+logger = logging.getLogger(__name__)
+@dataclass
+class Session:
+    """An active interactive session."""
+    id: str
+    module: ModuleSpec
+    agent: Agent
+    variables: dict[str, Any]
+    runner: AsyncRunner
+    events: list[RunEvent] = field(default_factory=list)
+    _run_task: asyncio.Task | None = None
+    _event_queue: asyncio.Queue[RunEvent] = field(default_factory=asyncio.Queue)
+    @property
+    def state(self) -> SessionState:
+        """Get current session state."""
+        return self.runner.session_state
+class SessionManager:
+    """Manages active interactive sessions.
+    In-memory session store for local development and testing.
+    """
+    def __init__(self):
+        self._sessions: dict[str, Session] = {}
+    def create_session(
+        self,
+        module: ModuleSpec,
+        agent: Agent,
+        variables: dict[str, Any] | None = None,
+    ) -> Session:
+        """Create a new session.
+        Args:
+            module: Module specification to run.
+            agent: Agent to use for the session.
+            variables: Optional variables for the module.
+        Returns:
+            The created Session object.
+        """
+        session_id = str(uuid4())
+        runner = AsyncRunner(module, agent)
+        session = Session(
+            id=session_id,
+            module=module,
+            agent=agent,
+            variables=variables or {},
+            runner=runner,
+        )
+        self._sessions[session_id] = session
+        logger.info("Created session %s for module %s", session_id, module.name)
+        return session
+    def get_session(self, session_id: str) -> Session | None:
+        """Get a session by ID."""
+        return self._sessions.get(session_id)
+    def delete_session(self, session_id: str) -> bool:
+        """Delete a session.
+        Returns:
+            True if session was deleted, False if not found.
+        """
+        if session_id in self._sessions:
+            session = self._sessions[session_id]
+            # Cancel running task if any
+            if session._run_task and not session._run_task.done():
+                session._run_task.cancel()
+            del self._sessions[session_id]
+            logger.info("Deleted session %s", session_id)
+            return True
+        logger.debug("Attempted to delete non-existent session %s", session_id)
+        return False
+    def list_sessions(self) -> list[Session]:
+        """List all active sessions."""
+        return list(self._sessions.values())
+    async def start_session(self, session_id: str) -> asyncio.Queue[RunEvent]:
+        """Start running a session.
+        Args:
+            session_id: ID of the session to start.
+        Returns:
+            Queue that will receive events as they occur.
+        Raises:
+            ValueError: If session not found.
+        """
+        session = self.get_session(session_id)
+        if not session:
+            logger.warning("Attempted to start non-existent session %s", session_id)
+            raise ValueError(f"Session not found: {session_id}")
+        # Start the runner in a background task
+        session._run_task = asyncio.create_task(self._run_session(session))
+        logger.info("Started session %s", session_id)
+        return session._event_queue
+    async def _run_session(self, session: Session) -> None:
+        """Run a session, pushing events to its queue."""
+        logger.debug("Running session %s", session.id)
+        try:
+            async for event in session.runner.run():
+                session.events.append(event)
+                await session._event_queue.put(event)
+                logger.debug("Session %s emitted event: %s", session.id, event.type)
+        except asyncio.CancelledError:
+            logger.info("Session %s was cancelled", session.id)
+        except Exception as e:
+            logger.exception("Session %s encountered error: %s", session.id, e)
+            # Push error event
+            error_event = RunEvent(type="error", payload={"message": str(e)})
+            session.events.append(error_event)
+            await session._event_queue.put(error_event)
+    def provide_input(self, session_id: str, content: str) -> None:
+        """Provide user input for a session.
+        Args:
+            session_id: ID of the session.
+            content: User's input text.
+        Raises:
+            ValueError: If session not found.
+            RuntimeError: If session is not awaiting input.
+        """
+        session = self.get_session(session_id)
+        if not session:
+            logger.warning("Attempted to provide input to non-existent session %s", session_id)
+            raise ValueError(f"Session not found: {session_id}")
+        logger.debug("Providing input to session %s", session_id)
+        session.runner.provide_input(content)
+    def inject_event(
+        self,
+        session_id: str,
+        tool_name: str,
+        event_type: str,
+        args: dict[str, Any] | None = None,
+    ) -> dict[str, Any]:
+        """Inject a game event into a session.
+        This triggers an event in the specified tool (e.g., "heatwave" in
+        the lemonade stand). The event modifies game state and returns
+        a description that should be shown to the user/agent.
+        Args:
+            session_id: ID of the session.
+            tool_name: Name of the tool to call.
+            event_type: Type of event to trigger.
+            args: Optional additional arguments.
+        Returns:
+            The event result data from the tool.
+        Raises:
+            ValueError: If session not found or event fails.
+        """
+        session = self.get_session(session_id)
+        if not session:
+            logger.warning("Attempted to inject event into non-existent session %s", session_id)
+            raise ValueError(f"Session not found: {session_id}")
+        logger.info(
+            "Injecting event %s into session %s via tool %s", event_type, session_id, tool_name
+        )
+        return session.runner.inject_event(tool_name, event_type, args)
+    def pause_session(self, session_id: str) -> bool:
+        """Pause a session (not fully implemented yet)."""
+        session = self.get_session(session_id)
+        if not session:
+            logger.debug("Attempted to pause non-existent session %s", session_id)
+            return False
+        # TODO: Implement proper pause mechanism
+        logger.debug("Pause requested for session %s (not yet implemented)", session_id)
+        return True
+    def resume_session(self, session_id: str) -> bool:
+        """Resume a paused session (not fully implemented yet)."""
+        session = self.get_session(session_id)
+        if not session:
+            logger.debug("Attempted to resume non-existent session %s", session_id)
+            return False
+        # TODO: Implement proper resume mechanism
+        logger.debug("Resume requested for session %s (not yet implemented)", session_id)
+        return True
+    def mark_session_ended(self, session_id: str) -> bool:
+        """Mark a session as ended (connection closed).
+        Unlike delete_session, this preserves the session data for
+        potential replay or export. The session will be cleaned up
+        after a timeout or when explicitly deleted.
+        Args:
+            session_id: ID of the session.
+        Returns:
+            True if session was marked, False if not found.
+        """
+        session = self.get_session(session_id)
+        if not session:
+            logger.debug("Attempted to mark non-existent session %s as ended", session_id)
+            return False
+        # Cancel running task if any
+        if session._run_task and not session._run_task.done():
+            session._run_task.cancel()
+        logger.info("Marked session %s as ended", session_id)
+        return True
+    def get_session_events(self, session_id: str) -> list[RunEvent]:
+        """Get all events for a session.
+        Args:
+            session_id: ID of the session.
+        Returns:
+            List of events, or empty list if session not found.
+        """
+        session = self.get_session(session_id)
+        if not session:
+            return []
+        return list(session.events)
+    def get_session_state(self, session_id: str) -> dict[str, Any] | None:
+        """Get the current environment state for a session.
+        Args:
+            session_id: ID of the session.
+        Returns:
+            The environment state dict, or None if session not found.
+        """
+        session = self.get_session(session_id)
+        if not session:
+            return None
+        return session.runner.env_state
+# Module-level SessionManager instance, created once when this module is
+# imported; sandboxy/session/__init__.py re-exports it as session_manager.
+session_manager = SessionManager()

sandboxy/tools/__init__.py ADDED Viewed

@@ -0,0 +1,34 @@
+"""Tools module - Tool interface, loader, and YAML tool implementations.
+This module provides the core abstractions for defining and loading tools
+that can be used by AI agents in sandbox scenarios.
+Submodules:
+    sandboxy.tools.base:
+        - Tool: Protocol defining the tool interface
+        - BaseTool: Base class for tool implementations
+        - ToolConfig: Configuration model for tool instances
+        - ToolResult: Result model for tool invocations
+    sandboxy.tools.loader:
+        - ToolLoader: Loader for creating tool instances from config
+        - get_yaml_tool_libraries: List available YAML tool libraries
+        - load_tool_class: Load a tool class from module path
+        - load_yaml_tool_library: Load tools from a YAML library
+        - load_yaml_tools_from_scenario: Load tools from scenario data
+    sandboxy.tools.yaml_tools:
+        - YamlMockTool: YAML-defined mock tool implementation
+        - YamlToolLoader: Loader for YAML tool libraries
+        - ActionSpec: Specification for a tool action
+        - ParamSchema: Schema for action parameters
+        - SideEffect: State modification specification
+        - ToolSpec: Full tool specification
+        - ToolLibrary: Collection of tool specifications
+        - load_scenario_tools: Load tools from scenario data
+Note:
+    Import directly from submodules to avoid circular dependencies:
+        from sandboxy.tools.base import BaseTool, ToolConfig, ToolResult
+        from sandboxy.tools.loader import ToolLoader
+"""

sandboxy/tools/base.py ADDED Viewed

@@ -0,0 +1,127 @@
+"""Base tool interface and models.
+This module defines the core abstractions for tools:
+    - ToolConfig: Configuration for instantiating a tool
+    - ToolResult: Result of a tool invocation
+    - Tool: Protocol defining the tool interface
+    - BaseTool: Base implementation for custom tools
+"""
+from typing import Any, Protocol
+from pydantic import BaseModel, Field
+class ToolConfig(BaseModel):
+    """Configuration for a tool instance.
+    Attributes:
+        name: Unique identifier for this tool instance.
+        type: Tool type identifier (e.g., 'yaml_tool', 'mock_lemonade').
+        description: Human-readable description of the tool.
+        config: Tool-specific configuration options.
+    """
+    name: str
+    type: str
+    description: str = ""
+    config: dict[str, Any] = Field(default_factory=dict)
+class ToolResult(BaseModel):
+    """Result of a tool invocation.
+    Attributes:
+        success: Whether the invocation succeeded.
+        data: Result data on success (type varies by action).
+        error: Error message on failure.
+    """
+    success: bool
+    data: Any = None
+    error: str | None = None
+class Tool(Protocol):
+    """Protocol for tool implementations.
+    Tools provide actions that agents can invoke to interact with
+    simulated environments. Each tool has a name, description, and
+    a set of available actions.
+    Attributes:
+        name: Unique identifier for the tool.
+        description: Human-readable description of the tool's purpose.
+    """
+    name: str
+    description: str
+    def invoke(self, action: str, args: dict[str, Any], env_state: dict[str, Any]) -> ToolResult:
+        """Invoke a tool action.
+        Args:
+            action: The action to perform (e.g., "get_order", "refund_order").
+            args: Arguments for the action.
+            env_state: Current environment state (can be modified by tools).
+        Returns:
+            Result of the tool invocation.
+        """
+        ...
+    def get_actions(self) -> list[dict[str, Any]]:
+        """Get list of available actions with their schemas.
+        Returns:
+            List of action definitions with name, description, and parameters.
+        """
+        ...
+class BaseTool:
+    """Base class for tool implementations.
+    Subclass this to create custom tools. Override `invoke` to handle
+    actions and `get_actions` to advertise available actions.
+    Attributes:
+        name: Tool instance name from config.
+        description: Tool description from config.
+        config: Tool-specific configuration dict.
+    """
+    def __init__(self, config: ToolConfig) -> None:
+        """Initialize the tool from configuration.
+        Args:
+            config: Tool configuration containing name, description, and options.
+        """
+        self.name = config.name
+        self.description = config.description
+        self.config = config.config
+    def invoke(self, action: str, args: dict[str, Any], env_state: dict[str, Any]) -> ToolResult:
+        """Invoke a tool action.
+        Override in subclasses to implement action handling.
+        Args:
+            action: The action to perform.
+            args: Arguments for the action.
+            env_state: Current environment state (can be modified).
+        Returns:
+            Result of the action invocation.
+        """
+        return ToolResult(success=False, error=f"Unknown action: {action}")
+    def get_actions(self) -> list[dict[str, Any]]:
+        """Get list of available actions with their schemas.
+        Override in subclasses to advertise available actions.
+        Returns:
+            List of action definitions with name, description, and parameters.
+        """
+        return []