PyPI - sandboxy - Versions diffs - 0.0.1__py3-none-any.whl - Mend

sandboxy 0.0.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (60) hide show

sandboxy/__init__.py +3 -0
sandboxy/agents/__init__.py +21 -0
sandboxy/agents/base.py +66 -0
sandboxy/agents/llm_prompt.py +308 -0
sandboxy/agents/loader.py +222 -0
sandboxy/api/__init__.py +5 -0
sandboxy/api/app.py +76 -0
sandboxy/api/routes/__init__.py +1 -0
sandboxy/api/routes/agents.py +92 -0
sandboxy/api/routes/local.py +1388 -0
sandboxy/api/routes/tools.py +106 -0
sandboxy/cli/__init__.py +1 -0
sandboxy/cli/main.py +1196 -0
sandboxy/cli/type_detector.py +48 -0
sandboxy/config.py +49 -0
sandboxy/core/__init__.py +1 -0
sandboxy/core/async_runner.py +824 -0
sandboxy/core/mdl_parser.py +441 -0
sandboxy/core/runner.py +599 -0
sandboxy/core/safe_eval.py +165 -0
sandboxy/core/state.py +234 -0
sandboxy/datasets/__init__.py +20 -0
sandboxy/datasets/loader.py +193 -0
sandboxy/datasets/runner.py +442 -0
sandboxy/errors.py +166 -0
sandboxy/local/context.py +235 -0
sandboxy/local/results.py +173 -0
sandboxy/logging.py +31 -0
sandboxy/mcp/__init__.py +25 -0
sandboxy/mcp/client.py +360 -0
sandboxy/mcp/wrapper.py +99 -0
sandboxy/providers/__init__.py +34 -0
sandboxy/providers/anthropic_provider.py +271 -0
sandboxy/providers/base.py +123 -0
sandboxy/providers/http_client.py +101 -0
sandboxy/providers/openai_provider.py +282 -0
sandboxy/providers/openrouter.py +958 -0
sandboxy/providers/registry.py +199 -0
sandboxy/scenarios/__init__.py +11 -0
sandboxy/scenarios/comparison.py +491 -0
sandboxy/scenarios/loader.py +262 -0
sandboxy/scenarios/runner.py +468 -0
sandboxy/scenarios/unified.py +1434 -0
sandboxy/session/__init__.py +21 -0
sandboxy/session/manager.py +278 -0
sandboxy/tools/__init__.py +34 -0
sandboxy/tools/base.py +127 -0
sandboxy/tools/loader.py +270 -0
sandboxy/tools/yaml_tools.py +708 -0
sandboxy/ui/__init__.py +27 -0
sandboxy/ui/dist/assets/index-CgAkYWrJ.css +1 -0
sandboxy/ui/dist/assets/index-D4zoGFcr.js +347 -0
sandboxy/ui/dist/index.html +14 -0
sandboxy/utils/__init__.py +3 -0
sandboxy/utils/time.py +20 -0
sandboxy-0.0.1.dist-info/METADATA +241 -0
sandboxy-0.0.1.dist-info/RECORD +60 -0
sandboxy-0.0.1.dist-info/WHEEL +4 -0
sandboxy-0.0.1.dist-info/entry_points.txt +3 -0
sandboxy-0.0.1.dist-info/licenses/LICENSE +201 -0

sandboxy/core/mdl_parser.py ADDED Viewed

@@ -0,0 +1,441 @@
+"""MDL (Module Definition Language) parser - YAML to ModuleSpec."""
+import logging
+import re
+from pathlib import Path
+from typing import Any
+import yaml
+logger = logging.getLogger(__name__)
+from sandboxy.core.state import (
+    EnvConfig,
+    EvaluationCheck,
+    ModuleSpec,
+    ModuleVariable,
+    ScoringConfig,
+    Step,
+    ToolRef,
+    VariableOption,
+)
+class MDLParseError(Exception):
+    """Error parsing MDL module."""
+    pass
+def load_module(path: Path) -> ModuleSpec:
+    """Load and parse an MDL module from a YAML file.
+    Args:
+        path: Path to the YAML module file.
+    Returns:
+        Parsed ModuleSpec.
+    Raises:
+        MDLParseError: If the file cannot be parsed or is invalid.
+    """
+    try:
+        raw: dict[str, Any] = yaml.safe_load(path.read_text())
+    except yaml.YAMLError as e:
+        raise MDLParseError(f"Invalid YAML: {e}") from e
+    except FileNotFoundError as e:
+        raise MDLParseError(f"File not found: {path}") from e
+    if not isinstance(raw, dict):
+        raise MDLParseError("Module must be a YAML mapping")
+    return parse_module(raw)
+def parse_module(raw: dict[str, Any]) -> ModuleSpec:
+    """Parse a raw dictionary into a ModuleSpec.
+    Args:
+        raw: Raw dictionary from YAML parsing.
+    Returns:
+        Parsed ModuleSpec.
+    Raises:
+        MDLParseError: If required fields are missing or invalid.
+    """
+    if "id" not in raw:
+        raise MDLParseError("Module must have an 'id' field")
+    # Parse variables
+    variables = []
+    for v in raw.get("variables", []):
+        options = None
+        if v.get("options"):
+            options = [VariableOption(value=o["value"], label=o["label"]) for o in v["options"]]
+        variables.append(
+            ModuleVariable(
+                name=v["name"],
+                label=v.get("label", v["name"]),
+                description=v.get("description", ""),
+                type=v.get("type", "string"),
+                default=v.get("default"),
+                options=options,
+                min=v.get("min"),
+                max=v.get("max"),
+                step=v.get("step"),
+            )
+        )
+    # Parse environment
+    env_raw = raw.get("environment", {})
+    tools = [
+        ToolRef(
+            name=t["name"],
+            type=t["type"],
+            description=t.get("description", ""),
+            config=t.get("config", {}),
+        )
+        for t in env_raw.get("tools", [])
+    ]
+    environment = EnvConfig(
+        sandbox_type=env_raw.get("sandbox_type", "local"),
+        tools=tools,
+        initial_state=env_raw.get("initial_state", {}),
+    )
+    # Parse steps (with condition support)
+    steps = [
+        Step(
+            id=s["id"],
+            action=s["action"],
+            params=s.get("params", {}),
+            condition=s.get("condition"),
+        )
+        for s in raw.get("steps", [])
+    ]
+    # Parse branches
+    branches: dict[str, list[Step]] = {}
+    for name, branch_steps in (raw.get("branches") or {}).items():
+        branches[name] = [
+            Step(
+                id=s["id"],
+                action=s["action"],
+                params=s.get("params", {}),
+                condition=s.get("condition"),
+            )
+            for s in branch_steps
+        ]
+    # Parse evaluation
+    evaluation = []
+    for e in raw.get("evaluation", []):
+        check = EvaluationCheck(
+            name=e["name"],
+            kind=e["kind"],
+            # Common fields
+            target=e.get("target"),
+            value=e.get("value"),
+            expected=e.get("expected", True),
+            # Type-specific fields
+            pattern=e.get("pattern"),
+            case_sensitive=e.get("case_sensitive", False),
+            min=e.get("min"),
+            max=e.get("max"),
+            tool=e.get("tool"),
+            action=e.get("action"),
+            key=e.get("key"),
+            # Legacy support
+            config=e.get("config", {}),
+        )
+        evaluation.append(check)
+    # Parse agent_config (support both keys)
+    agent_config = raw.get("agent_config") or raw.get("agent", {})
+    if isinstance(agent_config, dict) and "system_prompt" not in agent_config:
+        # Handle "agent:" block with system_prompt inside
+        if "system_prompt" in raw.get("agent", {}):
+            agent_config = raw["agent"]
+    # Parse scoring config
+    scoring_raw = raw.get("scoring", {})
+    scoring = ScoringConfig(
+        formula=scoring_raw.get("formula"),
+        weights=scoring_raw.get("weights", {}),
+        normalize=scoring_raw.get("normalize", False),
+        min_score=scoring_raw.get("min_score", 0.0),
+        max_score=scoring_raw.get("max_score", 100.0),
+    )
+    return ModuleSpec(
+        id=raw["id"],
+        description=raw.get("description", ""),
+        variables=variables,
+        agent_config=agent_config,
+        environment=environment,
+        steps=steps,
+        branches=branches,
+        evaluation=evaluation,
+        scoring=scoring,
+    )
+def interpolate_template(text: str, variables: dict[str, Any]) -> str:
+    """Interpolate variables into a template string.
+    Supports:
+    - {{variable}} - Simple variable substitution
+    - {{#if condition}}...{{else if condition}}...{{else}}...{{/if}} - Conditional blocks with else-if
+    Args:
+        text: Template string with {{variable}} placeholders.
+        variables: Dictionary of variable values.
+    Returns:
+        Interpolated string.
+    """
+    if not text:
+        return text
+    # Process conditional blocks with support for else-if chains
+    # Match {{#if ...}}...{{/if}} blocks
+    if_pattern = re.compile(r"\{\{#if\s+(.+?)\}\}(.*?)\{\{/if\}\}", re.DOTALL)
+    def eval_if_block(match: re.Match) -> str:
+        condition = match.group(1).strip()
+        body = match.group(2) or ""
+        # Parse the body for else-if and else clauses
+        # Split by {{else if ...}} and {{else}}
+        parts = re.split(r"\{\{else if\s+(.+?)\}\}|\{\{else\}\}", body)
+        # parts[0] is the content for the first if condition
+        # Then alternating: condition (or None for else), content
+        # Build list of (condition, content) tuples
+        branches: list[tuple[str | None, str]] = [(condition, parts[0])]
+        i = 1
+        while i < len(parts):
+            if i + 1 < len(parts) and parts[i] is not None:
+                # This is an else-if: parts[i] is condition, parts[i+1] is content
+                branches.append((parts[i].strip(), parts[i + 1]))
+                i += 2
+            elif parts[i] is None:
+                # This is an else: content is in the next part
+                if i + 1 < len(parts):
+                    branches.append((None, parts[i + 1]))
+                    i += 2
+                else:
+                    i += 1
+            else:
+                # Orphaned content (shouldn't happen in well-formed templates)
+                branches.append((None, parts[i]))
+                i += 1
+        # Evaluate branches in order
+        for cond, content in branches:
+            if cond is None:
+                # This is the else clause - always matches
+                return content.strip()
+            try:
+                if _eval_condition(cond, variables):
+                    return content.strip()
+            except Exception:
+                continue
+        # No branch matched
+        return ""
+    text = if_pattern.sub(eval_if_block, text)
+    # Simple variable substitution: {{variable}}
+    def replace_var(match: re.Match) -> str:
+        var_name = match.group(1).strip()
+        return str(variables.get(var_name, f"{{{{{var_name}}}}}"))
+    var_pattern = re.compile(r"\{\{(\w+)\}\}")
+    text = var_pattern.sub(replace_var, text)
+    return text
+def _eval_condition(condition: str, variables: dict[str, Any]) -> bool:
+    """Safely evaluate a condition expression.
+    Args:
+        condition: Condition expression (e.g., "sophistication >= 7").
+        variables: Dictionary of variable values.
+    Returns:
+        Boolean result of condition evaluation.
+    """
+    # Safe builtins for condition evaluation
+    safe_builtins = {
+        "True": True,
+        "False": False,
+        "None": None,
+        "len": len,
+        "str": str,
+        "int": int,
+        "float": float,
+        "bool": bool,
+    }
+    # Create evaluation context
+    safe_globals = {"__builtins__": safe_builtins}
+    safe_globals.update(variables)
+    try:
+        return bool(eval(condition, safe_globals, {}))
+    except Exception:
+        return False
+def _interpolate_value(value: Any, var_dict: dict[str, Any]) -> Any:
+    """Recursively interpolate variables in a value.
+    Handles strings, dicts, and lists. For strings that look like
+    pure variable references (e.g., "{{starting_cash}}"), attempts
+    to return the actual typed value instead of a string.
+    """
+    if isinstance(value, str):
+        # Check if it's a pure variable reference like "{{var_name}}"
+        pure_var_match = re.match(r"^\{\{(\w+)\}\}$", value.strip())
+        if pure_var_match:
+            var_name = pure_var_match.group(1)
+            if var_name in var_dict:
+                return var_dict[var_name]
+        # Otherwise do string interpolation
+        return interpolate_template(value, var_dict)
+    if isinstance(value, dict):
+        return {k: _interpolate_value(v, var_dict) for k, v in value.items()}
+    if isinstance(value, list):
+        return [_interpolate_value(item, var_dict) for item in value]
+    return value
+def apply_variables(module: ModuleSpec, variables: dict[str, Any]) -> ModuleSpec:
+    """Apply variable values to a module, interpolating templates.
+    Args:
+        module: Module specification.
+        variables: Dictionary of variable values (from user or defaults).
+    Returns:
+        New ModuleSpec with interpolated values.
+    """
+    # Build complete variable dict with defaults
+    var_dict: dict[str, Any] = {}
+    for var in module.variables:
+        var_dict[var.name] = var.default
+    var_dict.update(variables)
+    # Interpolate agent_config system_prompt
+    agent_config = dict(module.agent_config)
+    if "system_prompt" in agent_config:
+        agent_config["system_prompt"] = interpolate_template(
+            agent_config["system_prompt"], var_dict
+        )
+    # Interpolate environment config (tools and initial_state)
+    new_tools = []
+    for tool in module.environment.tools:
+        new_config = _interpolate_value(tool.config, var_dict)
+        new_tools.append(
+            ToolRef(
+                name=tool.name,
+                type=tool.type,
+                description=tool.description,
+                config=new_config,
+            )
+        )
+    new_initial_state = _interpolate_value(dict(module.environment.initial_state), var_dict)
+    new_environment = EnvConfig(
+        sandbox_type=module.environment.sandbox_type,
+        tools=new_tools,
+        initial_state=new_initial_state,
+    )
+    # Interpolate step params and filter by condition
+    new_steps: list[Step] = []
+    for step in module.steps:
+        # Check condition if present
+        if step.condition:
+            if not _eval_condition(step.condition, var_dict):
+                continue  # Skip this step
+        # Interpolate params
+        new_params = _interpolate_value(dict(step.params), var_dict)
+        new_steps.append(
+            Step(
+                id=step.id,
+                action=step.action,
+                params=new_params,
+                condition=None,  # Condition already evaluated
+            )
+        )
+    # Return new module with interpolated values
+    return ModuleSpec(
+        id=module.id,
+        description=module.description,
+        variables=module.variables,
+        agent_config=agent_config,
+        environment=new_environment,
+        steps=new_steps,
+        branches=module.branches,  # TODO: interpolate branches too if needed
+        evaluation=module.evaluation,
+        scoring=module.scoring,
+    )
+def validate_module(path: Path) -> list[str]:
+    """Validate an MDL module and return any errors.
+    Args:
+        path: Path to the YAML module file.
+    Returns:
+        List of validation error messages (empty if valid).
+    """
+    errors: list[str] = []
+    try:
+        module = load_module(path)
+    except MDLParseError as e:
+        return [str(e)]
+    # Validate steps have valid actions
+    valid_actions = {"inject_user", "await_user", "await_agent", "branch", "tool_call"}
+    for step in module.steps:
+        if step.action not in valid_actions:
+            errors.append(f"Step '{step.id}' has invalid action: {step.action}")
+    # Validate branch references exist
+    for step in module.steps:
+        if step.action == "branch":
+            branch_name = step.params.get("branch_name")
+            if branch_name and branch_name not in module.branches:
+                errors.append(f"Step '{step.id}' references unknown branch: {branch_name}")
+    # Validate evaluation checks have valid kinds
+    valid_kinds = {
+        "contains",
+        "regex",
+        "count",
+        "tool_called",
+        "equals",
+        "env_state",
+        "deterministic",
+        "llm",
+    }
+    for check in module.evaluation:
+        if check.kind not in valid_kinds:
+            errors.append(f"Evaluation '{check.name}' has invalid kind: {check.kind}")
+    return errors