tollgate 1.0.4__py3-none-any.whl → 1.4.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,360 @@
1
+ """Policy testing framework for Tollgate.
2
+
3
+ Enables declarative scenario-based testing of Tollgate policies to prevent
4
+ regressions in CI. Test scenarios are defined in YAML and run against a
5
+ policy evaluator.
6
+
7
+ Usage:
8
+
9
+ # From Python:
10
+ from tollgate.policy_testing import PolicyTestRunner
11
+
12
+ runner = PolicyTestRunner("policy.yaml", "test_scenarios.yaml")
13
+ results = runner.run()
14
+ assert results.all_passed
15
+
16
+ # From CLI:
17
+ tollgate test-policy policy.yaml --scenarios test_scenarios.yaml
18
+
19
+ Scenario file format:
20
+
21
+ scenarios:
22
+ - name: "Allow read operations"
23
+ description: "Read effects should be allowed for trusted agents"
24
+ agent:
25
+ agent_id: "agent-1"
26
+ version: "1.0"
27
+ owner: "team-a"
28
+ intent:
29
+ action: "fetch_data"
30
+ reason: "Customer request"
31
+ tool_request:
32
+ tool: "api:fetch"
33
+ action: "get"
34
+ resource_type: "url"
35
+ effect: "read"
36
+ params: {}
37
+ manifest_version: "1.0.0"
38
+ expected:
39
+ decision: "ALLOW" # Required: ALLOW, ASK, or DENY
40
+ reason_contains: "Rule" # Optional: substring match on reason
41
+ policy_id: "allow_read" # Optional: exact match on policy_id
42
+ """
43
+
44
+ import sys
45
+ import time
46
+ from dataclasses import dataclass, field
47
+ from pathlib import Path
48
+ from typing import Any
49
+
50
+ import yaml
51
+
52
+ from .policy import YamlPolicyEvaluator
53
+ from .types import AgentContext, DecisionType, Effect, Intent, ToolRequest
54
+
55
+
56
+ @dataclass
57
+ class ScenarioResult:
58
+ """Result of a single test scenario."""
59
+
60
+ name: str
61
+ passed: bool
62
+ expected_decision: str
63
+ actual_decision: str
64
+ expected_reason_contains: str | None = None
65
+ actual_reason: str | None = None
66
+ expected_policy_id: str | None = None
67
+ actual_policy_id: str | None = None
68
+ errors: list[str] = field(default_factory=list)
69
+ duration_ms: float = 0.0
70
+
71
+ def __str__(self) -> str:
72
+ status = "PASS" if self.passed else "FAIL"
73
+ msg = f" [{status}] {self.name}"
74
+ if not self.passed:
75
+ for err in self.errors:
76
+ msg += f"\n {err}"
77
+ return msg
78
+
79
+
80
@dataclass
class PolicyTestRunResult:
    """Aggregate outcome of a full scenario run."""

    scenario_results: list[ScenarioResult]
    total: int = 0
    passed: int = 0
    failed: int = 0
    duration_ms: float = 0.0

    @property
    def all_passed(self) -> bool:
        """True when no scenario failed."""
        return self.failed == 0

    def summary(self) -> str:
        """Build a human-readable, multi-line report of the run."""
        bar = "=" * 60
        out = [
            "",
            bar,
            f" Policy Test Results: {self.passed}/{self.total} passed",
            bar,
        ]
        out.extend(str(result) for result in self.scenario_results)
        out.append("-" * 60)
        verdict = "ALL PASSED" if self.all_passed else f"{self.failed} FAILED"
        out.append(f" {verdict} ({self.duration_ms:.1f}ms)")
        out.append("")
        return "\n".join(out)
108
+
109
+
110
class PolicyTestRunner:
    """Run declarative policy test scenarios.

    Args:
        policy_path: Path to the policy YAML file.
        scenarios_path: Path to the test scenarios YAML file.
        policy_evaluator: Optional pre-configured evaluator (overrides policy_path).
        scenarios: Optional in-memory scenario list (overrides scenarios_path).

    Raises:
        FileNotFoundError: If scenarios_path does not point to an existing file.
        ValueError: If no policy/scenario source is given, or a scenario
            definition is structurally invalid.
    """

    def __init__(
        self,
        policy_path: str | Path | None = None,
        scenarios_path: str | Path | None = None,
        *,
        policy_evaluator: Any | None = None,
        scenarios: list[dict[str, Any]] | None = None,
    ):
        # Load policy: an explicit evaluator wins over a policy file path.
        if policy_evaluator is not None:
            self._evaluator = policy_evaluator
        elif policy_path is not None:
            self._evaluator = YamlPolicyEvaluator(policy_path)
        else:
            raise ValueError("Either policy_path or policy_evaluator must be provided")

        # Load scenarios: an in-memory list wins over a scenarios file path.
        if scenarios is not None:
            self._scenarios = scenarios
        elif scenarios_path is not None:
            self._scenarios = self._load_scenarios(scenarios_path)
        else:
            raise ValueError("Either scenarios_path or scenarios must be provided")

        # Fail fast on malformed scenarios instead of mid-run.
        self._validate_scenarios()

    @staticmethod
    def _load_scenarios(path: str | Path) -> list[dict[str, Any]]:
        """Read the scenarios YAML file and return its 'scenarios' list."""
        path = Path(path)
        if not path.exists():
            raise FileNotFoundError(f"Scenarios file not found: {path}")

        with path.open("r") as f:
            data = yaml.safe_load(f)

        if not data or "scenarios" not in data:
            raise ValueError(f"Scenarios file must contain a 'scenarios' key: {path}")

        scenarios = data["scenarios"]
        # Robustness fix: a bare "scenarios:" key (YAML null) or a scalar
        # value previously slipped through and surfaced later as an opaque
        # TypeError during validation.
        if not isinstance(scenarios, list):
            raise ValueError(f"'scenarios' must be a list: {path}")

        return scenarios

    def _validate_scenarios(self):
        """Validate scenario structure before running."""
        for i, scenario in enumerate(self._scenarios):
            # Robustness fix: non-mapping entries previously crashed with
            # an AttributeError on .get().
            if not isinstance(scenario, dict):
                raise ValueError(f"Scenario {i} must be a mapping")
            name = scenario.get("name", f"Scenario {i}")
            if "expected" not in scenario:
                raise ValueError(f"Scenario '{name}' is missing 'expected' key")
            if "decision" not in scenario["expected"]:
                raise ValueError(
                    f"Scenario '{name}' expected section must include 'decision'"
                )
            try:
                # The DecisionType enum is the source of truth for valid
                # decision strings (ALLOW / ASK / DENY).
                DecisionType(scenario["expected"]["decision"])
            except ValueError:
                raise ValueError(
                    f"Scenario '{name}' has invalid expected decision: "
                    f"'{scenario['expected']['decision']}'"
                ) from None

    def run(self) -> PolicyTestRunResult:
        """Run all test scenarios and return aggregate results."""
        start = time.monotonic()
        results: list[ScenarioResult] = [
            self._run_scenario(scenario) for scenario in self._scenarios
        ]

        total_ms = (time.monotonic() - start) * 1000
        passed = sum(1 for r in results if r.passed)

        return PolicyTestRunResult(
            scenario_results=results,
            total=len(results),
            passed=passed,
            failed=len(results) - passed,
            duration_ms=total_ms,
        )

    def _run_scenario(self, scenario: dict[str, Any]) -> ScenarioResult:
        """Run one scenario and compare the decision against expectations."""
        name = scenario.get("name", "Unnamed scenario")
        expected = scenario["expected"]
        expected_decision = expected["decision"]
        expected_reason_contains = expected.get("reason_contains")
        expected_policy_id = expected.get("policy_id")

        start = time.monotonic()
        errors: list[str] = []

        try:
            agent_ctx = self._build_agent_context(scenario.get("agent", {}))
            intent = self._build_intent(scenario.get("intent", {}))
            tool_request = self._build_tool_request(scenario.get("tool_request", {}))

            decision = self._evaluator.evaluate(agent_ctx, intent, tool_request)

            actual_decision = decision.decision.value
            actual_reason = decision.reason
            actual_policy_id = decision.policy_id

            # Check decision (exact match, required)
            if actual_decision != expected_decision:
                errors.append(
                    f"Decision: expected '{expected_decision}', got '{actual_decision}'"
                )

            # Check reason (substring match, optional)
            if expected_reason_contains and expected_reason_contains not in (
                actual_reason or ""
            ):
                errors.append(
                    f"Reason: expected to contain '{expected_reason_contains}', "
                    f"got '{actual_reason}'"
                )

            # Check policy_id (exact match, optional)
            if expected_policy_id and actual_policy_id != expected_policy_id:
                errors.append(
                    f"Policy ID: expected '{expected_policy_id}', "
                    f"got '{actual_policy_id}'"
                )

        except Exception as e:
            # An evaluator crash is reported as a failure of this one
            # scenario rather than aborting the whole run.
            actual_decision = "ERROR"
            actual_reason = str(e)
            actual_policy_id = None
            errors.append(f"Exception: {e}")

        duration_ms = (time.monotonic() - start) * 1000

        return ScenarioResult(
            name=name,
            passed=len(errors) == 0,
            expected_decision=expected_decision,
            actual_decision=actual_decision,
            expected_reason_contains=expected_reason_contains,
            actual_reason=actual_reason,
            expected_policy_id=expected_policy_id,
            actual_policy_id=actual_policy_id,
            errors=errors,
            duration_ms=duration_ms,
        )

    @staticmethod
    def _build_agent_context(data: dict[str, Any]) -> AgentContext:
        """Build an AgentContext from scenario data, with test defaults."""
        delegated_by = data.get("delegated_by")
        delegated_by = tuple(delegated_by) if delegated_by is not None else ()
        return AgentContext(
            agent_id=data.get("agent_id", "test-agent"),
            version=data.get("version", "1.0"),
            owner=data.get("owner", "test-owner"),
            metadata=data.get("metadata", {}),
            delegated_by=delegated_by,
        )

    @staticmethod
    def _build_intent(data: dict[str, Any]) -> Intent:
        """Build an Intent from scenario data, with test defaults."""
        return Intent(
            action=data.get("action", "test_action"),
            reason=data.get("reason", "test reason"),
            confidence=data.get("confidence"),
            metadata=data.get("metadata", {}),
        )

    @staticmethod
    def _build_tool_request(data: dict[str, Any]) -> ToolRequest:
        """Build a ToolRequest from scenario data, with test defaults."""
        effect_str = data.get("effect", "unknown")
        try:
            effect = Effect(effect_str)
        except ValueError:
            # Unrecognized effect strings degrade to Effect.UNKNOWN rather
            # than failing the scenario at build time.
            effect = Effect.UNKNOWN

        return ToolRequest(
            tool=data.get("tool", "unknown"),
            action=data.get("action", "unknown"),
            resource_type=data.get("resource_type", "unknown"),
            effect=effect,
            params=data.get("params", {}),
            metadata=data.get("metadata", {}),
            manifest_version=data.get("manifest_version"),
        )
304
+
305
+
306
def cli_main(args: list[str] | None = None) -> int:
    """CLI entry point for ``tollgate test-policy``.

    Usage:
        tollgate test-policy policy.yaml --scenarios test_scenarios.yaml
        tollgate test-policy policy.yaml -s test_scenarios.yaml --strict

    Returns exit code 0 on success, 1 on failure.
    """
    import argparse

    parser = argparse.ArgumentParser(
        prog="tollgate test-policy",
        description="Run declarative policy test scenarios against a Tollgate policy.",
    )
    parser.add_argument(
        "policy_path",
        help="Path to the policy YAML file",
    )
    parser.add_argument(
        "--scenarios", "-s",
        required=True,
        help="Path to the test scenarios YAML file",
    )
    parser.add_argument(
        "--strict",
        action="store_true",
        help="Exit with code 1 on any failure (default behavior)",
    )
    parser.add_argument(
        "--quiet", "-q",
        action="store_true",
        help="Only show failures and summary",
    )

    opts = parser.parse_args(args)

    # Setup problems (missing files, malformed scenarios) exit with code 2
    # to distinguish them from test failures (code 1).
    try:
        runner = PolicyTestRunner(opts.policy_path, opts.scenarios)
    except (FileNotFoundError, ValueError) as exc:
        print(f"Error: {exc}", file=sys.stderr)
        return 2

    run_result = runner.run()

    if not opts.quiet:
        print(run_result.summary())
    else:
        # Quiet mode: failed scenarios only, then a one-line tally.
        for res in run_result.scenario_results:
            if not res.passed:
                print(str(res))
        print(f"\n{run_result.passed}/{run_result.total} passed, {run_result.failed} failed")

    return 0 if run_result.all_passed else 1
@@ -0,0 +1,162 @@
1
+ """Rate limiting for AI agent tool calls.
2
+
3
+ Provides a sliding-window rate limiter that tracks per-agent, per-tool
4
+ call frequency and blocks calls that exceed configured thresholds.
5
+ """
6
+
7
+ import asyncio
8
+ import time
9
+ from typing import Any, Protocol, runtime_checkable
10
+
11
+ from .types import AgentContext, Effect, ToolRequest
12
+
13
+
14
@runtime_checkable
class RateLimiter(Protocol):
    """Structural interface for rate limiting backends.

    Any object providing a matching ``check_rate_limit`` coroutine
    satisfies this protocol — implement it to plug in a custom backend
    (Redis, etc.). InMemoryRateLimiter serves as the reference
    implementation.
    """

    async def check_rate_limit(
        self, agent_ctx: AgentContext, tool_request: ToolRequest
    ) -> tuple[bool, str | None, float | None]:
        """Decide whether a tool call should be rate-limited.

        Returns:
            A ``(allowed, reason, retry_after)`` triple:
            - allowed: True if the call is within limits
            - reason: Human-readable reason if blocked (None if allowed)
            - retry_after: Seconds until the window resets (None if allowed)
        """
        ...
34
+
35
+
36
class RateLimitRule:
    """One rate-limit rule parsed from configuration."""

    def __init__(
        self,
        *,
        agent_id: str = "*",
        tool: str = "*",
        effect: str | None = None,
        max_calls: int,
        window_seconds: int,
    ):
        self.agent_id = agent_id
        self.tool = tool
        self.effect = effect
        self.max_calls = max_calls
        self.window_seconds = window_seconds

    def matches(
        self, agent_ctx: AgentContext, tool_request: ToolRequest
    ) -> bool:
        """Return True when this rule applies to the given request."""
        # Agent filter: "*" matches any agent.
        if self.agent_id not in ("*", agent_ctx.agent_id):
            return False

        # Tool filter: "*" matches all tools; a trailing "*" acts as a
        # prefix wildcard (e.g. "mcp:*" matches "mcp:fetch").
        if self.tool != "*":
            pattern = self.tool
            if pattern.endswith("*"):
                if not tool_request.tool.startswith(pattern[:-1]):
                    return False
            elif tool_request.tool != pattern:
                return False

        # Effect filter: an effect string that is not a valid Effect value
        # matches nothing.
        if self.effect is not None:
            try:
                wanted = Effect(self.effect)
            except ValueError:
                return False
            if wanted != tool_request.effect:
                return False

        return True

    def bucket_key(self, agent_ctx: AgentContext) -> str:
        """Unique sliding-window bucket key for this rule + calling agent."""
        return f"{self.agent_id}|{self.tool}|{self.effect or '*'}|{agent_ctx.agent_id}"
83
+
84
+
85
class InMemoryRateLimiter:
    """Sliding-window rate limiter with in-memory storage.

    Config is a list of rule dicts, typically from policy.yaml:

        rate_limits:
          - agent_id: "*"
            tool: "*"
            max_calls: 100
            window_seconds: 60
          - agent_id: "*"
            effect: "write"
            max_calls: 10
            window_seconds: 60
    """

    def __init__(self, rules: list[dict[str, Any]] | None = None):
        # Rules are evaluated in config order; the first violation wins.
        self._rules: list[RateLimitRule] = []
        # bucket key -> call timestamps (appended in time order).
        self._buckets: dict[str, list[float]] = {}
        self._lock = asyncio.Lock()

        if rules:
            for r in rules:
                self._rules.append(
                    RateLimitRule(
                        agent_id=r.get("agent_id", "*"),
                        tool=r.get("tool", "*"),
                        effect=r.get("effect"),
                        max_calls=r["max_calls"],
                        window_seconds=r["window_seconds"],
                    )
                )

    async def check_rate_limit(
        self, agent_ctx: AgentContext, tool_request: ToolRequest
    ) -> tuple[bool, str | None, float | None]:
        """Check all matching rules. First violation wins.

        Bug fix: the call is recorded only after ALL matching rules have
        allowed it. Previously a call blocked by a later rule had already
        been appended to earlier (more permissive) rules' buckets, so
        repeatedly-denied attempts consumed quota for calls that never ran.
        """
        now = time.time()

        async with self._lock:
            # Phase 1: prune each matching rule's window and look for a
            # violation WITHOUT recording the call.
            allowed_buckets: list[list[float]] = []
            for rule in self._rules:
                if not rule.matches(agent_ctx, tool_request):
                    continue

                key = rule.bucket_key(agent_ctx)
                window_start = now - rule.window_seconds

                # Drop timestamps that have aged out of the window.
                bucket = [t for t in self._buckets.get(key, []) if t > window_start]
                self._buckets[key] = bucket

                if len(bucket) >= rule.max_calls:
                    # Rate limit exceeded; bucket[0] is the oldest call in
                    # the window, so the window frees up when it expires.
                    oldest_in_window = bucket[0] if bucket else now
                    retry_after = oldest_in_window + rule.window_seconds - now
                    reason = (
                        f"Rate limit exceeded: {len(bucket)}/{rule.max_calls} "
                        f"calls in {rule.window_seconds}s window "
                        f"(agent={agent_ctx.agent_id}, "
                        f"tool={rule.tool}, effect={rule.effect or '*'})"
                    )
                    return False, reason, max(0.0, retry_after)

                allowed_buckets.append(bucket)

            # Phase 2: every matching rule allowed the call — record it
            # once per matching bucket.
            for bucket in allowed_buckets:
                bucket.append(now)

        return True, None, None

    async def reset(self, agent_id: str | None = None) -> None:
        """Clear rate limit state. If agent_id is given, clear only that agent."""
        async with self._lock:
            if agent_id is None:
                self._buckets.clear()
            else:
                # Bucket keys end with "|<agent_id>" (see RateLimitRule.bucket_key).
                stale = [k for k in self._buckets if k.endswith(f"|{agent_id}")]
                for k in stale:
                    del self._buckets[k]