routekitai-0.1.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (64)
  1. routekitai/__init__.py +53 -0
  2. routekitai/cli/__init__.py +18 -0
  3. routekitai/cli/main.py +40 -0
  4. routekitai/cli/replay.py +80 -0
  5. routekitai/cli/run.py +95 -0
  6. routekitai/cli/serve.py +966 -0
  7. routekitai/cli/test_agent.py +178 -0
  8. routekitai/cli/trace.py +209 -0
  9. routekitai/cli/trace_analyze.py +120 -0
  10. routekitai/cli/trace_search.py +126 -0
  11. routekitai/core/__init__.py +58 -0
  12. routekitai/core/agent.py +325 -0
  13. routekitai/core/errors.py +49 -0
  14. routekitai/core/hooks.py +174 -0
  15. routekitai/core/memory.py +54 -0
  16. routekitai/core/message.py +132 -0
  17. routekitai/core/model.py +91 -0
  18. routekitai/core/policies.py +373 -0
  19. routekitai/core/policy.py +85 -0
  20. routekitai/core/policy_adapter.py +133 -0
  21. routekitai/core/runtime.py +1403 -0
  22. routekitai/core/tool.py +148 -0
  23. routekitai/core/tools.py +180 -0
  24. routekitai/evals/__init__.py +13 -0
  25. routekitai/evals/dataset.py +75 -0
  26. routekitai/evals/metrics.py +101 -0
  27. routekitai/evals/runner.py +184 -0
  28. routekitai/graphs/__init__.py +12 -0
  29. routekitai/graphs/executors.py +457 -0
  30. routekitai/graphs/graph.py +164 -0
  31. routekitai/memory/__init__.py +13 -0
  32. routekitai/memory/episodic.py +242 -0
  33. routekitai/memory/kv.py +34 -0
  34. routekitai/memory/retrieval.py +192 -0
  35. routekitai/memory/vector.py +700 -0
  36. routekitai/memory/working.py +66 -0
  37. routekitai/message.py +29 -0
  38. routekitai/model.py +48 -0
  39. routekitai/observability/__init__.py +21 -0
  40. routekitai/observability/analyzer.py +314 -0
  41. routekitai/observability/exporters/__init__.py +10 -0
  42. routekitai/observability/exporters/base.py +30 -0
  43. routekitai/observability/exporters/jsonl.py +81 -0
  44. routekitai/observability/exporters/otel.py +119 -0
  45. routekitai/observability/spans.py +111 -0
  46. routekitai/observability/streaming.py +117 -0
  47. routekitai/observability/trace.py +144 -0
  48. routekitai/providers/__init__.py +9 -0
  49. routekitai/providers/anthropic.py +227 -0
  50. routekitai/providers/azure_openai.py +243 -0
  51. routekitai/providers/local.py +196 -0
  52. routekitai/providers/openai.py +321 -0
  53. routekitai/py.typed +0 -0
  54. routekitai/sandbox/__init__.py +12 -0
  55. routekitai/sandbox/filesystem.py +131 -0
  56. routekitai/sandbox/network.py +142 -0
  57. routekitai/sandbox/permissions.py +70 -0
  58. routekitai/tool.py +33 -0
  59. routekitai-0.1.0.dist-info/METADATA +328 -0
  60. routekitai-0.1.0.dist-info/RECORD +64 -0
  61. routekitai-0.1.0.dist-info/WHEEL +5 -0
  62. routekitai-0.1.0.dist-info/entry_points.txt +2 -0
  63. routekitai-0.1.0.dist-info/licenses/LICENSE +21 -0
  64. routekitai-0.1.0.dist-info/top_level.txt +1 -0
routekitai/memory/working.py ADDED
@@ -0,0 +1,66 @@
+"""Working memory for current run."""
+
+from typing import Any
+
+from routekitai.core.memory import Memory
+
+
+class WorkingMemory(Memory):
+    """In-memory dict for current run.
+
+    Ephemeral memory that exists only for the duration of a single agent run.
+    """
+
+    def __init__(self) -> None:
+        """Initialize working memory."""
+        self._store: dict[str, Any] = {}
+        self._events: list[dict[str, Any]] = []
+
+    async def get(self, key: str) -> Any:
+        """Get value by key.
+
+        Args:
+            key: Key to retrieve
+
+        Returns:
+            Stored value or None if not found
+        """
+        return self._store.get(key)
+
+    async def set(self, key: str, value: Any) -> None:
+        """Set value by key.
+
+        Args:
+            key: Key to set
+            value: Value to store
+        """
+        self._store[key] = value
+
+    async def append(self, event: dict[str, Any]) -> None:
+        """Append an event to memory.
+
+        Args:
+            event: Event dictionary to append
+        """
+        self._events.append(event)
+
+    def clear(self) -> None:
+        """Clear all memory (useful for testing)."""
+        self._store.clear()
+        self._events.clear()
+
+    def get_all(self) -> dict[str, Any]:
+        """Get all stored key-value pairs.
+
+        Returns:
+            Dictionary of all stored values
+        """
+        return self._store.copy()
+
+    def get_events(self) -> list[dict[str, Any]]:
+        """Get all events.
+
+        Returns:
+            List of all events
+        """
+        return self._events.copy()
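
For orientation (not part of the package diff): a minimal usage sketch of WorkingMemory. Note that get/set/append are async while clear/get_all/get_events are synchronous helpers; the key and event values below are illustrative.

import asyncio

from routekitai.memory.working import WorkingMemory


async def main() -> None:
    mem = WorkingMemory()
    await mem.set("goal", "summarize the report")  # illustrative key/value
    await mem.append({"type": "tool_called"})      # illustrative event shape
    print(await mem.get("goal"))  # "summarize the report"
    print(mem.get_events())       # [{"type": "tool_called"}]
    mem.clear()                   # reset between test cases


asyncio.run(main())
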
routekitai/message.py ADDED
@@ -0,0 +1,29 @@
+"""Message primitive for RouteKit."""
+
+from enum import Enum
+from typing import Any
+
+from pydantic import BaseModel, Field
+
+
+class MessageRole(str, Enum):
+    """Message role types."""
+
+    USER = "user"
+    ASSISTANT = "assistant"
+    SYSTEM = "system"
+    TOOL = "tool"
+
+
+class Message(BaseModel):
+    """Represents a message in a conversation."""
+
+    role: MessageRole = Field(..., description="Message role")
+    content: str = Field(..., description="Message content")
+    metadata: dict[str, Any] = Field(default_factory=dict, description="Additional metadata")
+    tool_calls: list[dict[str, Any]] | None = Field(
+        default=None, description="Tool calls associated with this message"
+    )
+    tool_call_id: str | None = Field(
+        default=None, description="ID of the tool call this message responds to"
+    )
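
A short sketch of how these primitives compose into a tool-call round trip. The id/name/arguments keys inside tool_calls are an assumption; the schema only requires a list of dicts.

from routekitai.message import Message, MessageRole

# The assistant proposes a tool call; the tool's reply links back via tool_call_id.
# The id/name/arguments keys are hypothetical; the model only mandates dicts.
call = Message(
    role=MessageRole.ASSISTANT,
    content="",
    tool_calls=[{"id": "call_1", "name": "get_weather", "arguments": {"city": "Oslo"}}],
)
result = Message(role=MessageRole.TOOL, content='{"temp_c": 4}', tool_call_id="call_1")
print(result.model_dump(mode="json")["role"])  # "tool"
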
routekitai/model.py ADDED
@@ -0,0 +1,48 @@
+"""Model primitive for RouteKit."""
+
+from collections.abc import AsyncIterator, Iterator
+from typing import Any
+
+from pydantic import BaseModel, Field
+
+from routekitai.core.message import Message
+
+
+class Model(BaseModel):
+    """Represents an LLM model interface."""
+
+    name: str = Field(..., description="Model identifier")
+    provider: str = Field(..., description="Model provider")
+    config: dict[str, Any] = Field(default_factory=dict, description="Model configuration")
+
+    async def generate(
+        self,
+        messages: list["Message"],
+        **kwargs: Any,
+    ) -> AsyncIterator["Message"]:
+        """Generate a response stream from messages.
+
+        Args:
+            messages: List of input messages
+            **kwargs: Additional generation parameters
+
+        Yields:
+            Message chunks from the model
+        """
+        raise NotImplementedError("Subclasses must implement generate")
+
+    def generate_sync(
+        self,
+        messages: list["Message"],
+        **kwargs: Any,
+    ) -> Iterator["Message"]:
+        """Synchronous wrapper for generate.
+
+        Args:
+            messages: List of input messages
+            **kwargs: Additional generation parameters
+
+        Yields:
+            Message chunks from the model
+        """
+        raise NotImplementedError("Subclasses must implement generate_sync")
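
Since both methods raise NotImplementedError, providers are expected to subclass Model and implement generate as an async generator. A minimal sketch, assuming routekitai.core.message mirrors the Message/MessageRole primitives shown in routekitai/message.py above (the EchoModel itself is hypothetical):

import asyncio
from collections.abc import AsyncIterator
from typing import Any

from routekitai.message import Message, MessageRole  # assumed to mirror core.message
from routekitai.model import Model


class EchoModel(Model):
    """Hypothetical provider: streams the last message back one word at a time."""

    async def generate(
        self, messages: list[Message], **kwargs: Any
    ) -> AsyncIterator[Message]:
        for word in messages[-1].content.split():
            yield Message(role=MessageRole.ASSISTANT, content=word)


async def main() -> None:
    model = EchoModel(name="echo-1", provider="local")
    async for chunk in model.generate([Message(role=MessageRole.USER, content="hello world")]):
        print(chunk.content)  # "hello", then "world"


asyncio.run(main())
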
routekitai/observability/__init__.py ADDED
@@ -0,0 +1,21 @@
+"""Observability and tracing for RouteKit."""
+
+from routekitai.observability.analyzer import TraceAnalyzer, TraceMetrics
+from routekitai.observability.exporters.jsonl import JSONLExporter
+from routekitai.observability.exporters.otel import OTELExporter
+from routekitai.observability.spans import Span, SpanContext
+from routekitai.observability.streaming import TraceEventBroadcaster, get_broadcaster
+from routekitai.observability.trace import Trace, TraceCollector
+
+__all__ = [
+    "Trace",
+    "TraceCollector",
+    "Span",
+    "SpanContext",
+    "JSONLExporter",
+    "OTELExporter",
+    "TraceAnalyzer",
+    "TraceMetrics",
+    "TraceEventBroadcaster",
+    "get_broadcaster",
+]
routekitai/observability/analyzer.py ADDED
@@ -0,0 +1,314 @@
+"""Trace analysis and metrics calculation."""
+
+from typing import Any
+
+from pydantic import BaseModel, Field
+
+from routekitai.observability.trace import Trace, TraceEvent
+
+
+class TraceMetrics(BaseModel):
+    """Metrics calculated from a trace."""
+
+    model_config = {"protected_namespaces": ()}
+
+    total_events: int = Field(..., description="Total number of events")
+    total_duration_ms: float = Field(..., description="Total execution duration in milliseconds")
+    model_calls: int = Field(..., description="Number of model calls")
+    tool_calls: int = Field(..., description="Number of tool calls")
+    errors: int = Field(..., description="Number of errors")
+    total_tokens: int = Field(default=0, description="Total tokens used (prompt + completion)")
+    prompt_tokens: int = Field(default=0, description="Prompt tokens")
+    completion_tokens: int = Field(default=0, description="Completion tokens")
+    avg_model_latency_ms: float = Field(default=0.0, description="Average model call latency")
+    avg_tool_latency_ms: float = Field(default=0.0, description="Average tool call latency")
+    error_rate: float = Field(default=0.0, description="Error rate (0.0 to 1.0)")
+    steps: int = Field(default=0, description="Number of execution steps")
+
+
+class TraceAnalyzer:
+    """Analyzes traces and calculates metrics."""
+
+    @staticmethod
+    def analyze(trace: Trace) -> TraceMetrics:
+        """Analyze a trace and calculate metrics.
+
+        Args:
+            trace: Trace to analyze
+
+        Returns:
+            Calculated metrics
+        """
+        if not trace.events:
+            return TraceMetrics(
+                total_events=0,
+                total_duration_ms=0.0,
+                model_calls=0,
+                tool_calls=0,
+                errors=0,
+            )
+
+        # Find start and end times
+        start_time = trace.events[0].timestamp
+        end_time = trace.events[-1].timestamp
+        total_duration_ms = (end_time - start_time) * 1000
+
+        # Count events
+        model_calls = 0
+        tool_calls = 0
+        errors = 0
+        steps = 0
+
+        # Token usage
+        total_tokens = 0
+        prompt_tokens = 0
+        completion_tokens = 0
+
+        # Latency tracking
+        model_latencies: list[float] = []
+        tool_latencies: list[float] = []
+
+        # Track step start times
+        step_start_times: dict[str, float] = {}
+
+        for event in trace.events:
+            if event.type == "model_called":
+                model_calls += 1
+                # Extract token usage if available
+                if "usage" in event.data:
+                    usage = event.data["usage"]
+                    if isinstance(usage, dict):
+                        total_tokens += usage.get("total_tokens", 0)
+                        prompt_tokens += usage.get("prompt_tokens", 0)
+                        completion_tokens += usage.get("completion_tokens", 0)
+            elif event.type == "tool_called":
+                tool_calls += 1
+                # Track tool call start time
+                step_id = event.data.get("step_id", "")
+                if step_id:
+                    step_start_times[step_id] = event.timestamp
+            elif event.type == "tool_result":
+                # Calculate tool latency
+                step_id = event.data.get("step_id", "")
+                if step_id and step_id in step_start_times:
+                    latency_ms = (event.timestamp - step_start_times[step_id]) * 1000
+                    tool_latencies.append(latency_ms)
+                    del step_start_times[step_id]
+            elif event.type == "error":
+                errors += 1
+            elif event.type == "step_started":
+                steps += 1
+                step_id = event.data.get("step_id", "")
+                if step_id:
+                    step_start_times[step_id] = event.timestamp
+            elif event.type == "step_completed":
+                # Calculate step latency (could be model or tool)
+                step_id = event.data.get("step_id", "")
+                if step_id and step_id in step_start_times:
+                    latency_ms = (event.timestamp - step_start_times[step_id]) * 1000
+                    # Check if this was a model call step
+                    step_type = event.data.get("step_type", "")
+                    if step_type == "model_call":
+                        model_latencies.append(latency_ms)
+                    elif step_type == "tool_call":
+                        if latency_ms not in tool_latencies:  # Avoid double counting
+                            tool_latencies.append(latency_ms)
+                    del step_start_times[step_id]
+
+        # Calculate averages
+        avg_model_latency_ms = (
+            sum(model_latencies) / len(model_latencies) if model_latencies else 0.0
+        )
+        avg_tool_latency_ms = sum(tool_latencies) / len(tool_latencies) if tool_latencies else 0.0
+
+        # Calculate error rate
+        total_operations = model_calls + tool_calls
+        error_rate = errors / total_operations if total_operations > 0 else 0.0
+
+        return TraceMetrics(
+            total_events=len(trace.events),
+            total_duration_ms=total_duration_ms,
+            model_calls=model_calls,
+            tool_calls=tool_calls,
+            errors=errors,
+            total_tokens=total_tokens,
+            prompt_tokens=prompt_tokens,
+            completion_tokens=completion_tokens,
+            avg_model_latency_ms=avg_model_latency_ms,
+            avg_tool_latency_ms=avg_tool_latency_ms,
+            error_rate=error_rate,
+            steps=steps,
+        )
+
+    @staticmethod
+    def query(
+        trace: Trace,
+        event_type: str | None = None,
+        filter_func: Any | None = None,
+    ) -> list[TraceEvent]:
+        """Query trace events.
+
+        Args:
+            trace: Trace to query
+            event_type: Optional event type filter
+            filter_func: Optional function to filter events (takes TraceEvent, returns bool)
+
+        Returns:
+            List of matching events
+        """
+        events = trace.events
+
+        if event_type:
+            events = [e for e in events if e.type == event_type]
+
+        if filter_func:
+            events = [e for e in events if filter_func(e)]
+
+        return events
+
+    @staticmethod
+    def search(
+        trace: Trace,
+        query: str,
+        search_in_data: bool = True,
+    ) -> list[TraceEvent]:
+        """Search trace events by text.
+
+        Args:
+            trace: Trace to search
+            query: Search query (case-insensitive)
+            search_in_data: Whether to search in event data
+
+        Returns:
+            List of matching events
+        """
+        query_lower = query.lower()
+        results: list[TraceEvent] = []
+
+        for event in trace.events:
+            # Search in event type
+            if query_lower in event.type.lower():
+                results.append(event)
+                continue
+
+            # Search in event data
+            if search_in_data:
+                if _search_in_dict(event.data, query_lower):
+                    results.append(event)
+
+        return results
+
+    @staticmethod
+    def get_timeline(trace: Trace) -> list[dict[str, Any]]:
+        """Get timeline of events with relative timestamps.
+
+        Args:
+            trace: Trace to analyze
+
+        Returns:
+            List of timeline entries with relative time and duration
+        """
+        if not trace.events:
+            return []
+
+        start_time = trace.events[0].timestamp
+        timeline: list[dict[str, Any]] = []
+
+        for i, event in enumerate(trace.events):
+            relative_time_ms = (event.timestamp - start_time) * 1000
+
+            # Calculate duration if this is a completion event
+            duration_ms = 0.0
+            if event.type in ("step_completed", "tool_result", "model_called"):
+                # Look for corresponding start event
+                step_id = event.data.get("step_id", "")
+                if step_id:
+                    # Find the start event
+                    for prev_event in reversed(trace.events[:i]):
+                        if (
+                            prev_event.type in ("step_started", "tool_called", "model_called")
+                            and prev_event.data.get("step_id") == step_id
+                        ):
+                            duration_ms = (event.timestamp - prev_event.timestamp) * 1000
+                            break
+
+            timeline.append(
+                {
+                    "event": event,
+                    "relative_time_ms": relative_time_ms,
+                    "duration_ms": duration_ms,
+                    "index": i,
+                }
+            )
+
+        return timeline
+
+    @staticmethod
+    def get_step_sequence(trace: Trace) -> list[dict[str, Any]]:
+        """Get step-by-step execution sequence.
+
+        Args:
+            trace: Trace to analyze
+
+        Returns:
+            List of steps with their events
+        """
+        steps: dict[str, dict[str, Any]] = {}
+        step_order: list[str] = []
+
+        for event in trace.events:
+            step_id = event.data.get("step_id", "")
+            if not step_id:
+                continue
+
+            if step_id not in steps:
+                steps[step_id] = {
+                    "step_id": step_id,
+                    "step_type": event.data.get("step_type", ""),
+                    "events": [],
+                    "start_time": event.timestamp,
+                    "end_time": None,
+                    "duration_ms": 0.0,
+                    "error": None,
+                }
+                step_order.append(step_id)
+
+            steps[step_id]["events"].append(event)
+
+            if event.type == "step_completed":
+                steps[step_id]["end_time"] = event.timestamp
+                steps[step_id]["duration_ms"] = (
+                    event.timestamp - steps[step_id]["start_time"]
+                ) * 1000
+                if "error" in event.data:
+                    steps[step_id]["error"] = event.data["error"]
+            elif event.type == "error":
+                steps[step_id]["error"] = event.data.get("message", "Unknown error")
+
+        return [steps[step_id] for step_id in step_order]
+
+
+def _search_in_dict(data: dict[str, Any], query: str) -> bool:
+    """Recursively search for query in dictionary values.
+
+    Args:
+        data: Dictionary to search
+        query: Search query (lowercase)
+
+    Returns:
+        True if query found
+    """
+    for key, value in data.items():
+        if query in key.lower():
+            return True
+        if isinstance(value, str) and query in value.lower():
+            return True
+        if isinstance(value, dict) and _search_in_dict(value, query):
+            return True
+        if isinstance(value, list):
+            for item in value:
+                if isinstance(item, str) and query in item.lower():
+                    return True
+                if isinstance(item, dict) and _search_in_dict(item, query):
+                    return True
+    return False
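
A usage sketch for the analyzer. It assumes TraceEvent accepts type/timestamp/data keywords (the fields this module reads) and that timestamps are epoch seconds, which analyze converts to milliseconds:

import time

from routekitai.observability.analyzer import TraceAnalyzer
from routekitai.observability.trace import Trace, TraceEvent

t0 = time.time()
# Event shapes below are illustrative; field names follow how analyzer.py reads them.
events = [
    TraceEvent(type="step_started", timestamp=t0, data={"step_id": "s1", "step_type": "tool_call"}),
    TraceEvent(type="tool_called", timestamp=t0, data={"step_id": "s1"}),
    TraceEvent(type="tool_result", timestamp=t0 + 0.25, data={"step_id": "s1"}),
    TraceEvent(type="step_completed", timestamp=t0 + 0.25, data={"step_id": "s1", "step_type": "tool_call"}),
]
trace = Trace(trace_id="demo", events=events, metadata={})

metrics = TraceAnalyzer.analyze(trace)
print(metrics.tool_calls, metrics.avg_tool_latency_ms)  # 1 250.0
errors = TraceAnalyzer.query(trace, event_type="error")  # []
hits = TraceAnalyzer.search(trace, "tool")               # matches on type and data text
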
routekitai/observability/exporters/__init__.py ADDED
@@ -0,0 +1,10 @@
+"""Trace exporters for RouteKit."""
+
+# TODO: Implement trace exporters
+from routekitai.observability.exporters.jsonl import JSONLExporter
+from routekitai.observability.exporters.otel import OTELExporter
+
+__all__ = [
+    "JSONLExporter",
+    "OTELExporter",
+]
routekitai/observability/exporters/base.py ADDED
@@ -0,0 +1,30 @@
+"""Base interface for trace exporters."""
+
+from abc import ABC, abstractmethod
+
+from routekitai.observability.trace import Trace
+
+
+class TraceExporter(ABC):
+    """Abstract base class for trace exporters."""
+
+    @abstractmethod
+    async def export(self, trace: Trace) -> None:
+        """Export a trace.
+
+        Args:
+            trace: Trace to export
+        """
+        raise NotImplementedError
+
+    @abstractmethod
+    async def load(self, trace_id: str) -> Trace | None:
+        """Load a trace by ID.
+
+        Args:
+            trace_id: Trace ID to load
+
+        Returns:
+            Trace if found, None otherwise
+        """
+        raise NotImplementedError
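
The contract is small: any backend implementing async export and load works. A hypothetical in-memory exporter, convenient for tests:

from routekitai.observability.exporters.base import TraceExporter
from routekitai.observability.trace import Trace


class InMemoryExporter(TraceExporter):
    """Hypothetical exporter: keeps traces in a dict instead of persisting them."""

    def __init__(self) -> None:
        self._traces: dict[str, Trace] = {}

    async def export(self, trace: Trace) -> None:
        self._traces[trace.trace_id] = trace

    async def load(self, trace_id: str) -> Trace | None:
        return self._traces.get(trace_id)
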
routekitai/observability/exporters/jsonl.py ADDED
@@ -0,0 +1,81 @@
+"""JSONL trace exporter."""
+
+import json
+from pathlib import Path
+from typing import Any
+
+from pydantic import BaseModel, Field
+
+from routekitai.observability.exporters.base import TraceExporter
+from routekitai.observability.trace import Trace, TraceEvent
+
+
+class JSONLExporter(TraceExporter, BaseModel):
+    """Exports traces to JSONL format.
+
+    Writes one event per line to .routekit/traces/<trace_id>.jsonl
+    """
+
+    output_dir: Path = Field(..., description="Output directory for JSONL files")
+
+    def __init__(self, output_dir: Path | str | None = None, **kwargs: Any) -> None:
+        """Initialize JSONL exporter.
+
+        Args:
+            output_dir: Output directory (defaults to .routekit/traces)
+            **kwargs: Additional fields
+        """
+        if output_dir is None:
+            output_dir = Path(".routekit") / "traces"
+        if isinstance(output_dir, str):
+            output_dir = Path(output_dir)
+        super().__init__(output_dir=output_dir, **kwargs)
+        self.output_dir.mkdir(parents=True, exist_ok=True)
+
+    async def export(self, trace: Trace) -> None:
+        """Export trace to JSONL file.
+
+        Args:
+            trace: Trace to export
+        """
+        # Ensure directory exists
+        self.output_dir.mkdir(parents=True, exist_ok=True)
+        trace_file = self.output_dir / f"{trace.trace_id}.jsonl"
+        with trace_file.open("w") as f:
+            for event in trace.events:
+                # Use mode='json' to ensure all data is JSON-serializable
+                f.write(json.dumps(event.model_dump(mode="json")) + "\n")
+
+    async def load(self, trace_id: str) -> Trace | None:
+        """Load trace from JSONL file.
+
+        Args:
+            trace_id: Trace ID to load
+
+        Returns:
+            Trace if found, None otherwise
+        """
+        trace_file = self.output_dir / f"{trace_id}.jsonl"
+        if not trace_file.exists():
+            return None
+
+        events: list[TraceEvent] = []
+        with trace_file.open("r") as f:
+            for line in f:
+                line = line.strip()
+                if not line:
+                    continue
+                event_data = json.loads(line)
+                events.append(TraceEvent(**event_data))
+
+        if not events:
+            return None
+
+        # Extract metadata from run_started event if present
+        metadata = {}
+        for event in events:
+            if event.type == "run_started" and "metadata" in event.data:
+                metadata = event.data.get("metadata", {})
+                break
+
+        return Trace(trace_id=trace_id, events=events, metadata=metadata)
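
A round-trip sketch; the TraceEvent keyword fields are assumed as above, and the output path is illustrative:

import asyncio

from routekitai.observability.exporters.jsonl import JSONLExporter
from routekitai.observability.trace import Trace, TraceEvent


async def main() -> None:
    exporter = JSONLExporter(output_dir="/tmp/traces")  # omit to use .routekit/traces
    trace = Trace(
        trace_id="run-42",
        events=[TraceEvent(type="run_started", timestamp=0.0, data={"metadata": {"agent": "demo"}})],
        metadata={"agent": "demo"},
    )
    await exporter.export(trace)            # writes /tmp/traces/run-42.jsonl, one event per line
    loaded = await exporter.load("run-42")  # rebuilds events and recovers run_started metadata
    assert loaded is not None and loaded.trace_id == "run-42"


asyncio.run(main())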