PyPI - swarmkit - Versions diffs - 0.1.34__py3-none-any.whl - Mend

swarmkit 0.1.34__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (29) hide show

bridge/__init__.py +5 -0
bridge/dist/bridge.bundle.cjs +8 -0
swarmkit/__init__.py +152 -0
swarmkit/agent.py +480 -0
swarmkit/bridge.py +475 -0
swarmkit/config.py +92 -0
swarmkit/pipeline/__init__.py +59 -0
swarmkit/pipeline/pipeline.py +487 -0
swarmkit/pipeline/types.py +272 -0
swarmkit/prompts/__init__.py +126 -0
swarmkit/prompts/agent_md/judge.md +30 -0
swarmkit/prompts/agent_md/reduce.md +7 -0
swarmkit/prompts/agent_md/verify.md +33 -0
swarmkit/prompts/user/judge.md +1 -0
swarmkit/prompts/user/retry_feedback.md +9 -0
swarmkit/prompts/user/verify.md +1 -0
swarmkit/results.py +45 -0
swarmkit/retry.py +133 -0
swarmkit/schema.py +107 -0
swarmkit/swarm/__init__.py +75 -0
swarmkit/swarm/results.py +140 -0
swarmkit/swarm/swarm.py +1751 -0
swarmkit/swarm/types.py +193 -0
swarmkit/utils.py +82 -0
swarmkit-0.1.34.dist-info/METADATA +80 -0
swarmkit-0.1.34.dist-info/RECORD +29 -0
swarmkit-0.1.34.dist-info/WHEEL +5 -0
swarmkit-0.1.34.dist-info/licenses/LICENSE +24 -0
swarmkit-0.1.34.dist-info/top_level.txt +2 -0

swarmkit/__init__.py ADDED Viewed

@@ -0,0 +1,152 @@
+"""SwarmKit Python SDK - Pythonic wrapper around the TypeScript SwarmKit SDK."""
+from .agent import SwarmKit
+from .config import (
+    AgentConfig,
+    E2BProvider,
+    SandboxProvider,
+    AgentType,
+    WorkspaceMode,
+    ReasoningEffort,
+    ValidationMode,
+    SchemaOptions,
+)
+from .results import AgentResponse, ExecuteResult, OutputResult
+from .utils import read_local_dir, save_local_dir
+from .bridge import (
+    SandboxNotFoundError,
+    BridgeConnectionError,
+    BridgeBuildError,
+)
+from .retry import RetryConfig, OnItemRetryCallback, execute_with_retry
+from .swarm import (
+    Swarm,
+    SwarmConfig,
+    BestOfConfig,
+    VerifyConfig,
+    SwarmResult,
+    SwarmResultList,
+    ReduceResult,
+    BestOfResult,
+    BestOfInfo,
+    VerifyInfo,
+    IndexedMeta,
+    ReduceMeta,
+    JudgeMeta,
+    VerifyMeta,
+    VerifyDecision,
+    is_swarm_result,
+    # Callback types
+    OnCandidateCompleteCallback,
+    OnJudgeCompleteCallback,
+    OnWorkerCompleteCallback,
+    OnVerifierCompleteCallback,
+)
+from .pipeline import (
+    Pipeline,
+    TerminalPipeline,
+    MapConfig,
+    FilterConfig,
+    ReduceConfig,
+    StepResult,
+    PipelineResult,
+    PipelineEvents,
+    StepStartEvent,
+    StepCompleteEvent,
+    StepErrorEvent,
+    ItemRetryEvent,
+    WorkerCompleteEvent,
+    VerifierCompleteEvent,
+    CandidateCompleteEvent,
+    JudgeCompleteEvent,
+    EmitOption,
+)
+# Package version string (0.1.34, the same version as the wheel this module ships in).
+__version__ = '0.1.34'
+# Explicit public API of the package, grouped by area. Each entry is a name
+# imported at the top of this module from one of the submodules.
+__all__ = [
+    # Main classes
+    'SwarmKit',
+    'Swarm',
+    'Pipeline',
+    'TerminalPipeline',
+    # SwarmKit Configuration
+    'AgentConfig',
+    'E2BProvider',
+    'SandboxProvider',
+    'AgentType',
+    'WorkspaceMode',
+    'ReasoningEffort',
+    'ValidationMode',
+    'SchemaOptions',
+    # SwarmKit Results
+    'AgentResponse',
+    'ExecuteResult',  # Backward compatibility alias for AgentResponse
+    'OutputResult',
+    # Swarm Configuration
+    'SwarmConfig',
+    'BestOfConfig',
+    'VerifyConfig',
+    # Swarm Results
+    'SwarmResult',
+    'SwarmResultList',
+    'ReduceResult',
+    'BestOfResult',
+    'BestOfInfo',
+    'VerifyInfo',
+    'VerifyDecision',
+    # Swarm Metadata
+    'IndexedMeta',
+    'ReduceMeta',
+    'JudgeMeta',
+    'VerifyMeta',
+    # Swarm Helpers
+    'is_swarm_result',
+    # Swarm Callback types
+    'OnCandidateCompleteCallback',
+    'OnJudgeCompleteCallback',
+    'OnWorkerCompleteCallback',
+    'OnVerifierCompleteCallback',
+    # Pipeline Configuration
+    'MapConfig',
+    'FilterConfig',
+    'ReduceConfig',
+    # Pipeline Results
+    'StepResult',
+    'PipelineResult',
+    # Pipeline Events
+    'PipelineEvents',
+    'StepStartEvent',
+    'StepCompleteEvent',
+    'StepErrorEvent',
+    'ItemRetryEvent',
+    'WorkerCompleteEvent',
+    'VerifierCompleteEvent',
+    'CandidateCompleteEvent',
+    'JudgeCompleteEvent',
+    'EmitOption',
+    # Retry
+    'RetryConfig',
+    'OnItemRetryCallback',
+    'execute_with_retry',
+    # Utilities
+    'read_local_dir',
+    'save_local_dir',
+    # Exceptions
+    'SandboxNotFoundError',
+    'BridgeConnectionError',
+    'BridgeBuildError',
+]

swarmkit/agent.py ADDED Viewed

@@ -0,0 +1,480 @@
+"""Main SwarmKit class for Python SDK."""
+import asyncio
+import base64
+import json
+from typing import Any, Callable, Dict, List, Optional, Type, Union
+from .bridge import BridgeManager, SandboxNotFoundError
+from .config import AgentConfig, SandboxProvider, SchemaOptions, WorkspaceMode
+from .results import AgentResponse, ExecuteResult, OutputResult
+from .schema import is_pydantic_model, is_dataclass, to_json_schema, validate_and_parse
+from .utils import _encode_files_for_transport, _filter_none
+class SwarmKit:
+    """SwarmKit agent orchestrator.
+    Provides a Pythonic interface to the TypeScript SwarmKit SDK via JSON-RPC bridge.
+    Example:
+        >>> from swarmkit import SwarmKit
+        >>>
+        >>> # Minimal usage - uses SWARMKIT_API_KEY and E2B_API_KEY env vars
+        >>> async with SwarmKit() as swarmkit:
+        ...     result = await swarmkit.run(prompt='Analyze data.csv')
+        ...     output = await swarmkit.get_output_files()
+        ...     for name, content in output.files.items():
+        ...         print(f'{name}: {len(content)} bytes')
+        >>>
+        >>> # Or with explicit config
+        >>> from swarmkit import AgentConfig, E2BProvider
+        >>> swarmkit = SwarmKit(
+        ...     config=AgentConfig(type='codex', api_key='sk-...'),
+        ...     sandbox=E2BProvider(api_key='...')
+        ... )
+    """
+    def __init__(
+        self,
+        config: Optional[AgentConfig] = None,
+        sandbox: Optional[SandboxProvider] = None,
+        working_directory: str = '/home/user/workspace',
+        workspace_mode: WorkspaceMode = 'knowledge',
+        system_prompt: Optional[str] = None,
+        context: Optional[Dict[str, Union[str, bytes]]] = None,
+        files: Optional[Dict[str, Union[str, bytes]]] = None,
+        mcp_servers: Optional[Dict[str, Any]] = None,
+        secrets: Optional[Dict[str, str]] = None,
+        sandbox_id: Optional[str] = None,
+        session_tag_prefix: Optional[str] = None,
+        schema: Optional[Union[Type, Dict[str, Any]]] = None,
+        schema_options: Optional[SchemaOptions] = None,
+    ):
+        """Record the settings for a SwarmKit agent.
+        The constructor only stores its arguments, converts the schema and
+        creates the bridge manager; the bridge is started later by
+        ``_ensure_initialized``.
+        Args:
+            config: Agent configuration (optional - defaults to SWARMKIT_API_KEY env var with 'claude' type)
+            sandbox: Sandbox provider (optional - defaults to E2B with E2B_API_KEY env var)
+            working_directory: Working directory inside the sandbox (default: /home/user/workspace)
+            workspace_mode: 'knowledge' (creates output/context/scripts/temp folders + default prompt)
+                          or 'swe' (clean workspace for cloned repos) (default: 'knowledge')
+            system_prompt: Custom system prompt (appended to the default in 'knowledge' mode, sole prompt in 'swe' mode)
+            context: Files uploaded to the context/ folder on first run - { "filename.txt": "content" }
+            files: Files uploaded to the working directory on first run - { "scripts/run.sh": "content" }
+            mcp_servers: MCP server configurations
+            secrets: Environment variables for the sandbox
+            sandbox_id: ID of an existing sandbox to reconnect to
+            session_tag_prefix: Optional semantic label for observability log files (e.g., 'experiment-7')
+            schema: Structured-output schema - Pydantic model, dataclass, or JSON Schema dict
+            schema_options: Validation options (mode: 'strict' or 'loose', default: 'loose')
+        """
+        # Agent and sandbox selection
+        self.config = config
+        self.sandbox = sandbox
+        # Workspace layout and prompt
+        self.working_directory = working_directory
+        self.workspace_mode = workspace_mode
+        self.system_prompt = system_prompt
+        # Initial uploads and environment
+        self.context = context
+        self.files = files
+        self.mcp_servers = mcp_servers
+        self.secrets = secrets
+        # Session identity
+        self.sandbox_id = sandbox_id
+        self.session_tag_prefix = session_tag_prefix
+        # Fall back to default validation options when none (or a falsy value) is given
+        if not schema_options:
+            schema_options = SchemaOptions()
+        self.schema_options = schema_options
+        # Keep the caller's schema object and its JSON Schema form side by side
+        self._schema = schema
+        self._schema_json = to_json_schema(schema)
+        # Bridge plus the state guarding one-time initialization
+        self.bridge = BridgeManager()
+        self._initialized = False
+        self._init_lock = asyncio.Lock()
+    async def _ensure_initialized(self):
+        """Start the bridge and send the 'initialize' RPC unless already done.
+        The whole check-and-initialize sequence runs under ``_init_lock``;
+        once ``_initialized`` is set, later calls return without doing work.
+        """
+        async with self._init_lock:
+            if self._initialized:
+                return
+            await self.bridge.start()
+            agent = self.config
+            provider = self.sandbox
+            # Agent config (optional - TS SDK resolves from SWARMKIT_API_KEY)
+            agent_fields = (
+                ('agent_type', 'type'),
+                ('api_key', 'api_key'),
+                ('model', 'model'),
+                ('reasoning_effort', 'reasoning_effort'),
+                ('betas', 'betas'),
+            )
+            payload: Dict[str, Any] = {
+                rpc_key: (getattr(agent, attr) if agent else None)
+                for rpc_key, attr in agent_fields
+            }
+            # Sandbox (optional - TS SDK resolves from E2B_API_KEY)
+            if provider:
+                payload['sandbox_provider'] = {'type': provider.type, 'config': provider.config}
+            else:
+                payload['sandbox_provider'] = None
+            # Other settings
+            payload['working_directory'] = self.working_directory
+            payload['workspace_mode'] = self.workspace_mode
+            payload['system_prompt'] = self.system_prompt
+            payload['context'] = _encode_files_for_transport(self.context) if self.context else None
+            payload['files'] = _encode_files_for_transport(self.files) if self.files else None
+            payload['mcp_servers'] = self.mcp_servers
+            payload['secrets'] = self.secrets
+            payload['sandbox_id'] = self.sandbox_id
+            payload['session_tag_prefix'] = self.session_tag_prefix
+            payload['schema'] = self._schema_json
+            # Validation options are only sent when a (truthy) JSON schema exists
+            payload['schema_options'] = {'mode': self.schema_options.mode} if self._schema_json else None
+            # Always forward events
+            payload['forward_stdout'] = True
+            payload['forward_stderr'] = True
+            payload['forward_content'] = True
+            # None entries are dropped so the TS SDK can resolve its own defaults
+            await self.bridge.call('initialize', _filter_none(payload))
+            self._initialized = True
+    def on(self, event_type: str, callback: Callable[[Any], None]):
+        """Subscribe a callback to an event stream; registration is delegated to the bridge.
+        Args:
+            event_type: One of 'stdout', 'stderr' or 'content'
+            callback: Function called with the event payload
+                      (str for stdout/stderr, dict for content)
+        Example:
+            >>> swarmkit.on('stdout', lambda data: print(data, end=''))
+            >>> swarmkit.on('stderr', lambda data: print(f'[ERR] {data}', end=''))
+            >>> swarmkit.on('content', lambda event: print(event['update']['sessionUpdate']))
+        """
+        bridge = self.bridge
+        bridge.on(event_type, callback)
+    def _get_rpc_timeout_s(self, timeout_ms: Optional[int]) -> float:
+        """Compute an RPC timeout (seconds) aligned with the sandbox execution timeout.
+        The sandbox timeout is taken from, in order: the explicit ``timeout_ms``
+        argument, the sandbox provider's ``timeout_ms`` attribute, and finally a
+        one-hour default. A missing attribute and an attribute set to None are
+        both treated as "not configured".
+        Args:
+            timeout_ms: Per-call timeout in milliseconds, or None to derive it
+        Returns:
+            Timeout in seconds, including a 30-second grace period
+        """
+        default_timeout_ms = 3600000  # one hour
+        if timeout_ms is None and self.sandbox:
+            # getattr alone is not enough: the attribute can exist and still be None,
+            # which would make the division below raise TypeError.
+            timeout_ms = getattr(self.sandbox, "timeout_ms", None)
+        if timeout_ms is None:
+            timeout_ms = default_timeout_ms
+        # Add small grace to allow bridge/agent cleanup after sandbox timeout.
+        return timeout_ms / 1000.0 + 30.0
+    async def run(
+        self,
+        prompt: str,
+        timeout_ms: Optional[int] = None,
+        background: bool = False,
+    ) -> AgentResponse:
+        """Hand a task to the agent and return the outcome of the 'run' RPC.
+        ``timeout_ms`` and ``background`` are only included in the request
+        when they are set (not None / truthy respectively).
+        Args:
+            prompt: Task description
+            timeout_ms: Optional timeout in milliseconds (default: 1 hour)
+            background: If True, return immediately while the agent keeps
+                       running (default: False)
+        Returns:
+            AgentResponse with sandbox_id, exit_code, stdout, stderr
+        Example:
+            >>> result = await swarmkit.run(prompt='Analyze data and create report', timeout_ms=600000)
+            >>> # Background execution
+            >>> result = await swarmkit.run(prompt='Long task', background=True)
+        """
+        await self._ensure_initialized()
+        rpc_args: Dict[str, Any] = dict(prompt=prompt)
+        if timeout_ms is not None:
+            rpc_args.update(timeout_ms=timeout_ms)
+        if background:
+            rpc_args.update(background=background)
+        rpc_timeout = self._get_rpc_timeout_s(timeout_ms)
+        result = await self.bridge.call('run', rpc_args, timeout_s=rpc_timeout)
+        # Copy exactly the four response fields AgentResponse is built from
+        fields = ('sandbox_id', 'exit_code', 'stdout', 'stderr')
+        return AgentResponse(**{field: result[field] for field in fields})
+    async def execute_command(
+        self,
+        command: str,
+        timeout_ms: Optional[int] = None,
+        background: bool = False,
+    ) -> AgentResponse:
+        """Execute direct shell command.
+        Like ``run``, an unset ``timeout_ms`` is left out of the request
+        instead of being sent as null.
+        Args:
+            command: Shell command to execute
+            timeout_ms: Optional timeout in milliseconds (default: 1 hour)
+            background: Run in background (default: False)
+        Returns:
+            AgentResponse with sandbox_id, exit_code, stdout, stderr
+        Example:
+            >>> result = await swarmkit.execute_command(command='python script.py')
+        """
+        await self._ensure_initialized()
+        # Drop None values (same helper the initialize call uses) so the
+        # receiving side sees a missing key rather than an explicit null.
+        params = _filter_none({
+            'command': command,
+            'timeout_ms': timeout_ms,
+            'background': background,
+        })
+        response = await self.bridge.call(
+            'execute_command',
+            params,
+            timeout_s=self._get_rpc_timeout_s(timeout_ms),
+        )
+        return AgentResponse(
+            sandbox_id=response['sandbox_id'],
+            exit_code=response['exit_code'],
+            stdout=response['stdout'],
+            stderr=response['stderr'],
+        )
+    async def upload_context(
+        self,
+        files: Dict[str, Union[str, bytes]],
+    ):
+        """Send files to the context/ folder right away via the 'upload_context' RPC.
+        Args:
+            files: Mapping of filename to content - { "filename.txt": "content", "data.json": jsonStr }
+        Example:
+            >>> await swarmkit.upload_context({
+            ...     'spec.json': json.dumps(spec),
+            ...     'readme.txt': 'Project documentation...',
+            ... })
+        """
+        await self._ensure_initialized()
+        # Contents are put into transport form before crossing the bridge
+        encoded = _encode_files_for_transport(files)
+        await self.bridge.call('upload_context', {'files': encoded})
+    async def upload_files(
+        self,
+        files: Dict[str, Union[str, bytes]],
+    ):
+        """Send files to the working directory right away via the 'upload_files' RPC.
+        Args:
+            files: Mapping of path to content - { "scripts/run.sh": "#!/bin/bash...", "data/input.csv": csvData }
+        Example:
+            >>> await swarmkit.upload_files({
+            ...     'scripts/setup.sh': '#!/bin/bash\\necho hello',
+            ...     'temp/cache.json': json.dumps(cache),
+            ... })
+        """
+        await self._ensure_initialized()
+        # Contents are put into transport form before crossing the bridge
+        encoded = _encode_files_for_transport(files)
+        await self.bridge.call('upload_files', {'files': encoded})
+    async def get_output_files(self, recursive: bool = False) -> OutputResult:
+        """Get output files with optional schema validation result.
+        Returns files modified after the last run() call, along with schema
+        validation results if a schema was configured.
+        Matches TypeScript SDK's getOutputFiles() for exact parity.
+        Evidence: sdk-ts/src/types.ts OutputResult<T> interface
+        For Pydantic/dataclass schemas, any failure to decode, parse or
+        validate result.json is reported through ``error``/``raw_data``
+        rather than raised.
+        Args:
+            recursive: Include files in subdirectories (default: False)
+        Returns:
+            OutputResult containing:
+                - files: Dict mapping filename/path to content (str for text, bytes for binary)
+                - data: Parsed and validated result.json data (None if no schema or validation failed)
+                - error: Validation or parse error message, if any
+                - raw_data: Raw result.json string when parse or validation failed
+        Example:
+            >>> output = await swarmkit.get_output_files()
+            >>> for name, content in output.files.items():
+            ...     with open(f'./downloads/{name}', 'wb') as f:
+            ...         f.write(content if isinstance(content, bytes) else content.encode())
+            >>> if output.data:
+            ...     print(f"Validated data: {output.data}")
+            >>> if output.error:
+            ...     print(f"Validation error: {output.error}")
+        """
+        await self._ensure_initialized()
+        response = await self.bridge.call('get_output_files', {'recursive': recursive})
+        # Decode files from transport encoding; a missing or null 'files' entry means no files
+        files: Dict[str, Union[str, bytes]] = {}
+        for name, file_data in (response.get('files') or {}).items():
+            content = file_data['content']
+            if file_data.get('encoding') == 'base64':
+                content = base64.b64decode(content)
+            files[name] = content
+        data = None
+        error = None
+        raw_data = None
+        # CASE 1: Pydantic model or dataclass → Native Python validation
+        if is_pydantic_model(self._schema) or is_dataclass(self._schema):
+            raw_json = files.get('result.json')
+            if raw_json is None:
+                error = "Schema provided but agent did not create output/result.json"
+            else:
+                try:
+                    # Decoding happens inside the try so invalid UTF-8 becomes a
+                    # reported error instead of an uncaught UnicodeDecodeError.
+                    if isinstance(raw_json, bytes):
+                        raw_json = raw_json.decode('utf-8')
+                    strict = self.schema_options.mode == 'strict'
+                    data = validate_and_parse(raw_json, self._schema, strict=strict)
+                except Exception as e:
+                    error = f"Schema validation failed: {e}"
+                    # Still bytes only if the decode itself failed; keep raw_data a string
+                    if isinstance(raw_json, bytes):
+                        raw_json = raw_json.decode('utf-8', errors='replace')
+                    raw_data = raw_json
+        # CASE 2: JSON Schema dict → Use TS validation (backward compatible)
+        elif self._schema_json is not None:
+            data = response.get('data')
+            error = response.get('error')
+            raw_data = response.get('raw_data')
+        # CASE 3: No schema → Just return files (data stays None)
+        return OutputResult(
+            files=files,
+            data=data,
+            error=error,
+            raw_data=raw_data,
+        )
+    async def get_session(self) -> Optional[str]:
+        """Return the sandbox ID so the sandbox can be reused later.
+        Initializes the agent first if that has not happened yet, then
+        relays the result of the 'get_session' RPC.
+        Returns:
+            Sandbox ID as reported by the bridge (may be None)
+        Example:
+            >>> sandbox_id = await swarmkit.get_session()
+            >>> print(f'Sandbox ID: {sandbox_id}')
+        """
+        await self._ensure_initialized()
+        sandbox_id = await self.bridge.call('get_session')
+        return sandbox_id
+    async def set_session(self, session_id: str):
+        """Point this client at a different sandbox via the 'set_session' RPC.
+        Args:
+            session_id: ID of the sandbox to connect to
+        Example:
+            >>> await swarmkit.set_session('existing-sandbox-id')
+        """
+        await self._ensure_initialized()
+        rpc_args = {'session_id': session_id}
+        await self.bridge.call('set_session', rpc_args)
+    async def pause(self):
+        """Issue the 'pause' RPC: suspend the sandbox to save costs while keeping its state.
+        Example:
+            >>> await swarmkit.pause()
+        """
+        await self._ensure_initialized()
+        bridge = self.bridge
+        await bridge.call('pause')
+    async def resume(self):
+        """Issue the 'resume' RPC to wake a paused sandbox.
+        Example:
+            >>> await swarmkit.resume()
+        """
+        await self._ensure_initialized()
+        bridge = self.bridge
+        await bridge.call('resume')
+    async def kill(self):
+        """Send the 'kill' RPC, then stop the bridge and mark the client uninitialized.
+        Initialization is ensured first, so calling this on a client that was
+        never used starts the bridge before shutting it down again.
+        Example:
+            >>> await swarmkit.kill()
+        """
+        await self._ensure_initialized()
+        bridge = self.bridge
+        try:
+            await bridge.call('kill')
+        finally:
+            # Runs even when the RPC raises (e.g., sandbox already gone);
+            # the RPC error still propagates afterwards.
+            await bridge.stop()
+            self._initialized = False
+    async def get_host(self, port: int) -> str:
+        """Look up the public URL for a sandbox port via the 'get_host' RPC.
+        Args:
+            port: Port number to expose
+        Returns:
+            The 'url' field of the RPC response
+        Example:
+            >>> url = await swarmkit.get_host(8000)
+            >>> print(f'Server available at: {url}')
+        """
+        await self._ensure_initialized()
+        rpc_args = {'port': port}
+        reply = await self.bridge.call('get_host', rpc_args)
+        return reply['url']
+    async def get_session_tag(self) -> Optional[str]:
+        """Return the observability session tag.
+        This is the generated tag (e.g., 'my-prefix-a3f8b2c1') used for the
+        log file in ~/.swarmkit/observability/sessions/. The agent is
+        initialized first if needed.
+        Returns:
+            Session tag as reported by the bridge (may be None)
+        Example:
+            >>> tag = await swarmkit.get_session_tag()
+            >>> print(f'Log file tag: {tag}')
+            'experiment-7-a3f8b2c1'
+        """
+        await self._ensure_initialized()
+        tag = await self.bridge.call('get_session_tag')
+        return tag
+    async def get_session_timestamp(self) -> Optional[str]:
+        """Return the session start timestamp (ISO format).
+        The agent is initialized first if needed; the value comes from the
+        'get_session_timestamp' RPC.
+        Returns:
+            ISO timestamp of session creation as reported by the bridge (may be None)
+        Example:
+            >>> timestamp = await swarmkit.get_session_timestamp()
+            >>> print(f'Session started: {timestamp}')
+            '2025-01-15T10:30:45.123Z'
+        """
+        await self._ensure_initialized()
+        started_at = await self.bridge.call('get_session_timestamp')
+        return started_at
+    async def __aenter__(self):
+        """Async context-manager entry: initialize and return this instance.
+        If initialization raises, the bridge is stopped before the exception
+        is re-raised.
+        """
+        try:
+            await self._ensure_initialized()
+        except Exception:
+            # Do not leave the bridge process behind when startup fails
+            await self.bridge.stop()
+            raise
+        return self
+    async def __aexit__(self, exc_type, exc_val, exc_tb):
+        """Async context-manager exit: kill the sandbox on a best-effort basis.
+        An exception raised by ``kill()`` is reported as a RuntimeWarning
+        instead of being raised. The method returns None, so an exception from
+        the ``async with`` body still propagates.
+        """
+        import warnings
+        try:
+            await self.kill()
+        except Exception as cleanup_error:
+            warnings.warn(f"Error during cleanup: {cleanup_error}", RuntimeWarning)