fleet-python 0.2.66b2__py3-none-any.whl → 0.2.105__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- examples/export_tasks.py +16 -5
- examples/export_tasks_filtered.py +245 -0
- examples/fetch_tasks.py +230 -0
- examples/import_tasks.py +140 -8
- examples/iterate_verifiers.py +725 -0
- fleet/__init__.py +128 -5
- fleet/_async/__init__.py +27 -3
- fleet/_async/base.py +24 -9
- fleet/_async/client.py +938 -41
- fleet/_async/env/client.py +60 -3
- fleet/_async/instance/client.py +52 -7
- fleet/_async/models.py +15 -0
- fleet/_async/resources/api.py +200 -0
- fleet/_async/resources/sqlite.py +1801 -46
- fleet/_async/tasks.py +122 -25
- fleet/_async/verifiers/bundler.py +22 -21
- fleet/_async/verifiers/verifier.py +25 -19
- fleet/agent/__init__.py +32 -0
- fleet/agent/gemini_cua/Dockerfile +45 -0
- fleet/agent/gemini_cua/__init__.py +10 -0
- fleet/agent/gemini_cua/agent.py +759 -0
- fleet/agent/gemini_cua/mcp/main.py +108 -0
- fleet/agent/gemini_cua/mcp_server/__init__.py +5 -0
- fleet/agent/gemini_cua/mcp_server/main.py +105 -0
- fleet/agent/gemini_cua/mcp_server/tools.py +178 -0
- fleet/agent/gemini_cua/requirements.txt +5 -0
- fleet/agent/gemini_cua/start.sh +30 -0
- fleet/agent/orchestrator.py +854 -0
- fleet/agent/types.py +49 -0
- fleet/agent/utils.py +34 -0
- fleet/base.py +34 -9
- fleet/cli.py +1061 -0
- fleet/client.py +1060 -48
- fleet/config.py +1 -1
- fleet/env/__init__.py +16 -0
- fleet/env/client.py +60 -3
- fleet/eval/__init__.py +15 -0
- fleet/eval/uploader.py +231 -0
- fleet/exceptions.py +8 -0
- fleet/instance/client.py +53 -8
- fleet/instance/models.py +1 -0
- fleet/models.py +303 -0
- fleet/proxy/__init__.py +25 -0
- fleet/proxy/proxy.py +453 -0
- fleet/proxy/whitelist.py +244 -0
- fleet/resources/api.py +200 -0
- fleet/resources/sqlite.py +1845 -46
- fleet/tasks.py +113 -20
- fleet/utils/__init__.py +7 -0
- fleet/utils/http_logging.py +178 -0
- fleet/utils/logging.py +13 -0
- fleet/utils/playwright.py +440 -0
- fleet/verifiers/bundler.py +22 -21
- fleet/verifiers/db.py +985 -1
- fleet/verifiers/decorator.py +1 -1
- fleet/verifiers/verifier.py +25 -19
- {fleet_python-0.2.66b2.dist-info → fleet_python-0.2.105.dist-info}/METADATA +28 -1
- fleet_python-0.2.105.dist-info/RECORD +115 -0
- {fleet_python-0.2.66b2.dist-info → fleet_python-0.2.105.dist-info}/WHEEL +1 -1
- fleet_python-0.2.105.dist-info/entry_points.txt +2 -0
- tests/test_app_method.py +85 -0
- tests/test_expect_exactly.py +4148 -0
- tests/test_expect_only.py +2593 -0
- tests/test_instance_dispatch.py +607 -0
- tests/test_sqlite_resource_dual_mode.py +263 -0
- tests/test_sqlite_shared_memory_behavior.py +117 -0
- fleet_python-0.2.66b2.dist-info/RECORD +0 -81
- tests/test_verifier_security.py +0 -427
- {fleet_python-0.2.66b2.dist-info → fleet_python-0.2.105.dist-info}/licenses/LICENSE +0 -0
- {fleet_python-0.2.66b2.dist-info → fleet_python-0.2.105.dist-info}/top_level.txt +0 -0
fleet/_async/client.py
CHANGED
@@ -17,11 +17,17 @@
 import asyncio
 import base64
 import cloudpickle
+import dataclasses
 import httpx
 import json
 import logging
 import os
-from
+from datetime import date, datetime
+from decimal import Decimal
+from enum import Enum
+from pathlib import Path
+from typing import List, Optional, Dict, Any, TYPE_CHECKING, Union
+from uuid import UUID
 
 from .base import EnvironmentBase, AsyncWrapper
 from ..models import (
@@ -35,18 +41,125 @@ from ..models import (
     TaskRequest,
     TaskResponse,
     TaskUpdateRequest,
+    Run,
+    HeartbeatResponse,
+    SessionIngestRequest,
+    SessionIngestMessage,
+    SessionIngestResponse,
+    SessionStatus,
+    JobSessionsResponse,
+    SessionTranscriptResponse,
 )
 from .tasks import Task
 
 if TYPE_CHECKING:
     from .verifiers import AsyncVerifierFunction
 
+
+def _json_default(x: Any) -> Any:
+    """Default JSON serializer for non-native types."""
+    if isinstance(x, (datetime, date)):
+        return x.isoformat()
+    if isinstance(x, (UUID, Path)):
+        return str(x)
+    if isinstance(x, Decimal):
+        return float(x)
+    if isinstance(x, Enum):
+        return x.value
+    if isinstance(x, bytes):
+        return base64.b64encode(x).decode("utf-8")
+    if isinstance(x, set):
+        return list(x)
+    if dataclasses.is_dataclass(x) and not isinstance(x, type):
+        return dataclasses.asdict(x)
+    # Handle objects with __dict__ (generic objects)
+    if hasattr(x, "__dict__"):
+        return x.__dict__
+    raise TypeError(f"Not JSON serializable: {type(x)}")
+
+
+def _to_dict(obj: Any) -> Any:
+    """Convert any object to a JSON-serializable dict/value.
+
+    Handles:
+    - Pydantic v2 models (model_dump)
+    - Pydantic v1 models (.dict())
+    - dataclasses (asdict)
+    - TypedDict (just dict at runtime)
+    - Objects with __dict__
+    - Primitives pass through
+    """
+    if obj is None:
+        return None
+
+    # Pydantic v2
+    if hasattr(obj, "model_dump"):
+        return obj.model_dump()
+
+    # Pydantic v1
+    if hasattr(obj, "dict") and callable(obj.dict):
+        return obj.dict()
+
+    # dataclass
+    if dataclasses.is_dataclass(obj) and not isinstance(obj, type):
+        return dataclasses.asdict(obj)
+
+    # Already a dict or list - recursively convert
+    if isinstance(obj, dict):
+        return {k: _to_dict(v) for k, v in obj.items()}
+    if isinstance(obj, list):
+        return [_to_dict(v) for v in obj]
+
+    # Primitives
+    if isinstance(obj, (str, int, float, bool, type(None))):
+        return obj
+
+    # bytes -> base64
+    if isinstance(obj, bytes):
+        return base64.b64encode(obj).decode("utf-8")
+
+    # datetime/date
+    if isinstance(obj, (datetime, date)):
+        return obj.isoformat()
+
+    # UUID, Path
+    if isinstance(obj, (UUID, Path)):
+        return str(obj)
+
+    # Enum
+    if isinstance(obj, Enum):
+        return obj.value
+
+    # Decimal
+    if isinstance(obj, Decimal):
+        return float(obj)
+
+    # set
+    if isinstance(obj, set):
+        return list(obj)
+
+    # Generic object with __dict__
+    if hasattr(obj, "__dict__"):
+        return {k: _to_dict(v) for k, v in obj.__dict__.items() if not k.startswith("_")}
+
+    # Fallback - try to convert, or return string representation
+    try:
+        json.dumps(obj)
+        return obj
+    except (TypeError, ValueError):
+        return str(obj)
+
 from .instance import (
     AsyncInstanceClient,
     ResetRequest,
     ResetResponse,
     ExecuteFunctionResponse,
 )
+from ..instance.models import (
+    Resource as ResourceModel,
+    ResourceType,
+    ResourceMode,
+)
 from ..config import (
     DEFAULT_MAX_RETRIES,
     DEFAULT_TIMEOUT,
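The two helpers above exist so arbitrary agent-side objects (Pydantic models, dataclasses, UUIDs, datetimes, bytes) can be shipped as JSON. A minimal sketch of how _json_default plugs into json.dumps, mirroring the _ingest_raw call later in this diff (illustrative only; the Step dataclass is made up for the example):

    import json
    from dataclasses import dataclass
    from datetime import datetime

    @dataclass
    class Step:
        action: str
        at: datetime

    # Non-native values fall through to _json_default and come back JSON-safe:
    # the dataclass becomes a dict, the nested datetime an ISO-8601 string.
    payload = {"history": [Step("click", datetime.now())]}
    clean = json.loads(json.dumps(payload, default=_json_default))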
@@ -59,10 +172,171 @@ from .resources.base import Resource
 from .resources.sqlite import AsyncSQLiteResource
 from .resources.browser import AsyncBrowserResource
 from .resources.mcp import AsyncMCPResource
+from .resources.api import AsyncAPIResource
 
 logger = logging.getLogger(__name__)
 
 
+class AsyncSession:
+    """A session for logging agent interactions to Fleet.
+
+    This provides a simple interface for streaming messages during an agent run.
+    Messages are sent one-by-one as they happen.
+
+    Usage:
+        session = await fleet.session_async(
+            model="anthropic/claude-sonnet-4",
+            task_key="my_task",
+            instance_id=env.instance_id,
+        )
+
+        # Log messages as they happen
+        await session.log(history, response)
+
+        # Complete when done
+        await session.complete()  # or session.fail()
+    """
+
+    def __init__(
+        self,
+        client: "AsyncFleet",
+        session_id: Optional[str] = None,
+        job_id: Optional[str] = None,
+        config: Optional[Any] = None,
+        model: Optional[str] = None,
+        task_key: Optional[str] = None,
+        instance_id: Optional[str] = None,
+    ):
+        self.session_id = session_id
+        self.job_id = job_id
+        self.config = config
+        self.model = model
+        self.task_key = task_key
+        self.instance_id = instance_id
+        self._client = client
+        self._message_count = 0
+        self._logged_count = 0  # Track how many messages from history have been logged
+        self._config_sent = False  # Only send config/model/task_key/instance_id on first log
+
+    async def log(self, history: List[Any], response: Any) -> SessionIngestResponse:
+        """Log an LLM call to the session.
+
+        Pass the input history and the model response. The session tracks what's
+        already been logged and only sends new messages. Objects are automatically
+        serialized to JSON (supports Pydantic, dataclasses, TypedDict, etc.).
+
+        Example:
+            response = model.generate(history)
+            await session.log(history, response.content)
+
+        Args:
+            history: The input messages sent to the model
+            response: The model's response (any serializable object)
+
+        Returns:
+            SessionIngestResponse with updated message count
+        """
+        # Collect new history messages since last call
+        new_history = history[self._logged_count:]
+
+        # Update tracked count to include the response we're about to send
+        # This prevents the response from being sent again as "new history" in the next call
+        self._logged_count = len(history) + (1 if response is not None else 0)
+
+        # Build the payload - serialize history + response to JSON
+        payload: Dict[str, Any] = {
+            "history": [_to_dict(msg) for msg in new_history],
+            "response": _to_dict(response),
+        }
+        if self.session_id:
+            payload["session_id"] = self.session_id
+        if self.job_id:
+            payload["job_id"] = self.job_id
+        # Include config, model, task_key, instance_id on first log only
+        if not self._config_sent:
+            if self.config is not None:
+                payload["config"] = _to_dict(self.config)
+            if self.model is not None:
+                payload["model"] = self.model
+            if self.task_key is not None:
+                payload["task_key"] = self.task_key
+            if self.instance_id is not None:
+                payload["instance_id"] = self.instance_id
+            self._config_sent = True
+
+        if not new_history and response is None:
+            return SessionIngestResponse(
+                success=True,
+                session_id=self.session_id or "",
+                message_count=self._message_count,
+                created_new_session=False,
+            )
+
+        result = await self._client._ingest_raw(payload=payload)
+        self._message_count = result.message_count
+        # Update session_id if this was the first log (new session created)
+        if not self.session_id and result.session_id:
+            self.session_id = result.session_id
+        return result
+
+    async def complete(
+        self,
+        verifier_execution_id: Optional[str] = None,
+    ) -> SessionIngestResponse:
+        """Mark the session as completed successfully.
+
+        Args:
+            verifier_execution_id: Optional ID of the verifier execution record
+
+        Returns:
+            SessionIngestResponse with final state
+        """
+        from datetime import datetime
+
+        payload: Dict[str, Any] = {
+            "session_id": self.session_id,
+            "status": "completed",
+            "ended_at": datetime.now().isoformat(),
+        }
+        if verifier_execution_id:
+            payload["verifier_execution_id"] = verifier_execution_id
+
+        response = await self._client._ingest_raw(payload)
+        self._message_count = response.message_count
+        return response
+
+    async def fail(
+        self,
+        verifier_execution_id: Optional[str] = None,
+    ) -> SessionIngestResponse:
+        """Mark the session as failed.
+
+        Args:
+            verifier_execution_id: Optional ID of the verifier execution record
+
+        Returns:
+            SessionIngestResponse with final state
+        """
+        from datetime import datetime
+
+        payload: Dict[str, Any] = {
+            "session_id": self.session_id,
+            "status": "failed",
+            "ended_at": datetime.now().isoformat(),
+        }
+        if verifier_execution_id:
+            payload["verifier_execution_id"] = verifier_execution_id
+
+        response = await self._client._ingest_raw(payload)
+        self._message_count = response.message_count
+        return response
+
+    @property
+    def message_count(self) -> int:
+        """Get the current message count."""
+        return self._message_count
+
+
 class AsyncEnv(EnvironmentBase):
     def __init__(self, client: Optional[AsyncWrapper], **kwargs):
         super().__init__(**kwargs)
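Note that AsyncSession.log() is incremental: it slices history[self._logged_count:], so passing the full, growing history on every call only uploads the turns that are new since the previous call. A hedged sketch of an agent loop built on that behavior (method names taken from this diff; call_model, task, env, and max_turns are placeholders):

    history = [{"role": "user", "content": task.prompt}]
    session = fleet.start_session(model="gpt-4", task_key=task.key, instance_id=env.instance_id)
    for _ in range(max_turns):
        response = await call_model(history)  # placeholder for your own LLM call
        await session.log(history, response)  # only the new messages are sent
        history.append({"role": "assistant", "content": response})
    await session.complete()  # or session.fail()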
@@ -112,6 +386,29 @@ class AsyncEnv(EnvironmentBase):
     def browser(self, name: str = "cdp") -> AsyncBrowserResource:
         return self.instance.browser(name)
 
+    def api(self, name: str = "api") -> AsyncAPIResource:
+        """Get an API resource for making HTTP requests to the app's API.
+
+        Args:
+            name: Name for the API resource (default: "api")
+
+        Returns:
+            AsyncAPIResource for making HTTP requests
+        """
+        # Use urls.api if available, otherwise fall back to urls.root + "/raw"
+        if self.urls and self.urls.api:
+            base_url = self.urls.api
+        elif self.urls and self.urls.root:
+            base_url = f"{self.urls.root.rstrip('/')}/raw"
+        elif self._manager_url_override and self._manager_url_override != "local://":
+            # URL mode: strip /api/v1/env suffix to get root URL
+            base_url = self._manager_url_override.rstrip('/')
+            if base_url.endswith('/api/v1/env'):
+                base_url = base_url[:-len('/api/v1/env')]
+        else:
+            raise ValueError("No API URL configured for this environment")
+        return self.instance.api(name, base_url)
+
     @property
     def mcp(self) -> AsyncMCPResource:
         mcp_url = f"{self.urls.root}mcp"
@@ -126,6 +423,23 @@ class AsyncEnv(EnvironmentBase):
     async def close(self) -> InstanceResponse:
         return await _delete_instance(self._load_client, self.instance_id)
 
+    async def heartbeat(self) -> HeartbeatResponse:
+        """Send heartbeat to keep instance alive (if heartbeat monitoring is enabled).
+
+        Returns:
+            HeartbeatResponse containing heartbeat status and deadline information
+        """
+        body = {}
+        if self.heartbeat_region:
+            body["region"] = self.heartbeat_region
+
+        response = await self._load_client.request(
+            "POST",
+            f"/v1/env/instances/{self.instance_id}/heartbeat",
+            json=body
+        )
+        return HeartbeatResponse(**response.json())
+
     async def verify(self, validator: ValidatorType) -> ExecuteFunctionResponse:
         return await self.instance.verify(validator)
 
@@ -148,6 +462,7 @@ class AsyncEnv(EnvironmentBase):
         kwargs: dict,
         timeout: Optional[int] = 30,
         needs_upload: bool = True,
+        verifier_runtime_version: Optional[str] = None,
     ) -> VerifiersExecuteResponse:
         return await _execute_verifier_remote(
             self._load_client,
@@ -160,6 +475,7 @@ class AsyncEnv(EnvironmentBase):
             kwargs,
             timeout,
             needs_upload,
+            verifier_runtime_version,
         )
 
     def __getstate__(self):
@@ -212,6 +528,8 @@ class AsyncFleet:
         env_variables: Optional[Dict[str, Any]] = None,
         image_type: Optional[str] = None,
         ttl_seconds: Optional[int] = None,
+        run_id: Optional[str] = None,
+        heartbeat_interval: Optional[int] = None,
     ) -> AsyncEnv:
         if ":" in env_key:
             env_key_part, env_version = env_key.split(":", 1)
@@ -247,6 +565,8 @@ class AsyncFleet:
             image_type=image_type,
             created_from="sdk",
             ttl_seconds=ttl_seconds,
+            run_id=run_id,
+            heartbeat_interval=heartbeat_interval,
         )
 
         # Only use region-specific base URL if no custom base URL is set
@@ -269,13 +589,17 @@ class AsyncFleet:
         return await self.make(env_key=f"{task.env_id}:{task.version}")
 
     async def instances(
-        self, status: Optional[str] = None, region: Optional[str] = None
+        self, status: Optional[str] = None, region: Optional[str] = None, run_id: Optional[str] = None, profile_id: Optional[str] = None
     ) -> List[AsyncEnv]:
         params = {}
         if status:
             params["status"] = status
         if region:
             params["region"] = region
+        if run_id:
+            params["run_id"] = run_id
+        if profile_id:
+            params["profile_id"] = profile_id
 
         response = await self.client.request("GET", "/v1/env/instances", params=params)
         return [
@@ -283,11 +607,163 @@ class AsyncFleet:
             for instance_data in response.json()
         ]
 
-    async def instance(self, instance_id: str) -> AsyncEnv:
-
-
-
-
+    async def instance(self, instance_id: Union[str, Dict[str, str]]) -> AsyncEnv:
+        """Create or connect to an environment instance.
+
+        Supports three modes based on input type:
+        1. dict: Local filesystem mode - {"current": "./data.db", "seed": "./seed.db"}
+        2. str starting with http:// or https://: Localhost/URL mode
+        3. str (other): Remote cloud instance mode
+
+        Args:
+            instance_id: Instance identifier (str), URL (str starting with http://),
+                or local db mapping (dict)
+
+        Returns:
+            AsyncEnv: Environment instance
+        """
+        # Local filesystem mode - dict of resource names to file paths
+        if isinstance(instance_id, dict):
+            return self._create_local_instance(instance_id)
+
+        # Localhost/direct URL mode - string starting with http:// or https://
+        elif isinstance(instance_id, str) and instance_id.startswith(("http://", "https://")):
+            return self._create_url_instance(instance_id)
+
+        # Remote mode - existing behavior
+        else:
+            response = await self.client.request("GET", f"/v1/env/instances/{instance_id}")
+            instance = AsyncEnv(client=self.client, **response.json())
+            await instance.instance.load()
+            return instance
+
+    def _create_url_instance(self, base_url: str) -> AsyncEnv:
+        """Create instance connected to a direct URL (localhost or custom).
+
+        Args:
+            base_url: URL of the instance manager API
+
+        Returns:
+            AsyncEnv: Environment instance configured for URL mode
+        """
+        instance_client = AsyncInstanceClient(url=base_url, httpx_client=self._httpx_client)
+
+        # Create a minimal environment for URL mode
+        env = AsyncEnv(
+            client=self.client,
+            instance_id=base_url,
+            env_key="localhost",
+            version="",
+            status="running",
+            subdomain="localhost",
+            created_at="",
+            updated_at="",
+            terminated_at=None,
+            team_id="",
+            region="localhost",
+            env_variables=None,
+            data_key=None,
+            data_version=None,
+            urls=None,
+            health=None,
+        )
+        env._instance = instance_client
+        return env
+
+    @staticmethod
+    def _normalize_db_path(path: str) -> tuple[str, bool]:
+        """Normalize database path and detect if it's in-memory.
+
+        Args:
+            path: Database path - can be:
+                - File path: "./data.db"
+                - Plain memory: ":memory:"
+                - Named memory: ":memory:namespace"
+                - URI: "file:name?mode=memory&cache=shared"
+
+        Returns:
+            Tuple of (normalized_path, is_memory)
+        """
+        import uuid
+        import sqlite3
+
+        if path == ":memory:":
+            # Plain :memory: - create unique namespace
+            name = f"mem_{uuid.uuid4().hex[:8]}"
+            return f"file:{name}?mode=memory&cache=shared", True
+        elif path.startswith(":memory:"):
+            # Named memory: :memory:current -> file:current?mode=memory&cache=shared
+            namespace = path[8:]  # Remove ":memory:" prefix
+            return f"file:{namespace}?mode=memory&cache=shared", True
+        elif "mode=memory" in path:
+            # Already a proper memory URI
+            return path, True
+        else:
+            # Regular file path
+            return path, False
+
+    def _create_local_instance(self, dbs: Dict[str, str]) -> AsyncEnv:
+        """Create instance with local file-based or in-memory SQLite resources.
+
+        Args:
+            dbs: Map of resource names to paths (e.g., {"current": "./data.db"} or
+                {"current": ":memory:current"})
+
+        Returns:
+            AsyncEnv: Environment instance configured for local mode
+        """
+        import sqlite3
+
+        instance_client = AsyncInstanceClient(url="local://", httpx_client=None)
+        instance_client._resources = []  # Mark as loaded
+        instance_client._memory_anchors = {}  # Store anchor connections for in-memory DBs
+
+        # Store creation parameters for local AsyncSQLiteResources
+        # This allows db() to create new instances each time (matching HTTP mode behavior)
+        for name, path in dbs.items():
+            # Normalize path and detect if it's in-memory
+            normalized_path, is_memory = self._normalize_db_path(path)
+
+            # Create anchor connection for in-memory databases
+            # This keeps the database alive as long as the env exists
+            if is_memory:
+                anchor_conn = sqlite3.connect(normalized_path, uri=True)
+                instance_client._memory_anchors[name] = anchor_conn
+
+            resource_model = ResourceModel(
+                name=name,
+                type=ResourceType.db,
+                mode=ResourceMode.rw,
+                label=f"Local: {path}",
+            )
+            instance_client._resources_state[ResourceType.db.value][name] = {
+                'type': 'local',
+                'resource_model': resource_model,
+                'db_path': normalized_path,
+                'is_memory': is_memory
+            }
+
+        # Create a minimal environment for local mode
+        env = AsyncEnv(
+            client=self.client,
+            instance_id="local",
+            env_key="local",
+            version="",
+            status="running",
+            subdomain="local",
+            created_at="",
+            updated_at="",
+            terminated_at=None,
+            team_id="",
+            region="local",
+            env_variables=None,
+            data_key=None,
+            data_version=None,
+            urls=None,
+            health=None,
+        )
+        env._instance = instance_client
+        return env
 
     async def check_bundle_exists(self, bundle_hash: str) -> VerifiersCheckResponse:
         return await _check_bundle_exists(self.client, bundle_hash)
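The three dispatch modes of the new instance() method can be exercised roughly as follows (a sketch based on the docstring above; the client construction, paths, and IDs are placeholders):

    fleet = AsyncFleet()  # constructor arguments omitted

    # 1. Local mode: dict of resource names to SQLite paths (file or :memory:)
    env_local = await fleet.instance({"current": "./data.db", "seed": ":memory:seed"})

    # 2. URL mode: point directly at a running instance manager
    env_url = await fleet.instance("http://localhost:8080")

    # 3. Remote mode: look up a cloud instance by ID
    env_remote = await fleet.instance("inst_abc123")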
@@ -302,6 +778,65 @@ class AsyncFleet:
     async def delete(self, instance_id: str) -> InstanceResponse:
         return await _delete_instance(self.client, instance_id)
 
+    async def close(self, instance_id: str) -> InstanceResponse:
+        """Close (delete) a specific instance by ID.
+
+        Args:
+            instance_id: The instance ID to close
+
+        Returns:
+            InstanceResponse containing the deleted instance details
+        """
+        return await _delete_instance(self.client, instance_id)
+
+    async def heartbeat(self, instance_id: str, region: Optional[str] = None) -> HeartbeatResponse:
+        """Send heartbeat to keep instance alive (if heartbeat monitoring is enabled).
+
+        Args:
+            instance_id: The instance ID to send heartbeat for
+            region: Optional region override for cross-region heartbeats
+
+        Returns:
+            HeartbeatResponse containing heartbeat status and deadline information
+        """
+        return await _send_heartbeat(self.client, instance_id, region)
+
+    async def close_all(self, run_id: Optional[str] = None, profile_id: Optional[str] = None) -> List[InstanceResponse]:
+        """Close (delete) instances using the batch delete endpoint.
+
+        Args:
+            run_id: Optional run ID to filter instances by
+            profile_id: Optional profile ID to filter instances by (use "self" for your own profile)
+
+        Returns:
+            List[InstanceResponse] containing the deleted instances
+
+        Note:
+            At least one of run_id or profile_id must be provided.
+        """
+        return await _delete_instances_batch(self.client, run_id=run_id, profile_id=profile_id)
+
+    async def list_runs(
+        self, profile_id: Optional[str] = None, status: Optional[str] = "active"
+    ) -> List[Run]:
+        """List all runs (groups of instances by run_id) with aggregated statistics.
+
+        Args:
+            profile_id: Optional profile ID to filter runs by (use "self" for your own profile)
+            status: Filter by run status - "active" (default), "inactive", or "all"
+
+        Returns:
+            List[Run] containing run information with instance counts and timestamps
+        """
+        params = {}
+        if profile_id:
+            params["profile_id"] = profile_id
+        if status:
+            params["active"] = status
+
+        response = await self.client.request("GET", "/v1/env/runs", params=params)
+        return [Run(**run_data) for run_data in response.json()]
+
     async def load_tasks_from_file(self, filename: str) -> List[Task]:
         with open(filename, "r", encoding="utf-8") as f:
             tasks_data = f.read()
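Together with the run_id and heartbeat_interval arguments added to make() earlier in this diff, these methods suggest a run lifecycle along these lines (a sketch only; the env key, interval, and run ID are placeholders):

    envs = [await fleet.make("my_env", run_id="run-42", heartbeat_interval=60) for _ in range(4)]
    await fleet.heartbeat(envs[0].instance_id)       # keep an instance alive explicitly
    runs = await fleet.list_runs(profile_id="self")  # inspect active runs
    await fleet.close_all(run_id="run-42")           # batch-delete everything in the run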
@@ -368,6 +903,11 @@ class AsyncFleet:
         if not verifier_id:
             verifier_id = task_json.get("key", task_json.get("id"))
 
+        # Extract verifier_runtime_version from metadata if present
+        verifier_runtime_version = None
+        if "metadata" in task_json and isinstance(task_json["metadata"], dict):
+            verifier_runtime_version = task_json["metadata"].get("verifier_runtime_version")
+
         try:
             if verifier_id and verifier_code:
                 verifier = await self._create_verifier_from_data(
@@ -375,13 +915,14 @@ class AsyncFleet:
                     verifier_key=task_json.get("key", task_json.get("id")),
                     verifier_code=verifier_code,
                     verifier_sha=verifier_sha,
+                    verifier_runtime_version=verifier_runtime_version,
                 )
         except Exception as e:
             error_msg = f"Failed to create verifier {task_json.get('key', task_json.get('id'))}: {e}"
             if raise_on_verifier_error:
                 raise ValueError(error_msg) from e
-            else:
-
+            # else:
+            #     logger.warning(error_msg)
 
         task = Task(
             key=task_json.get("key", task_json.get("id")),
@@ -398,7 +939,10 @@ class AsyncFleet:
             verifier=verifier,  # Use created verifier or None
             verifier_id=verifier_id,  # Set verifier_id so _rebuild_verifier works
             verifier_sha=verifier_sha,  # Set verifier_sha
+            verifier_runtime_version=verifier_runtime_version,  # Set verifier_runtime_version
             metadata=task_json.get("metadata", {}),  # Default empty metadata
+            writer_metadata=task_json.get("writer_metadata"),  # Writer metadata
+            qa_metadata=task_json.get("qa_metadata"),  # QA metadata
             output_json_schema=task_json.get("output_json_schema"),  # JSON schema for output
         )
         return task
@@ -473,25 +1017,25 @@ class AsyncFleet:
                     verifier_sha=tr.verifier.sha256,
                 )
             except Exception as e:
-                logger.warning(
-
-                )
+                # logger.warning(
+                #     f"Failed to create verifier {tr.verifier.key}: {e}"
+                # )
                 return None
         else:
             # Fallback: try fetching by ID
             try:
-                logger.warning(
-
-
-                )
+                # logger.warning(
+                #     f"Embedded verifier code missing for {tr.verifier.key} (NoSuchKey). "
+                #     f"Attempting to refetch by id {tr.verifier.verifier_id}"
+                # )
                 return await self._load_verifier(
                     tr.verifier.verifier_id
                 )
             except Exception as e:
-                logger.warning(
-
-
-                )
+                # logger.warning(
+                #     f"Refetch by verifier id failed for {tr.verifier.key}: {e}. "
+                #     "Leaving verifier unset."
+                # )
                 return None
 
         # Add the coroutine for parallel execution
@@ -530,9 +1074,10 @@ class AsyncFleet:
             if task_response.verifier:
                 # Process verifier result
                 if isinstance(verifier_result, Exception):
-                    logger.warning(
-
-                    )
+                    # logger.warning(
+                    #     f"Verifier loading failed for {task_response.key}: {verifier_result}"
+                    # )
+                    pass
                 elif verifier_result is not None:
                     verifier = verifier_result
                     embedded_code = task_response.verifier.code or ""
@@ -542,6 +1087,21 @@ class AsyncFleet:
                     if not is_embedded_error:
                         verifier_func = embedded_code
 
+            # Extract verifier metadata
+            verifier_id = task_response.verifier_id
+            if not verifier_id and task_response.verifier:
+                verifier_id = task_response.verifier.verifier_id
+
+            verifier_sha = None
+            if task_response.verifier:
+                verifier_sha = task_response.verifier.sha256
+
+            # Extract verifier_runtime_version from metadata if present
+            verifier_runtime_version = None
+            metadata = task_response.metadata or {}
+            if isinstance(metadata, dict):
+                verifier_runtime_version = metadata.get("verifier_runtime_version")
+
             task = Task(
                 key=task_response.key,
                 prompt=task_response.prompt,
@@ -553,7 +1113,12 @@ class AsyncFleet:
                 env_variables=task_response.env_variables or {},
                 verifier_func=verifier_func,  # Set verifier code
                 verifier=verifier,  # Use created verifier or None
-
+                verifier_id=verifier_id,  # Set verifier_id
+                verifier_sha=verifier_sha,  # Set verifier_sha
+                verifier_runtime_version=verifier_runtime_version,  # Set verifier_runtime_version
+                metadata=metadata,
+                writer_metadata=getattr(task_response, "writer_metadata", None),  # Writer metadata
+                qa_metadata=getattr(task_response, "qa_metadata", None),  # QA metadata
                 output_json_schema=getattr(task_response, "output_json_schema", None),  # Get output_json_schema if available
             )
             tasks.append(task)
@@ -606,10 +1171,10 @@ class AsyncFleet:
             with open(filename, "w", encoding="utf-8") as f:
                 json.dump(tasks_data, f, indent=2, default=str)
 
-            logger.info(f"Exported {len(tasks)} tasks to {filename}")
+            # logger.info(f"Exported {len(tasks)} tasks to {filename}")
             return filename
         else:
-            logger.info("No tasks found to export")
+            # logger.info("No tasks found to export")
             return None
 
     async def import_single_task(self, task: Task, project_key: Optional[str] = None):
@@ -638,7 +1203,7 @@ class AsyncFleet:
             )
             return response
         except Exception as e:
-            logger.error(f"Failed to import task {task.key}: {e}")
+            # logger.error(f"Failed to import task {task.key}: {e}")
             return None
 
     async def import_tasks(self, filename: str, project_key: Optional[str] = None):
@@ -708,6 +1273,9 @@ class AsyncFleet:
         task_key: str,
         prompt: Optional[str] = None,
         verifier_code: Optional[str] = None,
+        metadata: Optional[Dict[str, Any]] = None,
+        writer_metadata: Optional[Dict[str, Any]] = None,
+        qa_metadata: Optional[Dict[str, Any]] = None,
     ) -> TaskResponse:
         """Update an existing task.
 
@@ -715,11 +1283,20 @@ class AsyncFleet:
             task_key: The key of the task to update
             prompt: New prompt text for the task (optional)
             verifier_code: Python code for task verification (optional)
+            metadata: Additional metadata for the task (optional)
+            writer_metadata: Metadata filled by task writer (optional)
+            qa_metadata: Metadata filled by QA reviewer (optional)
 
         Returns:
             TaskResponse containing the updated task details
         """
-        payload = TaskUpdateRequest(
+        payload = TaskUpdateRequest(
+            prompt=prompt,
+            verifier_code=verifier_code,
+            metadata=metadata,
+            writer_metadata=writer_metadata,
+            qa_metadata=qa_metadata,
+        )
         response = await self.client.request(
             "PUT", f"/v1/tasks/{task_key}", json=payload.model_dump(exclude_none=True)
         )
@@ -752,8 +1329,291 @@ class AsyncFleet:
         )
         return TaskResponse(**response.json())
 
+    # Sessions API methods
+
+    async def list_job_sessions(self, job_id: str) -> JobSessionsResponse:
+        """List all sessions for a job, grouped by task.
+
+        Args:
+            job_id: The job ID
+
+        Returns:
+            JobSessionsResponse containing sessions grouped by task with statistics
+        """
+        response = await self.client.request("GET", f"/v1/sessions/job/{job_id}")
+        return JobSessionsResponse(**response.json())
+
+    async def get_session_transcript(self, session_id: str) -> SessionTranscriptResponse:
+        """Get the transcript for a specific session.
+
+        Args:
+            session_id: The session ID
+
+        Returns:
+            SessionTranscriptResponse containing task, instance, verifier result, and messages
+        """
+        response = await self.client.request(
+            "GET", f"/v1/sessions/{session_id}/transcript"
+        )
+        return SessionTranscriptResponse(**response.json())
+
+    async def _ingest(
+        self,
+        messages: List[Dict[str, Any]],
+        session_id: Optional[str] = None,
+        model: Optional[str] = None,
+        task_key: Optional[str] = None,
+        job_id: Optional[str] = None,
+        instance_id: Optional[str] = None,
+        status: Optional[str] = None,
+        metadata: Optional[Dict[str, Any]] = None,
+        started_at: Optional[str] = None,
+        ended_at: Optional[str] = None,
+        verifier_execution_id: Optional[str] = None,
+    ) -> SessionIngestResponse:
+        """Internal method to ingest session data."""
+        message_objects = [SessionIngestMessage(**msg) for msg in messages]
+        request = SessionIngestRequest(
+            messages=message_objects,
+            session_id=session_id,
+            model=model,
+            task_key=task_key,
+            job_id=job_id,
+            instance_id=instance_id,
+            status=SessionStatus(status) if status else None,
+            metadata=metadata,
+            started_at=started_at,
+            ended_at=ended_at,
+            verifier_execution_id=verifier_execution_id,
+        )
+        response = await self.client.request(
+            "POST",
+            "/v1/sessions/ingest",
+            json=request.model_dump(exclude_none=True),
+        )
+        return SessionIngestResponse(**response.json())
+
+    async def _ingest_raw(
+        self,
+        payload: Dict[str, Any],
+    ) -> SessionIngestResponse:
+        """Internal method to ingest raw session data as JSON.
+
+        This sends the history and response as-is to the backend,
+        letting the backend handle format normalization.
+        """
+        # Pre-serialize with our custom handler to ensure all types are JSON-safe
+        json_str = json.dumps(payload, default=_json_default)
+        clean_payload = json.loads(json_str)
+
+        response = await self.client.request(
+            "POST",
+            "/v1/traces/logs",
+            json=clean_payload,
+        )
+        return SessionIngestResponse(**response.json())
+
+    def start_session(
+        self,
+        session_id: Optional[str] = None,
+        job_id: Optional[str] = None,
+        config: Optional[Any] = None,
+        model: Optional[str] = None,
+        task_key: Optional[str] = None,
+        instance_id: Optional[str] = None,
+    ) -> AsyncSession:
+        """Start a new session for logging agent interactions.
+
+        This returns a Session object. The session is created on the backend
+        when you call log() for the first time.
+
+        Args:
+            session_id: Optional existing session ID to resume
+            job_id: Optional job ID to associate with the session
+            config: Optional config object (e.g., GenerateContentConfig) to log
+            model: Optional model name to log
+            task_key: Optional Fleet task key
+            instance_id: Optional Fleet instance ID
+
+        Returns:
+            AsyncSession object with log(), complete(), and fail() methods
+
+        Example:
+            session = fleet_client.start_session(config=config, model="gpt-4", task_key="task_123")
+
+            # Log LLM calls during agent run
+            await session.log(history, response)
+
+            # Complete when done
+            await session.complete()
+        """
+        return AsyncSession(
+            client=self,
+            session_id=session_id,
+            job_id=job_id,
+            config=config,
+            model=model,
+            task_key=task_key,
+            instance_id=instance_id,
+        )
+
+    async def trace_job(self, name: Optional[str] = None) -> str:
+        """Create a new trace job.
+
+        Args:
+            name: Name of the job (generated server-side if not provided)
+
+        Returns:
+            The job_id string
+        """
+        from fleet.models import TraceJobRequest, TraceJobResponse
+
+        request = TraceJobRequest(name=name)
+        response = await self.client.request(
+            "POST",
+            "/v1/traces/jobs",
+            json=request.model_dump(),
+        )
+        result = TraceJobResponse(**response.json())
+        return result.job_id
+
+    async def create_session(
+        self,
+        model: Optional[str] = None,
+        task_key: Optional[str] = None,
+        job_id: Optional[str] = None,
+        instance_id: Optional[str] = None,
+        metadata: Optional[Dict[str, Any]] = None,
+        started_at: Optional[str] = None,
+        initial_message: Optional[Dict[str, Any]] = None,
+    ) -> SessionIngestResponse:
+        """Create a new session, optionally with an initial message.
+
+        This is useful for streaming scenarios where you want to create
+        a session first and then append messages one by one.
+
+        Args:
+            model: Model identifier (e.g., "anthropic/claude-sonnet-4")
+            task_key: Task key to associate with the session
+            job_id: Job ID to associate with the session
+            instance_id: Instance ID to associate with the session
+            metadata: Additional metadata for the session
+            started_at: ISO timestamp when session started
+            initial_message: Optional first message dict with 'role' and 'content'
+
+        Returns:
+            SessionIngestResponse containing session_id
+
+        Example:
+            # Create session and get ID
+            session = await fleet.create_session(
+                model="anthropic/claude-sonnet-4",
+                task_key="my_task",
+                started_at=datetime.now().isoformat()
+            )
+
+            # Append messages as they happen
+            await fleet.append_message(session.session_id, {"role": "user", "content": "Hello"})
+            await fleet.append_message(session.session_id, {"role": "assistant", "content": "Hi!"})
+        """
+        # Use a placeholder message if none provided
+        if initial_message:
+            messages = [initial_message]
+        else:
+            messages = [{"role": "system", "content": "[session created]"}]
+
+        return await self._ingest(
+            messages=messages,
+            model=model,
+            task_key=task_key,
+            job_id=job_id,
+            instance_id=instance_id,
+            status="running",
+            metadata=metadata,
+            started_at=started_at,
+        )
+
+    async def append_message(
+        self,
+        session_id: str,
+        message: Dict[str, Any],
+        status: Optional[str] = None,
+        ended_at: Optional[str] = None,
+    ) -> SessionIngestResponse:
+        """Append a single message to an existing session.
+
+        This is useful for streaming scenarios where you want to send
+        messages one by one as they happen.
+
+        Args:
+            session_id: The session ID to append to
+            message: Message dict with 'role' and 'content' keys.
+                Optional keys: 'tool_calls', 'tool_call_id', 'timestamp', 'tokens', 'metadata'
+            status: Optional status update ("running", "completed", "failed")
+            ended_at: ISO timestamp when session ended (set when completing)
+
+        Returns:
+            SessionIngestResponse with updated message count
+
+        Example:
+            # Append user message
+            await fleet.append_message(session_id, {"role": "user", "content": "What's 2+2?"})
+
+            # Append assistant response
+            await fleet.append_message(session_id, {"role": "assistant", "content": "4"})
+
+            # Complete the session
+            await fleet.append_message(
+                session_id,
+                {"role": "assistant", "content": "Done!"},
+                status="completed",
+                ended_at=datetime.now().isoformat()
+            )
+        """
+        return await self._ingest(
+            messages=[message],
+            session_id=session_id,
+            status=status,
+            ended_at=ended_at,
+        )
+
+    async def complete_session(
+        self,
+        session_id: str,
+        status: str = "completed",
+        ended_at: Optional[str] = None,
+        final_message: Optional[Dict[str, Any]] = None,
+    ) -> SessionIngestResponse:
+        """Mark a session as complete.
+
+        Args:
+            session_id: The session ID to complete
+            status: Final status ("completed", "failed", "cancelled")
+            ended_at: ISO timestamp when session ended (defaults to now)
+            final_message: Optional final message to append
+
+        Returns:
+            SessionIngestResponse with final state
+        """
+        from datetime import datetime as dt
+
+        if ended_at is None:
+            ended_at = dt.now().isoformat()
+
+        if final_message:
+            messages = [final_message]
+        else:
+            messages = [{"role": "system", "content": f"[session {status}]"}]
+
+        return await self._ingest(
+            messages=messages,
+            session_id=session_id,
+            status=status,
+            ended_at=ended_at,
+        )
+
     async def _create_verifier_from_data(
-        self, verifier_id: str, verifier_key: str, verifier_code: str, verifier_sha: str
+        self, verifier_id: str, verifier_key: str, verifier_code: str, verifier_sha: str, verifier_runtime_version: Optional[str] = None
     ) -> "AsyncVerifierFunction":
         """Create an AsyncVerifierFunction from verifier data.
 
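Two ingestion paths are added here: start_session() and AsyncSession.log() post raw history to /v1/traces/logs via _ingest_raw, while create_session(), append_message(), and complete_session() post structured SessionIngestMessage batches to /v1/sessions/ingest via _ingest. A sketch of the streaming path, following the docstring examples above:

    from datetime import datetime

    created = await fleet.create_session(
        model="anthropic/claude-sonnet-4",
        task_key="my_task",
        started_at=datetime.now().isoformat(),
    )
    sid = created.session_id
    await fleet.append_message(sid, {"role": "user", "content": "What's 2+2?"})
    await fleet.append_message(sid, {"role": "assistant", "content": "4"})
    await fleet.complete_session(sid)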
@@ -774,6 +1634,7 @@ class AsyncFleet:
             verifier_id=verifier_id,
             verifier_key=verifier_key,
             sha256=verifier_sha,
+            verifier_runtime_version=verifier_runtime_version or "",
         )
 
         # Store the original verifier code for reference
@@ -809,6 +1670,37 @@ async def _delete_instance(client: AsyncWrapper, instance_id: str) -> InstanceRe
     return InstanceResponse(**response.json())
 
 
+async def _send_heartbeat(client: AsyncWrapper, instance_id: str, region: Optional[str] = None) -> HeartbeatResponse:
+    """Send heartbeat to keep instance alive."""
+    body = {}
+    if region:
+        body["region"] = region
+
+    response = await client.request(
+        "POST",
+        f"/v1/env/instances/{instance_id}/heartbeat",
+        json=body
+    )
+    return HeartbeatResponse(**response.json())
+
+
+async def _delete_instances_batch(
+    client: AsyncWrapper, run_id: Optional[str] = None, profile_id: Optional[str] = None
+) -> List[InstanceResponse]:
+    """Delete instances using the batch endpoint with flexible filtering."""
+    params = {}
+    if run_id:
+        params["run_id"] = run_id
+    if profile_id:
+        params["profile_id"] = profile_id
+
+    if not params:
+        raise ValueError("At least one of run_id or profile_id must be provided")
+
+    response = await client.request("DELETE", "/v1/env/instances/batch", params=params)
+    return [InstanceResponse(**instance_data) for instance_data in response.json()]
+
+
 async def _check_bundle_exists(
     client: AsyncWrapper, bundle_hash: str
 ) -> VerifiersCheckResponse:
@@ -827,6 +1719,7 @@ async def _execute_verifier_remote(
     kwargs: dict,
     timeout: Optional[int] = 30,
     needs_upload: bool = True,
+    verifier_runtime_version: Optional[str] = None,
 ) -> VerifiersExecuteResponse:
     # Pickle args and kwargs together
     # The first arg should be None as a placeholder for env
@@ -850,18 +1743,22 @@ async def _execute_verifier_remote(
         bundle_b64 = base64.b64encode(bundle_data).decode("utf-8")
         request_data["bundle"] = bundle_b64
 
+    # Add verifier_runtime_version if present
+    if verifier_runtime_version:
+        request_data["verifier_runtime_version"] = verifier_runtime_version
+
     # Debug logging
-    logger.debug(
-
-    )
-    logger.debug(f"Request has bundle: {needs_upload}")
-    logger.debug(f"Using client with base_url: {client.base_url}")
-    logger.debug(f"Request data keys: {list(request_data.keys())}")
-    logger.debug(
-
-
-
-    )
+    # logger.debug(
+    #     f"Sending verifier execute request: key={key}, sha256={bundle_sha[:8]}..., function_name={function_name}"
+    # )
+    # logger.debug(f"Request has bundle: {needs_upload}")
+    # logger.debug(f"Using client with base_url: {client.base_url}")
+    # logger.debug(f"Request data keys: {list(request_data.keys())}")
+    # logger.debug(
+    #     f"Bundle size: {len(request_data.get('bundle', ''))} chars"
+    #     if "bundle" in request_data
+    #     else "No bundle"
+    # )
 
     # Note: This should be called on the instance URL, not the orchestrator
     # The instance has manager URLs for verifier execution
@@ -869,6 +1766,6 @@ async def _execute_verifier_remote(
 
     # Debug the response
     response_json = response.json()
-    logger.debug(f"Verifier execute response: {response_json}")
+    # logger.debug(f"Verifier execute response: {response_json}")
 
     return VerifiersExecuteResponse(**response_json)