openadapt-ml 0.2.0__py3-none-any.whl → 0.2.1__py3-none-any.whl

This diff shows the changes between two publicly released versions of the package, as published to a supported registry. It is provided for informational purposes only.
Files changed (95)
  1. openadapt_ml/baselines/__init__.py +121 -0
  2. openadapt_ml/baselines/adapter.py +185 -0
  3. openadapt_ml/baselines/cli.py +314 -0
  4. openadapt_ml/baselines/config.py +448 -0
  5. openadapt_ml/baselines/parser.py +922 -0
  6. openadapt_ml/baselines/prompts.py +787 -0
  7. openadapt_ml/benchmarks/__init__.py +13 -115
  8. openadapt_ml/benchmarks/agent.py +265 -421
  9. openadapt_ml/benchmarks/azure.py +28 -19
  10. openadapt_ml/benchmarks/azure_ops_tracker.py +521 -0
  11. openadapt_ml/benchmarks/cli.py +1722 -4847
  12. openadapt_ml/benchmarks/trace_export.py +631 -0
  13. openadapt_ml/benchmarks/viewer.py +22 -5
  14. openadapt_ml/benchmarks/vm_monitor.py +530 -29
  15. openadapt_ml/benchmarks/waa_deploy/Dockerfile +47 -53
  16. openadapt_ml/benchmarks/waa_deploy/api_agent.py +21 -20
  17. openadapt_ml/cloud/azure_inference.py +3 -5
  18. openadapt_ml/cloud/lambda_labs.py +722 -307
  19. openadapt_ml/cloud/local.py +2038 -487
  20. openadapt_ml/cloud/ssh_tunnel.py +68 -26
  21. openadapt_ml/datasets/next_action.py +40 -30
  22. openadapt_ml/evals/grounding.py +8 -3
  23. openadapt_ml/evals/plot_eval_metrics.py +15 -13
  24. openadapt_ml/evals/trajectory_matching.py +41 -26
  25. openadapt_ml/experiments/demo_prompt/format_demo.py +16 -6
  26. openadapt_ml/experiments/demo_prompt/run_experiment.py +26 -16
  27. openadapt_ml/experiments/representation_shootout/__init__.py +70 -0
  28. openadapt_ml/experiments/representation_shootout/conditions.py +708 -0
  29. openadapt_ml/experiments/representation_shootout/config.py +390 -0
  30. openadapt_ml/experiments/representation_shootout/evaluator.py +659 -0
  31. openadapt_ml/experiments/representation_shootout/runner.py +687 -0
  32. openadapt_ml/experiments/waa_demo/runner.py +29 -14
  33. openadapt_ml/export/parquet.py +36 -24
  34. openadapt_ml/grounding/detector.py +18 -14
  35. openadapt_ml/ingest/__init__.py +8 -6
  36. openadapt_ml/ingest/capture.py +25 -22
  37. openadapt_ml/ingest/loader.py +7 -4
  38. openadapt_ml/ingest/synthetic.py +189 -100
  39. openadapt_ml/models/api_adapter.py +14 -4
  40. openadapt_ml/models/base_adapter.py +10 -2
  41. openadapt_ml/models/providers/__init__.py +288 -0
  42. openadapt_ml/models/providers/anthropic.py +266 -0
  43. openadapt_ml/models/providers/base.py +299 -0
  44. openadapt_ml/models/providers/google.py +376 -0
  45. openadapt_ml/models/providers/openai.py +342 -0
  46. openadapt_ml/models/qwen_vl.py +46 -19
  47. openadapt_ml/perception/__init__.py +35 -0
  48. openadapt_ml/perception/integration.py +399 -0
  49. openadapt_ml/retrieval/demo_retriever.py +50 -24
  50. openadapt_ml/retrieval/embeddings.py +9 -8
  51. openadapt_ml/retrieval/retriever.py +3 -1
  52. openadapt_ml/runtime/__init__.py +50 -0
  53. openadapt_ml/runtime/policy.py +18 -5
  54. openadapt_ml/runtime/safety_gate.py +471 -0
  55. openadapt_ml/schema/__init__.py +9 -0
  56. openadapt_ml/schema/converters.py +74 -27
  57. openadapt_ml/schema/episode.py +31 -18
  58. openadapt_ml/scripts/capture_screenshots.py +530 -0
  59. openadapt_ml/scripts/compare.py +85 -54
  60. openadapt_ml/scripts/demo_policy.py +4 -1
  61. openadapt_ml/scripts/eval_policy.py +15 -9
  62. openadapt_ml/scripts/make_gif.py +1 -1
  63. openadapt_ml/scripts/prepare_synthetic.py +3 -1
  64. openadapt_ml/scripts/train.py +21 -9
  65. openadapt_ml/segmentation/README.md +920 -0
  66. openadapt_ml/segmentation/__init__.py +97 -0
  67. openadapt_ml/segmentation/adapters/__init__.py +5 -0
  68. openadapt_ml/segmentation/adapters/capture_adapter.py +420 -0
  69. openadapt_ml/segmentation/annotator.py +610 -0
  70. openadapt_ml/segmentation/cache.py +290 -0
  71. openadapt_ml/segmentation/cli.py +674 -0
  72. openadapt_ml/segmentation/deduplicator.py +656 -0
  73. openadapt_ml/segmentation/frame_describer.py +788 -0
  74. openadapt_ml/segmentation/pipeline.py +340 -0
  75. openadapt_ml/segmentation/schemas.py +622 -0
  76. openadapt_ml/segmentation/segment_extractor.py +634 -0
  77. openadapt_ml/training/azure_ops_viewer.py +1097 -0
  78. openadapt_ml/training/benchmark_viewer.py +52 -41
  79. openadapt_ml/training/shared_ui.py +7 -7
  80. openadapt_ml/training/stub_provider.py +57 -35
  81. openadapt_ml/training/trainer.py +143 -86
  82. openadapt_ml/training/trl_trainer.py +70 -21
  83. openadapt_ml/training/viewer.py +323 -108
  84. openadapt_ml/training/viewer_components.py +180 -0
  85. {openadapt_ml-0.2.0.dist-info → openadapt_ml-0.2.1.dist-info}/METADATA +215 -14
  86. openadapt_ml-0.2.1.dist-info/RECORD +116 -0
  87. openadapt_ml/benchmarks/base.py +0 -366
  88. openadapt_ml/benchmarks/data_collection.py +0 -432
  89. openadapt_ml/benchmarks/live_tracker.py +0 -180
  90. openadapt_ml/benchmarks/runner.py +0 -418
  91. openadapt_ml/benchmarks/waa.py +0 -761
  92. openadapt_ml/benchmarks/waa_live.py +0 -619
  93. openadapt_ml-0.2.0.dist-info/RECORD +0 -86
  94. {openadapt_ml-0.2.0.dist-info → openadapt_ml-0.2.1.dist-info}/WHEEL +0 -0
  95. {openadapt_ml-0.2.0.dist-info → openadapt_ml-0.2.1.dist-info}/licenses/LICENSE +0 -0
openadapt_ml/perception/integration.py (new file)
@@ -0,0 +1,399 @@
+ """
+ Integration Bridge between openadapt-grounding and openadapt-ml
+
+ This module provides the UIElementGraph class which wraps parsed UI elements
+ from openadapt-grounding parsers and converts them to the openadapt-ml schema.
+
+ Types imported from openadapt-grounding:
+ - Parser: Protocol for UI element parsers (OmniParser, UITars, etc.)
+ - Element: A detected UI element with normalized bounds
+ - LocatorResult: Result of attempting to locate an element
+ - RegistryEntry: A stable element that survived temporal filtering
+ """
+
+ from __future__ import annotations
+
+ import uuid
+ from collections import Counter
+ from typing import Any, Literal, Optional, Union
+
+ from pydantic import BaseModel, Field
+
+ from openadapt_ml.schema.episode import BoundingBox, UIElement
+
+ # Lazy import for openadapt-grounding to make it an optional dependency
+ _grounding_available: Optional[bool] = None
+
+
+ def _check_grounding_available() -> bool:
+     """Check if openadapt-grounding is installed."""
+     global _grounding_available
+     if _grounding_available is None:
+         try:
+             import openadapt_grounding  # noqa: F401
+
+             _grounding_available = True
+         except ImportError:
+             _grounding_available = False
+     return _grounding_available
+
+
+ def _get_grounding_types():
+     """Import and return openadapt-grounding types.
+
+     Raises:
+         ImportError: If openadapt-grounding is not installed
+     """
+     if not _check_grounding_available():
+         raise ImportError(
+             "openadapt-grounding is required for perception integration. "
+             "Install it with: pip install openadapt-grounding"
+         )
+     from openadapt_grounding import Element, LocatorResult, Parser, RegistryEntry
+
+     return Element, LocatorResult, Parser, RegistryEntry
+
+
+ # Source types for UI element graphs
+ SourceType = Literal["omniparser", "uitars", "ax", "dom", "mixed"]
+
+
+ def element_to_ui_element(
+     element: Any,  # openadapt_grounding.Element
+     image_width: Optional[int] = None,
+     image_height: Optional[int] = None,
+     element_index: Optional[int] = None,
+     source: Optional[str] = None,
+ ) -> UIElement:
+     """Convert an openadapt-grounding Element to a schema UIElement.
+
+     Args:
+         element: Element from openadapt-grounding with normalized bounds
+         image_width: Image width in pixels (for coordinate conversion)
+         image_height: Image height in pixels (for coordinate conversion)
+         element_index: Optional index to use as element_id
+         source: Source parser name (stored in automation_id for reference)
+
+     Returns:
+         UIElement with converted bounds and properties
+     """
+     Element, _, _, _ = _get_grounding_types()
+
+     if not isinstance(element, Element):
+         raise TypeError(f"Expected Element, got {type(element)}")
+
+     # Extract normalized bounds (x, y, width, height)
+     norm_x, norm_y, norm_w, norm_h = element.bounds
+
+     # Convert to pixel coordinates if dimensions provided
+     if image_width is not None and image_height is not None:
+         bounds = BoundingBox(
+             x=int(norm_x * image_width),
+             y=int(norm_y * image_height),
+             width=int(norm_w * image_width),
+             height=int(norm_h * image_height),
+         )
+     else:
+         # Store normalized as integers (multiply by 10000 for precision)
+         # This allows using BoundingBox which requires int values
+         bounds = BoundingBox(
+             x=int(norm_x * 10000),
+             y=int(norm_y * 10000),
+             width=int(norm_w * 10000),
+             height=int(norm_h * 10000),
+         )
+
+     # Generate element_id from index if provided
+     element_id = str(element_index) if element_index is not None else None
+
+     return UIElement(
+         role=element.element_type,
+         name=element.text,
+         bounds=bounds,
+         element_id=element_id,
+         automation_id=source,  # Store source in automation_id for reference
+     )
+
+
+ def ui_element_to_element(
+     ui_element: UIElement,
+     image_width: Optional[int] = None,
+     image_height: Optional[int] = None,
+ ) -> Any:  # Returns openadapt_grounding.Element
+     """Convert a schema UIElement back to an openadapt-grounding Element.
+
+     Useful for evaluation or when passing elements back to grounding functions.
+
+     Args:
+         ui_element: UIElement from openadapt-ml schema
+         image_width: Image width in pixels (for coordinate normalization)
+         image_height: Image height in pixels (for coordinate normalization)
+
+     Returns:
+         Element with normalized bounds
+     """
+     Element, _, _, _ = _get_grounding_types()
+
+     if ui_element.bounds is None:
+         # Return element with zero bounds if no bounds available
+         return Element(
+             bounds=(0.0, 0.0, 0.0, 0.0),
+             text=ui_element.name,
+             element_type=ui_element.role or "unknown",
+             confidence=1.0,
+         )
+
+     # Convert pixel coordinates to normalized
+     if image_width is not None and image_height is not None:
+         norm_x = ui_element.bounds.x / image_width
+         norm_y = ui_element.bounds.y / image_height
+         norm_w = ui_element.bounds.width / image_width
+         norm_h = ui_element.bounds.height / image_height
+     else:
+         # Assume bounds are already in 10000-scale normalized format
+         norm_x = ui_element.bounds.x / 10000
+         norm_y = ui_element.bounds.y / 10000
+         norm_w = ui_element.bounds.width / 10000
+         norm_h = ui_element.bounds.height / 10000
+
+     return Element(
+         bounds=(norm_x, norm_y, norm_w, norm_h),
+         text=ui_element.name,
+         element_type=ui_element.role or "unknown",
+         confidence=1.0,
+     )
+
+
+ class UIElementGraph(BaseModel):
+     """A graph of UI elements parsed from a screenshot.
+
+     This class wraps a list of UIElement objects and tracks their source
+     (which parser produced them). It provides a bridge between openadapt-grounding
+     parsers and the openadapt-ml schema system.
+
+     Attributes:
+         graph_id: Unique identifier for this graph (UUID)
+         elements: List of UIElement objects
+         source: Primary source parser ("omniparser", "uitars", "ax", "dom", "mixed")
+         source_summary: Count of elements by source (e.g., {"omniparser": 15, "ax": 8})
+         timestamp_ms: Optional timestamp when the screenshot was captured
+         image_width: Original image width (for coordinate reference)
+         image_height: Original image height (for coordinate reference)
+
+     Example:
+         >>> from openadapt_grounding import OmniParserClient
+         >>> from openadapt_ml.perception import UIElementGraph
+         >>>
+         >>> parser = OmniParserClient(endpoint="http://localhost:8000")
+         >>> elements = parser.parse(image)
+         >>> graph = UIElementGraph.from_parser_output(elements, "omniparser")
+         >>> print(f"Found {len(graph.elements)} elements")
+     """
+
+     graph_id: str = Field(
+         default_factory=lambda: str(uuid.uuid4()),
+         description="Unique identifier for this graph",
+     )
+     elements: list[UIElement] = Field(
+         default_factory=list,
+         description="List of UI elements in the graph",
+     )
+     source: SourceType = Field(
+         default="mixed",
+         description="Primary source parser for the elements",
+     )
+     source_summary: dict[str, int] = Field(
+         default_factory=dict,
+         description="Count of elements by source",
+     )
+     timestamp_ms: Optional[int] = Field(
+         None,
+         description="Timestamp when the screenshot was captured (milliseconds)",
+     )
+     image_width: Optional[int] = Field(
+         None,
+         description="Original image width in pixels",
+     )
+     image_height: Optional[int] = Field(
+         None,
+         description="Original image height in pixels",
+     )
+
+     @classmethod
+     def from_parser_output(
+         cls,
+         elements: list[Any],  # list[openadapt_grounding.Element]
+         source: Union[SourceType, str],
+         image_width: Optional[int] = None,
+         image_height: Optional[int] = None,
+         timestamp_ms: Optional[int] = None,
+     ) -> "UIElementGraph":
+         """Create a UIElementGraph from parser output.
+
+         Args:
+             elements: List of Element objects from openadapt-grounding parser
+             source: Parser source name ("omniparser", "uitars", "ax", "dom")
+             image_width: Image width in pixels (for coordinate conversion)
+             image_height: Image height in pixels (for coordinate conversion)
+             timestamp_ms: Optional timestamp when screenshot was captured
+
+         Returns:
+             UIElementGraph with converted UIElement objects
+         """
+         # Validate source type
+         valid_sources = {"omniparser", "uitars", "ax", "dom", "mixed"}
+         if source not in valid_sources:
+             # Allow custom sources but warn
+             pass
+
+         # Convert elements
+         ui_elements = [
+             element_to_ui_element(
+                 element=el,
+                 image_width=image_width,
+                 image_height=image_height,
+                 element_index=i,
+                 source=source,
+             )
+             for i, el in enumerate(elements)
+         ]
+
+         # Build source summary
+         source_summary = {source: len(elements)}
+
+         return cls(
+             elements=ui_elements,
+             source=source if source in valid_sources else "mixed",
+             source_summary=source_summary,
+             timestamp_ms=timestamp_ms,
+             image_width=image_width,
+             image_height=image_height,
+         )
+
+     @classmethod
+     def merge(
+         cls,
+         graphs: list["UIElementGraph"],
+         deduplicate_iou_threshold: Optional[float] = None,
+     ) -> "UIElementGraph":
+         """Merge multiple UIElementGraphs into one.
+
+         Args:
+             graphs: List of UIElementGraph objects to merge
+             deduplicate_iou_threshold: If provided, remove duplicate elements
+                 with IoU greater than this threshold (0.0-1.0)
+
+         Returns:
+             New UIElementGraph with combined elements
+         """
+         if not graphs:
+             return cls()
+
+         # Combine all elements
+         all_elements: list[UIElement] = []
+         source_counts: Counter[str] = Counter()
+
+         for graph in graphs:
+             all_elements.extend(graph.elements)
+             for src, count in graph.source_summary.items():
+                 source_counts[src] += count
+
+         # Get image dimensions from first graph that has them
+         image_width = None
+         image_height = None
+         for graph in graphs:
+             if graph.image_width is not None:
+                 image_width = graph.image_width
+                 image_height = graph.image_height
+                 break
+
+         # TODO: Implement deduplication by IoU if threshold provided
+         # For now, just combine all elements
+
+         return cls(
+             elements=all_elements,
+             source="mixed" if len(source_counts) > 1 else list(source_counts.keys())[0],
+             source_summary=dict(source_counts),
+             timestamp_ms=graphs[0].timestamp_ms if graphs else None,
+             image_width=image_width,
+             image_height=image_height,
+         )
+
+     def to_dict(self) -> dict[str, Any]:
+         """Convert to JSON-serializable dictionary.
+
+         Returns:
+             Dictionary representation suitable for JSON serialization
+         """
+         return self.model_dump()
+
+     @classmethod
+     def from_dict(cls, data: dict[str, Any]) -> "UIElementGraph":
+         """Create from dictionary.
+
+         Args:
+             data: Dictionary representation
+
+         Returns:
+             UIElementGraph instance
+         """
+         return cls.model_validate(data)
+
+     def get_element_by_id(self, element_id: str) -> Optional[UIElement]:
+         """Find element by ID.
+
+         Args:
+             element_id: Element ID to search for
+
+         Returns:
+             UIElement if found, None otherwise
+         """
+         for element in self.elements:
+             if element.element_id == element_id:
+                 return element
+         return None
+
+     def get_elements_by_role(self, role: str) -> list[UIElement]:
+         """Find elements by role.
+
+         Args:
+             role: Role to filter by (e.g., "button", "textbox")
+
+         Returns:
+             List of matching UIElements
+         """
+         return [el for el in self.elements if el.role == role]
+
+     def get_elements_by_text(
+         self,
+         text: str,
+         exact: bool = False,
+     ) -> list[UIElement]:
+         """Find elements by text content.
+
+         Args:
+             text: Text to search for
+             exact: If True, require exact match; if False, use substring match
+
+         Returns:
+             List of matching UIElements
+         """
+         results = []
+         for el in self.elements:
+             if el.name is None:
+                 continue
+             if exact:
+                 if el.name == text:
+                     results.append(el)
+             else:
+                 if text.lower() in el.name.lower():
+                     results.append(el)
+         return results
+
+     def __len__(self) -> int:
+         """Return number of elements in the graph."""
+         return len(self.elements)
+
+     def __iter__(self):
+         """Iterate over elements."""
+         return iter(self.elements)
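Note on the TODO in merge() above: IoU-based deduplication is left unimplemented. A minimal sketch of what that filter could look like, as hypothetical helpers that are not part of the package (assumes all bounds share one coordinate space):

from openadapt_ml.schema.episode import BoundingBox, UIElement  # same imports as the module above

def _iou(a: BoundingBox, b: BoundingBox) -> float:
    """Intersection-over-union of two bounding boxes."""
    x1, y1 = max(a.x, b.x), max(a.y, b.y)
    x2 = min(a.x + a.width, b.x + b.width)
    y2 = min(a.y + a.height, b.y + b.height)
    inter = max(0, x2 - x1) * max(0, y2 - y1)
    union = a.width * a.height + b.width * b.height - inter
    return inter / union if union > 0 else 0.0

def _deduplicate_by_iou(elements: list[UIElement], threshold: float) -> list[UIElement]:
    """Keep an element unless it overlaps an already-kept element above threshold."""
    kept: list[UIElement] = []
    for el in elements:
        if el.bounds is None or all(
            k.bounds is None or _iou(el.bounds, k.bounds) <= threshold for k in kept
        ):
            kept.append(el)
    return kept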
openadapt_ml/retrieval/demo_retriever.py
@@ -32,7 +32,6 @@ Example usage:

  from __future__ import annotations

- import hashlib
  import json
  import logging
  from dataclasses import dataclass, field
@@ -206,11 +205,15 @@ class DemoRetriever:
          platform = self._detect_platform(episode, app_name, domain)

          # Extract action types
-         action_types = list(set(
-             step.action.type.value if hasattr(step.action.type, 'value') else str(step.action.type)
-             for step in episode.steps
-             if step.action
-         ))
+         action_types = list(
+             set(
+                 step.action.type.value
+                 if hasattr(step.action.type, "value")
+                 else str(step.action.type)
+                 for step in episode.steps
+                 if step.action
+             )
+         )

          # Extract key elements
          key_elements = self._extract_key_elements(episode)
@@ -297,9 +300,13 @@ class DemoRetriever:
              return

          if not self._demos:
-             raise ValueError("Cannot build index: no demos added. Use add_demo() first.")
+             raise ValueError(
+                 "Cannot build index: no demos added. Use add_demo() first."
+             )

-         logger.info(f"Building index for {len(self._demos)} demos using {self.embedding_method}...")
+         logger.info(
+             f"Building index for {len(self._demos)} demos using {self.embedding_method}..."
+         )

          # Initialize embedder if needed
          if self._embedder is None:
@@ -358,16 +365,21 @@
          }

          with open(path / "index.json", "w") as f:
-             json.dump({
-                 "embedding_method": self.embedding_method,
-                 "embedding_model": self.embedding_model,
-                 "demos": metadata,
-                 "embedder_state": embedder_state,
-             }, f, indent=2)
+             json.dump(
+                 {
+                     "embedding_method": self.embedding_method,
+                     "embedding_model": self.embedding_model,
+                     "demos": metadata,
+                     "embedder_state": embedder_state,
+                 },
+                 f,
+                 indent=2,
+             )

          # Save embeddings as numpy array
          try:
              import numpy as np
+
              if self._embeddings_matrix is not None:
                  np.save(path / "embeddings.npy", self._embeddings_matrix)
          except ImportError:
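For reference, the payload written by the json.dump call above has roughly this shape, sketched as a Python literal (values are illustrative; demos entries carry at least demo_id/goal/file_path per the loader below, and embedder_state for TF-IDF holds vocab/vocab_to_idx per the restore code further down):

index_payload = {
    "embedding_method": "tfidf",
    "embedding_model": "tfidf-default",  # illustrative model name
    "demos": [
        {"demo_id": "demo-001", "goal": "Save the file", "file_path": "demos/demo-001.json"},
    ],
    "embedder_state": {
        "vocab": ["click", "save", "file"],
        "vocab_to_idx": {"click": 0, "save": 1, "file": 2},
    },
}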
@@ -375,7 +387,11 @@

          logger.info(f"Index saved to {path}")

-     def load_index(self, path: Union[str, Path], episode_loader: Optional[Callable[[str], Episode]] = None) -> None:
+     def load_index(
+         self,
+         path: Union[str, Path],
+         episode_loader: Optional[Callable[[str], Episode]] = None,
+     ) -> None:
          """Load index from disk.

          Args:
@@ -395,6 +411,7 @@
          embeddings = None
          try:
              import numpy as np
+
              embeddings_path = path / "embeddings.npy"
              if embeddings_path.exists():
                  embeddings = np.load(embeddings_path)
@@ -409,11 +426,14 @@
              try:
                  episode = episode_loader(meta["file_path"])
              except Exception as e:
-                 logger.warning(f"Failed to load episode from {meta['file_path']}: {e}")
+                 logger.warning(
+                     f"Failed to load episode from {meta['file_path']}: {e}"
+                 )

              # Create placeholder episode if not loaded
              if episode is None:
                  from openadapt_ml.schema import Action, ActionType, Observation, Step
+
                  episode = Episode(
                      episode_id=meta["demo_id"],
                      instruction=meta["goal"],
@@ -454,6 +474,7 @@
          embedder_state = data.get("embedder_state", {})
          if embedder_state and self.embedding_method == "tfidf":
              from openadapt_ml.retrieval.embeddings import TFIDFEmbedder
+
              self._embedder = TFIDFEmbedder()
              self._embedder.vocab = embedder_state.get("vocab", [])
              self._embedder.vocab_to_idx = embedder_state.get("vocab_to_idx", {})
@@ -512,12 +533,14 @@
              bonus = self._compute_context_bonus(demo, app_context, domain_context)
              total_score = text_score + bonus

-             results.append(RetrievalResult(
-                 demo=demo,
-                 score=total_score,
-                 text_score=text_score,
-                 domain_bonus=bonus,
-             ))
+             results.append(
+                 RetrievalResult(
+                     demo=demo,
+                     score=total_score,
+                     text_score=text_score,
+                     domain_bonus=bonus,
+                 )
+             )

          # Sort by score (descending)
          results.sort(key=lambda r: r.score, reverse=True)
@@ -618,6 +641,7 @@
      def _format_action_minimal(self, action: Any) -> str:
          """Format action as minimal string."""
          from openadapt_ml.experiments.demo_prompt.format_demo import format_action
+
          return format_action(action)

      # =========================================================================
@@ -628,10 +652,12 @@
          """Initialize the embedding backend."""
          if self.embedding_method == "tfidf":
              from openadapt_ml.retrieval.embeddings import TFIDFEmbedder
+
              self._embedder = TFIDFEmbedder()

          elif self.embedding_method == "sentence_transformers":
              from openadapt_ml.retrieval.embeddings import SentenceTransformerEmbedder
+
              self._embedder = SentenceTransformerEmbedder(
                  model_name=self.embedding_model,
                  cache_dir=self.cache_dir / "st_cache",
@@ -639,6 +665,7 @@

          elif self.embedding_method == "openai":
              from openadapt_ml.retrieval.embeddings import OpenAIEmbedder
+
              self._embedder = OpenAIEmbedder(
                  model_name=self.embedding_model,
                  cache_dir=self.cache_dir / "openai_cache",
@@ -739,8 +766,7 @@
          if filter_tags:
              filter_tags_set = set(filter_tags)
              candidates = [
-                 d for d in candidates
-                 if filter_tags_set.issubset(set(d.tags))
+                 d for d in candidates if filter_tags_set.issubset(set(d.tags))
              ]

          return candidates
openadapt_ml/retrieval/embeddings.py
@@ -25,9 +25,9 @@ import logging
  import re
  from abc import ABC, abstractmethod
  from collections import Counter
- from math import log, sqrt
+ from math import log
  from pathlib import Path
- from typing import Any, Dict, List, Optional, Union
+ from typing import Any, Dict, List, Optional

  logger = logging.getLogger(__name__)

@@ -121,7 +121,7 @@ class TFIDFEmbedder(BaseEmbedder):
          Returns:
              List of tokens.
          """
-         tokens = re.findall(r'\b\w+\b', text.lower())
+         tokens = re.findall(r"\b\w+\b", text.lower())
          return tokens

      def _compute_tf(self, tokens: List[str]) -> Dict[str, float]:
@@ -169,8 +169,7 @@
          # Compute IDF: log(N / df) + 1
          n_docs = max(len(documents), 1)
          self.idf = {
-             term: log(n_docs / doc_freq.get(term, 1)) + 1
-             for term in self.vocab
+             term: log(n_docs / doc_freq.get(term, 1)) + 1 for term in self.vocab
          }

          self._is_fitted = True
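To make the smoothing concrete, a standalone sketch that reproduces the IDF formula above on toy documents (illustrative data, not package code):

import re
from collections import Counter
from math import log

docs = ["Click the Save button", "Click the Close button", "Type the file name"]
tokenized = [re.findall(r"\b\w+\b", d.lower()) for d in docs]

# Document frequency per term, then IDF with the same smoothing as above: log(N / df) + 1
n_docs = len(docs)
doc_freq = Counter(t for tokens in tokenized for t in set(tokens))
idf = {term: log(n_docs / doc_freq[term]) + 1 for term in doc_freq}

print(round(idf["click"], 3))  # in 2 of 3 docs -> log(3/2) + 1 ~= 1.405
print(round(idf["save"], 3))   # in 1 of 3 docs -> log(3/1) + 1 ~= 2.099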
@@ -440,6 +439,7 @@ class OpenAIEmbedder(BaseEmbedder):
                  cached = json.load(f)
              # Convert lists back to arrays
              import numpy as np
+
              for key, val in cached.items():
                  self._embedding_cache[key] = np.array(val, dtype=np.float32)
              logger.debug(f"Loaded {len(self._embedding_cache)} cached embeddings")
@@ -455,8 +455,7 @@
          try:
              # Convert arrays to lists for JSON
              cache_data = {
-                 key: val.tolist()
-                 for key, val in self._embedding_cache.items()
+                 key: val.tolist() for key, val in self._embedding_cache.items()
              }
              with open(cache_file, "w") as f:
                  json.dump(cache_data, f)
@@ -525,7 +524,9 @@

          # Process in batches
          for batch_start in range(0, len(uncached_texts), self.batch_size):
-             batch_texts = uncached_texts[batch_start:batch_start + self.batch_size]
+             batch_texts = uncached_texts[
+                 batch_start : batch_start + self.batch_size
+             ]

              try:
                  response = client.embeddings.create(
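The slicing reformatted above sits inside a cache-aware batching loop. The overall pattern, as a self-contained sketch (model name and in-memory cache are illustrative; the real class also persists its cache to JSON, as shown earlier):

from openai import OpenAI

client = OpenAI()
cache: dict[str, list[float]] = {}

def embed_all(texts: list[str], batch_size: int = 100) -> list[list[float]]:
    """Embed texts, skipping cached ones, in batches of batch_size."""
    uncached = [t for t in texts if t not in cache]
    for batch_start in range(0, len(uncached), batch_size):
        batch = uncached[batch_start : batch_start + batch_size]
        response = client.embeddings.create(model="text-embedding-3-small", input=batch)
        for text, item in zip(batch, response.data):
            cache[text] = item.embedding
    return [cache[t] for t in texts]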
openadapt_ml/retrieval/retriever.py
@@ -49,7 +49,9 @@ class DemoRetriever:
          if index.is_empty():
              raise ValueError("Cannot create retriever from empty index")
          if not index.is_fitted():
-             raise ValueError("Index must be built before retrieval (call index.build())")
+             raise ValueError(
+                 "Index must be built before retrieval (call index.build())"
+             )

          self.index = index
          self.domain_bonus = domain_bonus
openadapt_ml/runtime/__init__.py (new file)
@@ -0,0 +1,50 @@
+ """
+ Runtime module for GUI automation agents.
+
+ This module provides:
+ - AgentPolicy: Runtime policy wrapper for VLM-based action prediction
+ - SafetyGate: Deterministic safety checks for action validation
+
+ Example usage:
+     from openadapt_ml.runtime import AgentPolicy, SafetyGate, SafetyConfig, SafetyDecision
+
+     # Create policy and safety gate
+     policy = AgentPolicy(adapter)
+     gate = SafetyGate(SafetyConfig(confidence_threshold=0.8))
+
+     # In agent loop
+     action, thought, state, raw = policy.predict_action_from_sample(sample)
+     assessment = gate.assess(action, observation)
+
+     if assessment.decision == SafetyDecision.ALLOW:
+         execute(action)
+     elif assessment.decision == SafetyDecision.REQUIRE_CONFIRMATION:
+         if user_confirms():
+             execute(action)
+     else:  # BLOCK
+         log_blocked(assessment.reason)
+ """
+
+ from openadapt_ml.runtime.policy import (
+     AgentPolicy,
+     PolicyOutput,
+     parse_thought_state_action,
+ )
+ from openadapt_ml.runtime.safety_gate import (
+     SafetyAssessment,
+     SafetyConfig,
+     SafetyDecision,
+     SafetyGate,
+ )
+
+ __all__ = [
+     # Policy
+     "AgentPolicy",
+     "PolicyOutput",
+     "parse_thought_state_action",
+     # Safety Gate
+     "SafetyGate",
+     "SafetyConfig",
+     "SafetyDecision",
+     "SafetyAssessment",
+ ]