openadapt-ml 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (55) hide show
  1. openadapt_ml/__init__.py +0 -0
  2. openadapt_ml/benchmarks/__init__.py +125 -0
  3. openadapt_ml/benchmarks/agent.py +825 -0
  4. openadapt_ml/benchmarks/azure.py +761 -0
  5. openadapt_ml/benchmarks/base.py +366 -0
  6. openadapt_ml/benchmarks/cli.py +884 -0
  7. openadapt_ml/benchmarks/data_collection.py +432 -0
  8. openadapt_ml/benchmarks/runner.py +381 -0
  9. openadapt_ml/benchmarks/waa.py +704 -0
  10. openadapt_ml/cloud/__init__.py +5 -0
  11. openadapt_ml/cloud/azure_inference.py +441 -0
  12. openadapt_ml/cloud/lambda_labs.py +2445 -0
  13. openadapt_ml/cloud/local.py +790 -0
  14. openadapt_ml/config.py +56 -0
  15. openadapt_ml/datasets/__init__.py +0 -0
  16. openadapt_ml/datasets/next_action.py +507 -0
  17. openadapt_ml/evals/__init__.py +23 -0
  18. openadapt_ml/evals/grounding.py +241 -0
  19. openadapt_ml/evals/plot_eval_metrics.py +174 -0
  20. openadapt_ml/evals/trajectory_matching.py +486 -0
  21. openadapt_ml/grounding/__init__.py +45 -0
  22. openadapt_ml/grounding/base.py +236 -0
  23. openadapt_ml/grounding/detector.py +570 -0
  24. openadapt_ml/ingest/__init__.py +43 -0
  25. openadapt_ml/ingest/capture.py +312 -0
  26. openadapt_ml/ingest/loader.py +232 -0
  27. openadapt_ml/ingest/synthetic.py +1102 -0
  28. openadapt_ml/models/__init__.py +0 -0
  29. openadapt_ml/models/api_adapter.py +171 -0
  30. openadapt_ml/models/base_adapter.py +59 -0
  31. openadapt_ml/models/dummy_adapter.py +42 -0
  32. openadapt_ml/models/qwen_vl.py +426 -0
  33. openadapt_ml/runtime/__init__.py +0 -0
  34. openadapt_ml/runtime/policy.py +182 -0
  35. openadapt_ml/schemas/__init__.py +53 -0
  36. openadapt_ml/schemas/sessions.py +122 -0
  37. openadapt_ml/schemas/validation.py +252 -0
  38. openadapt_ml/scripts/__init__.py +0 -0
  39. openadapt_ml/scripts/compare.py +1490 -0
  40. openadapt_ml/scripts/demo_policy.py +62 -0
  41. openadapt_ml/scripts/eval_policy.py +287 -0
  42. openadapt_ml/scripts/make_gif.py +153 -0
  43. openadapt_ml/scripts/prepare_synthetic.py +43 -0
  44. openadapt_ml/scripts/run_qwen_login_benchmark.py +192 -0
  45. openadapt_ml/scripts/train.py +174 -0
  46. openadapt_ml/training/__init__.py +0 -0
  47. openadapt_ml/training/benchmark_viewer.py +1538 -0
  48. openadapt_ml/training/shared_ui.py +157 -0
  49. openadapt_ml/training/stub_provider.py +276 -0
  50. openadapt_ml/training/trainer.py +2446 -0
  51. openadapt_ml/training/viewer.py +2970 -0
  52. openadapt_ml-0.1.0.dist-info/METADATA +818 -0
  53. openadapt_ml-0.1.0.dist-info/RECORD +55 -0
  54. openadapt_ml-0.1.0.dist-info/WHEEL +4 -0
  55. openadapt_ml-0.1.0.dist-info/licenses/LICENSE +21 -0
@@ -0,0 +1,157 @@
1
+ """Shared UI components for dashboards and viewers.
2
+
3
+ This module contains CSS and HTML generation functions used by both
4
+ the Training Dashboard and the Viewer for visual consistency.
5
+ """
6
+
7
+ from __future__ import annotations
8
+
9
+
10
def get_shared_header_css() -> str:
    """Generate CSS for the shared dashboard header.

    This CSS is used by both the Training Dashboard and the Viewer.
    Any changes here will affect all dashboards consistently.

    Returns:
        CSS text styling ``.unified-header`` and its children: the nav-tab
        pill group, control groups and labels, ``select`` inputs (custom
        dropdown arrow via an inline SVG data URI), and the monospace
        ``.header-meta`` line.

    Note:
        The rules reference CSS custom properties (``--text-primary``,
        ``--text-secondary``, ``--text-muted``, ``--accent``,
        ``--bg-primary``) that the host page is expected to define.
    """
    return '''
    .unified-header {
        display: flex;
        align-items: center;
        justify-content: space-between;
        padding: 12px 24px;
        background: linear-gradient(180deg, rgba(18,18,26,0.98) 0%, rgba(26,26,36,0.98) 100%);
        border-bottom: 1px solid rgba(255,255,255,0.08);
        margin-bottom: 20px;
        gap: 16px;
        flex-wrap: wrap;
        box-shadow: 0 2px 8px rgba(0,0,0,0.3);
    }
    .unified-header .nav-tabs {
        display: flex;
        align-items: center;
        gap: 4px;
        background: rgba(0,0,0,0.3);
        padding: 4px;
        border-radius: 8px;
    }
    .unified-header .nav-tab {
        padding: 8px 16px;
        border-radius: 6px;
        font-size: 0.85rem;
        font-weight: 500;
        text-decoration: none;
        color: var(--text-secondary);
        background: transparent;
        border: none;
        transition: all 0.2s;
        cursor: pointer;
    }
    .unified-header .nav-tab:hover {
        color: var(--text-primary);
        background: rgba(255,255,255,0.05);
    }
    .unified-header .nav-tab.active {
        color: var(--bg-primary);
        background: var(--accent);
        font-weight: 600;
    }
    .unified-header .controls-section {
        display: flex;
        align-items: center;
        gap: 24px;
        flex-wrap: wrap;
    }
    .unified-header .control-group {
        display: flex;
        align-items: center;
        gap: 10px;
    }
    .unified-header .control-label {
        font-size: 0.7rem;
        color: var(--text-muted);
        font-weight: 600;
        letter-spacing: 0.5px;
        text-transform: uppercase;
    }
    .unified-header select {
        padding: 8px 32px 8px 12px;
        border-radius: 8px;
        font-size: 0.85rem;
        background: rgba(0,0,0,0.4);
        color: var(--text-primary);
        border: 1px solid rgba(255,255,255,0.1);
        cursor: pointer;
        appearance: none;
        background-image: url('data:image/svg+xml,%3Csvg xmlns=%27http://www.w3.org/2000/svg%27 width=%2712%27 height=%278%27%3E%3Cpath fill=%27%23888%27 d=%27M0 0l6 8 6-8z%27/%3E%3C/svg%3E');
        background-repeat: no-repeat;
        background-position: right 10px center;
        transition: all 0.2s;
    }
    .unified-header select:hover {
        border-color: var(--accent);
        background-color: rgba(0,212,170,0.1);
    }
    .unified-header select:focus {
        outline: none;
        border-color: var(--accent);
        box-shadow: 0 0 0 2px rgba(0,212,170,0.2);
    }
    .unified-header .header-meta {
        font-size: 0.75rem;
        color: var(--text-muted);
        font-family: "SF Mono", Monaco, monospace;
    }
    '''
105
+
106
+
107
def generate_shared_header_html(
    active_page: str,
    controls_html: str = "",
    meta_html: str = "",
) -> str:
    """Generate the shared header HTML.

    Args:
        active_page: Either "training", "viewer", or "benchmarks" to highlight the active tab
        controls_html: Optional HTML for control groups (dropdowns, etc.)
        meta_html: Optional HTML for metadata display (job ID, capture ID, etc.)

    Returns:
        HTML string for the header
    """

    def mark(page: str) -> str:
        # CSS class marking the tab that matches the current page.
        return "active" if active_page == page else ""

    # Metadata span is only rendered when meta_html was supplied.
    meta_span = f'<span class="header-meta">{meta_html}</span>' if meta_html else ''

    controls_section = ""
    if controls_html or meta_html:
        controls_section = f'''
        <div class="controls-section">
            {controls_html}
            {meta_span}
        </div>
        '''

    return f'''
    <div class="unified-header">
        <div class="nav-tabs">
            <a href="dashboard.html" class="nav-tab {mark("training")}">Training</a>
            <a href="viewer.html" class="nav-tab {mark("viewer")}">Viewer</a>
            <a href="benchmark.html" class="nav-tab {mark("benchmarks")}">Benchmarks</a>
        </div>
        {controls_section}
    </div>
    '''
145
+
146
+
147
def build_nav_links() -> list[tuple[str, str]]:
    """Build navigation links for multi-capture dashboards.

    Returns:
        List of (filename, label) tuples, in display order.
    """
    filenames = ("dashboard.html", "viewer.html", "benchmark.html")
    labels = ("Training", "Viewer", "Benchmarks")
    return list(zip(filenames, labels))
@@ -0,0 +1,276 @@
1
+ """Stub training provider for rapid UI testing without actual training."""
2
+
3
import json
import random
import sys
import time
from datetime import datetime, timezone
from pathlib import Path
9
+
10
+
11
class StubTrainingProvider:
    """Simulates training without actual computation.

    Use this to test dashboard, viewer, stop button, etc. without
    waiting for real training on GPU or Lambda. Emits the same
    ``training_log.json`` structure as a real run so downstream UIs
    can be exercised unchanged.
    """

    def __init__(
        self,
        output_dir: Path,
        epochs: int = 5,
        steps_per_epoch: int = 10,
        step_delay: float = 0.5,
        early_stop_loss: float = 0.0,
        early_stop_patience: int = 3,
    ):
        """Initialize stub provider.

        Args:
            output_dir: Directory to write training_log.json
            epochs: Number of epochs to simulate
            steps_per_epoch: Steps per epoch
            step_delay: Delay between steps in seconds (for realistic feel)
            early_stop_loss: Stop if loss drops below this threshold
                (0.0 disables early stopping)
            early_stop_patience: Number of consecutive steps below threshold
                before stopping
        """
        self.output_dir = Path(output_dir)
        self.output_dir.mkdir(parents=True, exist_ok=True)

        self.epochs = epochs
        self.steps_per_epoch = steps_per_epoch
        self.step_delay = step_delay
        self.early_stop_loss = early_stop_loss
        self.early_stop_patience = early_stop_patience

        # Progress counters and accumulated history for get_status().
        self.current_epoch = 0
        self.current_step = 0
        self.losses = []
        self.evaluations = []
        self.start_time = time.time()
        self.job_id = f"stub_{datetime.now().strftime('%Y%m%d_%H%M%S')}"
        self.consecutive_low_loss = 0
        # termination_status is None while running; set to "user_stop",
        # "auto_low_loss", or "auto_complete" when the run ends.
        self.termination_status = None
        self.termination_message = None

        # Log file is opened lazily on first _log() call and closed in run().
        self.log_file = self.output_dir / "training.log"
        self.log_handle = None

    def _log(self, message: str, to_stdout: bool = True):
        """Write message to both log file and stdout.

        Args:
            message: Message to log
            to_stdout: If True, also print to stdout (default: True)
        """
        timestamp = datetime.now().strftime("%Y-%m-%d %H:%M:%S")
        log_line = f"[{timestamp}] {message}"

        # Open lazily, line-buffered, so `tail -f` shows progress immediately.
        if self.log_handle is None:
            self.log_handle = open(self.log_file, "w", buffering=1)

        self.log_handle.write(log_line + "\n")
        self.log_handle.flush()

        if to_stdout:
            print(message)

    def simulate_step(self) -> dict:
        """Simulate one training step.

        Returns:
            Current training status dict
        """
        # Generate a decreasing loss curve (~2.5 down to ~0.5) with noise.
        total_steps = self.epochs * self.steps_per_epoch
        # Guard degenerate configs (epochs=0 or steps_per_epoch=0) against
        # ZeroDivisionError; treat such runs as already fully progressed.
        progress = self.current_step / total_steps if total_steps else 1.0
        base_loss = 2.5 * (1 - progress * 0.8)
        noise = random.uniform(-0.15, 0.15)
        loss = max(0.1, base_loss + noise)

        elapsed = time.time() - self.start_time

        self.losses.append({
            "epoch": self.current_epoch,
            "step": self.current_step + 1,
            "loss": loss,
            "lr": 5e-5,
            "time": elapsed,
        })

        self.current_step += 1

        # Epoch boundary: emit a fake evaluation, then advance the counter.
        if self.steps_per_epoch and self.current_step % self.steps_per_epoch == 0:
            self._generate_epoch_evaluation()
            self.current_epoch += 1
            # Cap at max epochs for display
            if self.current_epoch > self.epochs:
                self.current_epoch = self.epochs

        return self.get_status()

    def _generate_epoch_evaluation(self):
        """Generate fake evaluation for completed epoch."""
        # Improve accuracy as training progresses (called before the epoch
        # counter is incremented, so the first evaluation uses progress 0).
        progress = self.current_epoch / self.epochs
        accuracy_boost = progress * 0.3  # Up to 30% improvement

        # Use real screenshot if available, otherwise placeholder
        sample_path = self.output_dir / "screenshots" / "sample.png"
        if not sample_path.exists():
            # Best-effort: copy from a developer-local capture location.
            # NOTE(review): this path is machine-specific; harmless when absent.
            import shutil
            capture_screenshots = Path.home() / "oa/src/openadapt-capture/turn-off-nightshift/screenshots"
            if capture_screenshots.exists():
                sample_path.parent.mkdir(parents=True, exist_ok=True)
                for img in capture_screenshots.glob("*.png"):
                    shutil.copy(img, sample_path)
                    break  # Just copy the first one

        self.evaluations.append({
            "epoch": self.current_epoch,
            "sample_idx": 7,  # Match the real training sample
            "image_path": "screenshots/sample.png",
            "human_action": {
                "type": "click",
                "x": 0.65,
                "y": 0.65,
                "text": None,
            },
            "predicted_action": {
                "type": "click",
                # Prediction error shrinks as accuracy_boost grows.
                "x": 0.65 + random.uniform(-0.15, 0.15) * (1 - accuracy_boost),
                "y": 0.65 + random.uniform(-0.15, 0.15) * (1 - accuracy_boost),
                "raw_output": f"Thought: [Stub] Epoch {self.current_epoch} - analyzing screenshot to find target element. The model is learning to identify UI components.\nAction: CLICK(x=0.65, y=0.65)",
            },
            "distance": random.uniform(0.05, 0.2) * (1 - accuracy_boost),
            "correct": random.random() > (0.5 - accuracy_boost),
        })

    def get_status(self) -> dict:
        """Return current training status.

        Returns:
            Status dict compatible with training_log.json format
        """
        current_loss = self.losses[-1]["loss"] if self.losses else 0
        elapsed = time.time() - self.start_time

        # Determine status
        if self.termination_status:
            status = "completed" if self.termination_status == "auto_complete" else self.termination_status
        elif self.is_complete():
            status = "completed"
        else:
            status = "training"

        return {
            "job_id": self.job_id,
            "hostname": "stub-local",
            "capture_path": "/stub/capture",
            "config_path": "configs/stub.yaml",
            "instance_type": "stub",
            "instance_ip": "127.0.0.1",
            # BUGFIX: previously formatted local time and appended "Z",
            # mislabeling a naive local timestamp as UTC. Convert to UTC
            # explicitly and keep the trailing "Z" convention.
            "started_at": datetime.fromtimestamp(self.start_time, tz=timezone.utc)
            .isoformat()
            .replace("+00:00", "Z"),
            "cloud_provider": "stub",
            "cloud_dashboard_url": "",
            "cloud_instance_id": "stub",
            "setup_status": "training",
            "setup_logs": ["[Stub] Simulated training in progress..."],
            "epoch": self.current_epoch,
            "step": self.current_step,
            "total_steps": self.epochs * self.steps_per_epoch,
            "total_epochs": self.epochs,
            "loss": current_loss,
            "learning_rate": 5e-5,
            "samples_seen": self.current_step,
            "elapsed_time": elapsed,
            "losses": self.losses,
            "evaluations": self.evaluations,
            "status": status,
            "termination_status": self.termination_status,
            "termination_message": self.termination_message,
        }

    def write_status(self):
        """Write current status to training_log.json."""
        log_path = self.output_dir / "training_log.json"
        log_path.write_text(json.dumps(self.get_status(), indent=2))

    def is_complete(self) -> bool:
        """Check if training simulation is complete."""
        return self.current_epoch >= self.epochs

    def check_stop_signal(self) -> bool:
        """Check if stop signal file exists (written by the dashboard UI)."""
        stop_file = self.output_dir / "STOP_TRAINING"
        return stop_file.exists()

    def run(self, callback=None):
        """Run the full training simulation.

        Args:
            callback: Optional function called after each step with status dict

        Returns:
            Final status dict (see get_status()).
        """
        self._log(f"[Stub] Starting simulated training: {self.epochs} epochs, {self.steps_per_epoch} steps/epoch")
        self._log(f"[Stub] Output: {self.output_dir}")
        self._log(f"[Stub] Step delay: {self.step_delay}s (total ~{self.epochs * self.steps_per_epoch * self.step_delay:.0f}s)")
        if self.early_stop_loss > 0:
            self._log(f"[Stub] Early stop: loss < {self.early_stop_loss} for {self.early_stop_patience} steps")
        self._log("")

        while not self.is_complete():
            # Check for user stop signal
            if self.check_stop_signal():
                self._log("\n[Stub] Stop signal received from user!")
                (self.output_dir / "STOP_TRAINING").unlink(missing_ok=True)
                self.termination_status = "user_stop"
                self.termination_message = f"Stopped at epoch {self.current_epoch + 1}, step {self.current_step}"
                self.write_status()
                break

            status = self.simulate_step()

            # Check for early stop loss
            loss = status["loss"]
            if self.early_stop_loss > 0 and loss < self.early_stop_loss:
                self.consecutive_low_loss += 1
                if self.consecutive_low_loss >= self.early_stop_patience:
                    self._log(f"\n[Stub] Auto-stopped: loss ({loss:.4f}) < {self.early_stop_loss} for {self.early_stop_patience} steps")
                    self.termination_status = "auto_low_loss"
                    self.termination_message = f"Loss reached {loss:.4f} (< {self.early_stop_loss})"
                    self.write_status()
                    break
            else:
                # Streak must be consecutive; any high-loss step resets it.
                self.consecutive_low_loss = 0

            self.write_status()

            # Progress output
            epoch = status["epoch"]
            step = status["step"]
            display_epoch = min(epoch + 1, self.epochs)  # Cap at max for display
            self._log(f"  Epoch {display_epoch}/{self.epochs} | Step {step} | Loss: {loss:.4f}")

            if callback:
                callback(status)

            time.sleep(self.step_delay)

        # Set completion status if not already set (normal completion path)
        if self.termination_status is None:
            self.termination_status = "auto_complete"
            self.termination_message = f"Completed {self.epochs} epochs"
            self.write_status()

        self._log(f"\n[Stub] Training complete: {self.termination_status}")

        # Close log file
        if self.log_handle:
            self.log_handle.close()
            self.log_handle = None

        return self.get_status()