PyPI - openadapt-capture - Versions diffs - 0.1.0__tar.gz - Mend

openadapt-capture 0.1.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (43) hide show

openadapt_capture-0.1.0/.env.example +7 -0
openadapt_capture-0.1.0/.github/workflows/publish.yml +30 -0
openadapt_capture-0.1.0/.github/workflows/test.yml +55 -0
openadapt_capture-0.1.0/.gitignore +53 -0
openadapt_capture-0.1.0/PKG-INFO +227 -0
openadapt_capture-0.1.0/README.md +183 -0
openadapt_capture-0.1.0/docs/DESIGN.md +276 -0
openadapt_capture-0.1.0/docs/VISUALIZATION_DESIGN.md +156 -0
openadapt_capture-0.1.0/docs/images/codec_comparison.png +0 -0
openadapt_capture-0.1.0/docs/images/demo.gif +0 -0
openadapt_capture-0.1.0/docs/images/frame_comparison.png +0 -0
openadapt_capture-0.1.0/docs/images/performance_stats.png +0 -0
openadapt_capture-0.1.0/docs/images/viewer.html +602 -0
openadapt_capture-0.1.0/openadapt_capture/__init__.py +140 -0
openadapt_capture-0.1.0/openadapt_capture/audio.py +489 -0
openadapt_capture-0.1.0/openadapt_capture/capture.py +300 -0
openadapt_capture-0.1.0/openadapt_capture/cli.py +289 -0
openadapt_capture-0.1.0/openadapt_capture/comparison.py +276 -0
openadapt_capture-0.1.0/openadapt_capture/config.py +29 -0
openadapt_capture-0.1.0/openadapt_capture/events.py +280 -0
openadapt_capture-0.1.0/openadapt_capture/input.py +494 -0
openadapt_capture-0.1.0/openadapt_capture/processing.py +548 -0
openadapt_capture-0.1.0/openadapt_capture/recorder.py +304 -0
openadapt_capture-0.1.0/openadapt_capture/stats.py +212 -0
openadapt_capture-0.1.0/openadapt_capture/storage.py +617 -0
openadapt_capture-0.1.0/openadapt_capture/video.py +440 -0
openadapt_capture-0.1.0/openadapt_capture/visualize/__init__.py +11 -0
openadapt_capture-0.1.0/openadapt_capture/visualize/demo.py +343 -0
openadapt_capture-0.1.0/openadapt_capture/visualize/html.py +1538 -0
openadapt_capture-0.1.0/openadapt_capture/visualize/overlays.py +469 -0
openadapt_capture-0.1.0/pyproject.toml +91 -0
openadapt_capture-0.1.0/scripts/compare_codecs.py +369 -0
openadapt_capture-0.1.0/scripts/generate_readme_demo.py +167 -0
openadapt_capture-0.1.0/scripts/generate_readme_plots.py +232 -0
openadapt_capture-0.1.0/scripts/generate_real_capture_plot.py +217 -0
openadapt_capture-0.1.0/tests/__init__.py +1 -0
openadapt_capture-0.1.0/tests/test_comparison.py +225 -0
openadapt_capture-0.1.0/tests/test_events.py +273 -0
openadapt_capture-0.1.0/tests/test_highlevel.py +172 -0
openadapt_capture-0.1.0/tests/test_processing.py +254 -0
openadapt_capture-0.1.0/tests/test_processing_comprehensive.py +454 -0
openadapt_capture-0.1.0/tests/test_stats.py +261 -0
openadapt_capture-0.1.0/tests/test_storage.py +275 -0

openadapt_capture-0.1.0/.env.example ADDED Viewed

@@ -0,0 +1,7 @@
+# OpenAI API key (optional)
+# Only needed for fast cloud-based audio transcription via: capture transcribe <dir> --api
+# Without this key, you can still use local Whisper transcription: capture transcribe <dir>
+# Recording works without any API key.
+#
+# Get your key at: https://platform.openai.com/api-keys
+OPENAI_API_KEY=sk-...

openadapt_capture-0.1.0/.github/workflows/publish.yml ADDED Viewed

@@ -0,0 +1,30 @@
+name: Publish to PyPI
+on:
+  push:
+    tags:
+      - 'v*'
+jobs:
+  publish:
+    runs-on: ubuntu-latest
+    permissions:
+      id-token: write  # Required for trusted publishing
+      contents: read   # Required for checkout
+    steps:
+      - uses: actions/checkout@v4
+      - name: Install uv
+        uses: astral-sh/setup-uv@v4
+        with:
+          version: "latest"
+      - name: Set up Python
+        run: uv python install 3.12
+      - name: Build package
+        run: uv build
+      - name: Publish to PyPI
+        uses: pypa/gh-action-pypi-publish@release/v1

openadapt_capture-0.1.0/.github/workflows/test.yml ADDED Viewed

@@ -0,0 +1,55 @@
+name: Tests
+on:
+  push:
+    branches: [main]
+  pull_request:
+    branches: [main]
+jobs:
+  test:
+    runs-on: ubuntu-latest
+    strategy:
+      matrix:
+        python-version: ["3.10", "3.11", "3.12"]
+    steps:
+      - uses: actions/checkout@v4
+      - name: Install uv
+        uses: astral-sh/setup-uv@v4
+        with:
+          version: "latest"
+      - name: Set up Python ${{ matrix.python-version }}
+        run: uv python install ${{ matrix.python-version }}
+      - name: Install system dependencies
+        run: |
+          sudo apt-get update
+          sudo apt-get install -y ffmpeg libportaudio2
+      - name: Install dependencies
+        run: uv sync --extra dev
+      - name: Run tests
+        run: uv run pytest tests/ -v
+  lint:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+      - name: Install uv
+        uses: astral-sh/setup-uv@v4
+        with:
+          version: "latest"
+      - name: Set up Python
+        run: uv python install 3.12
+      - name: Install dependencies
+        run: uv sync --extra dev
+      - name: Run ruff
+        run: uv run ruff check openadapt_capture/

openadapt_capture-0.1.0/.gitignore ADDED Viewed

@@ -0,0 +1,53 @@
+# Python
+__pycache__/
+*.py[cod]
+*$py.class
+*.so
+.Python
+build/
+develop-eggs/
+dist/
+downloads/
+eggs/
+.eggs/
+lib/
+lib64/
+parts/
+sdist/
+var/
+wheels/
+*.egg-info/
+.installed.cfg
+*.egg
+# Virtual environments
+.venv/
+venv/
+ENV/
+# Testing
+.pytest_cache/
+.coverage
+htmlcov/
+.tox/
+.nox/
+# IDEs
+.idea/
+.vscode/
+*.swp
+*.swo
+*~
+# OS
+.DS_Store
+Thumbs.db
+# uv
+uv.lock
+# Environment variables (contains API keys)
+.env
+# Demo captures (large data files)
+demo_*/

openadapt_capture-0.1.0/PKG-INFO ADDED Viewed

@@ -0,0 +1,227 @@
+Metadata-Version: 2.4
+Name: openadapt-capture
+Version: 0.1.0
+Summary: GUI interaction capture - platform-agnostic event streams with time-aligned media
+Project-URL: Homepage, https://github.com/OpenAdaptAI/openadapt-capture
+Project-URL: Repository, https://github.com/OpenAdaptAI/openadapt-capture
+Author-email: "MLDSAI Inc." <richard@mldsai.com>
+License-Expression: MIT
+Keywords: automation,capture,events,gui,rpa
+Classifier: Development Status :: 2 - Pre-Alpha
+Classifier: Intended Audience :: Developers
+Classifier: License :: OSI Approved :: MIT License
+Classifier: Programming Language :: Python :: 3
+Classifier: Programming Language :: Python :: 3.10
+Classifier: Programming Language :: Python :: 3.11
+Classifier: Programming Language :: Python :: 3.12
+Classifier: Topic :: Software Development :: Libraries :: Python Modules
+Requires-Python: >=3.10
+Requires-Dist: av>=10.0.0
+Requires-Dist: fire>=0.7.1
+Requires-Dist: mss>=6.0.0
+Requires-Dist: openai-whisper>=20250625
+Requires-Dist: openai>=2.11.0
+Requires-Dist: pillow>=9.0.0
+Requires-Dist: pydantic-settings>=2.12.0
+Requires-Dist: pydantic>=2.0.0
+Requires-Dist: pynput>=1.7.0
+Requires-Dist: sounddevice>=0.5.3
+Requires-Dist: soundfile>=0.13.1
+Provides-Extra: all
+Requires-Dist: openadapt-privacy>=0.1.0; extra == 'all'
+Requires-Dist: openai-whisper>=20230314; extra == 'all'
+Provides-Extra: dev
+Requires-Dist: matplotlib>=3.5.0; extra == 'dev'
+Requires-Dist: numpy>=1.21.0; extra == 'dev'
+Requires-Dist: pytest-cov>=4.0.0; extra == 'dev'
+Requires-Dist: pytest>=7.0.0; extra == 'dev'
+Requires-Dist: ruff>=0.1.0; extra == 'dev'
+Provides-Extra: privacy
+Requires-Dist: openadapt-privacy>=0.1.0; extra == 'privacy'
+Provides-Extra: transcribe
+Requires-Dist: openai-whisper>=20230314; extra == 'transcribe'
+Description-Content-Type: text/markdown
+# openadapt-capture
+GUI interaction capture - platform-agnostic event streams with time-aligned media.
+> **Status:** Pre-alpha. See [docs/DESIGN.md](docs/DESIGN.md) for architecture discussion.
+## Installation
+```bash
+uv add openadapt-capture
+```
+This includes everything needed to capture and replay GUI interactions (mouse, keyboard, screen recording).
+For local Whisper transcription of captured audio (large download), install the `transcribe` extra:
+```bash
+uv add "openadapt-capture[transcribe]"
+```
+## Quick Start
+### Capture
+```python
+from openadapt_capture import Recorder
+# Record GUI interactions
+with Recorder("./my_capture", task_description="Demo task") as recorder:
+    # Captures mouse, keyboard, and screen until context exits
+    input("Press Enter to stop recording...")
+print(f"Captured {recorder.event_count} events")
+```
+### Replay / Analysis
+```python
+from openadapt_capture import Capture
+# Load and iterate over time-aligned events
+capture = Capture.load("./my_capture")
+for action in capture.actions():
+    # Each action has an associated screenshot
+    print(f"{action.timestamp}: {action.type} at ({action.x}, {action.y})")
+    screenshot = action.screenshot  # PIL Image at time of action
+```
+### Low-Level API
+```python
+from openadapt_capture import (
+    create_capture, process_events,
+    MouseDownEvent, MouseButton,
+)
+# Create storage (platform and screen size auto-detected)
+capture, storage = create_capture("./my_capture")
+# Write raw events
+storage.write_event(MouseDownEvent(timestamp=1.0, x=100, y=200, button=MouseButton.LEFT))
+# Query and process
+raw_events = storage.get_events()
+actions = process_events(raw_events)  # Merges clicks, drags, typed text
+```
+## Event Types
+**Raw events** (captured):
+- `mouse.move`, `mouse.down`, `mouse.up`, `mouse.scroll`
+- `key.down`, `key.up`
+- `screen.frame`, `audio.chunk`
+**Actions** (processed):
+- `mouse.singleclick`, `mouse.doubleclick`, `mouse.drag`
+- `key.type` (merged keystrokes → text)
+## Architecture
+```
+capture_directory/
+├── capture.db      # SQLite: events, metadata
+├── video.mp4       # Screen recording
+└── audio.flac      # Audio (optional)
+```
+## Performance Statistics
+Track event write latency and analyze capture performance:
+```python
+from openadapt_capture import Recorder
+with Recorder("./my_capture") as recorder:
+    input("Press Enter to stop...")
+# Access performance statistics
+summary = recorder.stats.summary()
+print(f"Mean latency: {summary['mean_latency_ms']:.1f}ms")
+# Generate performance plot
+recorder.stats.plot(output_path="performance.png")
+```
+![Performance Statistics](docs/images/performance_stats.png)
+## Frame Extraction Verification
+Compare extracted video frames against original images to verify lossless capture:
+```python
+from openadapt_capture import compare_video_to_images, plot_comparison
+# Compare frames
+report = compare_video_to_images(
+    "capture/video.mp4",
+    [(timestamp, image) for timestamp, image in captured_frames],
+)
+print(f"Mean diff: {report.mean_diff_overall:.2f}")
+print(f"Lossless: {report.is_lossless}")
+# Visualize comparison
+plot_comparison(report, output_path="comparison.png")
+```
+![Frame Comparison](docs/images/frame_comparison.png)
+## Visualization
+Generate animated demos and interactive viewers from recordings:
+### Animated GIF Demo
+```python
+from openadapt_capture import Capture, create_demo
+capture = Capture.load("./my_capture")
+create_demo(capture, output="demo.gif", fps=10, max_duration=15)
+```
+### Interactive HTML Viewer
+```python
+from openadapt_capture import Capture, create_html
+capture = Capture.load("./my_capture")
+create_html(capture, output="viewer.html", include_audio=True)
+```
+The HTML viewer includes:
+- Timeline scrubber with event markers
+- Frame-by-frame navigation
+- Synchronized audio playback
+- Event list with details panel
+- Keyboard shortcuts (Space, arrows, Home/End)
+### Generate Demo from Command Line
+```bash
+uv run python scripts/generate_readme_demo.py --duration 10
+```
+## Optional Extras
+| Extra | Features |
+|-------|----------|
+| `transcribe` | Local Whisper transcription |
+| `privacy` | PII scrubbing (openadapt-privacy) |
+| `all` | Everything |
+## Development
+```bash
+uv sync --extra dev
+uv run pytest
+```
+## License
+MIT

openadapt_capture-0.1.0/README.md ADDED Viewed

@@ -0,0 +1,183 @@
+# openadapt-capture
+GUI interaction capture - platform-agnostic event streams with time-aligned media.
+> **Status:** Pre-alpha. See [docs/DESIGN.md](docs/DESIGN.md) for architecture discussion.
+## Installation
+```bash
+uv add openadapt-capture
+```
+This includes everything needed to capture and replay GUI interactions (mouse, keyboard, screen recording).
+For local Whisper transcription of captured audio (large download), install the `transcribe` extra:
+```bash
+uv add "openadapt-capture[transcribe]"
+```
+## Quick Start
+### Capture
+```python
+from openadapt_capture import Recorder
+# Record GUI interactions
+with Recorder("./my_capture", task_description="Demo task") as recorder:
+    # Captures mouse, keyboard, and screen until context exits
+    input("Press Enter to stop recording...")
+print(f"Captured {recorder.event_count} events")
+```
+### Replay / Analysis
+```python
+from openadapt_capture import Capture
+# Load and iterate over time-aligned events
+capture = Capture.load("./my_capture")
+for action in capture.actions():
+    # Each action has an associated screenshot
+    print(f"{action.timestamp}: {action.type} at ({action.x}, {action.y})")
+    screenshot = action.screenshot  # PIL Image at time of action
+```
+### Low-Level API
+```python
+from openadapt_capture import (
+    create_capture, process_events,
+    MouseDownEvent, MouseButton,
+)
+# Create storage (platform and screen size auto-detected)
+capture, storage = create_capture("./my_capture")
+# Write raw events
+storage.write_event(MouseDownEvent(timestamp=1.0, x=100, y=200, button=MouseButton.LEFT))
+# Query and process
+raw_events = storage.get_events()
+actions = process_events(raw_events)  # Merges clicks, drags, typed text
+```
+## Event Types
+**Raw events** (captured):
+- `mouse.move`, `mouse.down`, `mouse.up`, `mouse.scroll`
+- `key.down`, `key.up`
+- `screen.frame`, `audio.chunk`
+**Actions** (processed):
+- `mouse.singleclick`, `mouse.doubleclick`, `mouse.drag`
+- `key.type` (merged keystrokes → text)
+## Architecture
+```
+capture_directory/
+├── capture.db      # SQLite: events, metadata
+├── video.mp4       # Screen recording
+└── audio.flac      # Audio (optional)
+```
+## Performance Statistics
+Track event write latency and analyze capture performance:
+```python
+from openadapt_capture import Recorder
+with Recorder("./my_capture") as recorder:
+    input("Press Enter to stop...")
+# Access performance statistics
+summary = recorder.stats.summary()
+print(f"Mean latency: {summary['mean_latency_ms']:.1f}ms")
+# Generate performance plot
+recorder.stats.plot(output_path="performance.png")
+```
+![Performance Statistics](docs/images/performance_stats.png)
+## Frame Extraction Verification
+Compare extracted video frames against original images to verify lossless capture:
+```python
+from openadapt_capture import compare_video_to_images, plot_comparison
+# Compare frames
+report = compare_video_to_images(
+    "capture/video.mp4",
+    [(timestamp, image) for timestamp, image in captured_frames],
+)
+print(f"Mean diff: {report.mean_diff_overall:.2f}")
+print(f"Lossless: {report.is_lossless}")
+# Visualize comparison
+plot_comparison(report, output_path="comparison.png")
+```
+![Frame Comparison](docs/images/frame_comparison.png)
+## Visualization
+Generate animated demos and interactive viewers from recordings:
+### Animated GIF Demo
+```python
+from openadapt_capture import Capture, create_demo
+capture = Capture.load("./my_capture")
+create_demo(capture, output="demo.gif", fps=10, max_duration=15)
+```
+### Interactive HTML Viewer
+```python
+from openadapt_capture import Capture, create_html
+capture = Capture.load("./my_capture")
+create_html(capture, output="viewer.html", include_audio=True)
+```
+The HTML viewer includes:
+- Timeline scrubber with event markers
+- Frame-by-frame navigation
+- Synchronized audio playback
+- Event list with details panel
+- Keyboard shortcuts (Space, arrows, Home/End)
+### Generate Demo from Command Line
+```bash
+uv run python scripts/generate_readme_demo.py --duration 10
+```
+## Optional Extras
+| Extra | Features |
+|-------|----------|
+| `transcribe` | Local Whisper transcription |
+| `privacy` | PII scrubbing (openadapt-privacy) |
+| `all` | Everything |
+## Development
+```bash
+uv sync --extra dev
+uv run pytest
+```
+## License
+MIT