media-engine 0.1.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- cli/clip.py +79 -0
- cli/faces.py +91 -0
- cli/metadata.py +68 -0
- cli/motion.py +77 -0
- cli/objects.py +94 -0
- cli/ocr.py +93 -0
- cli/scenes.py +57 -0
- cli/telemetry.py +65 -0
- cli/transcript.py +76 -0
- media_engine/__init__.py +7 -0
- media_engine/_version.py +34 -0
- media_engine/app.py +80 -0
- media_engine/batch/__init__.py +56 -0
- media_engine/batch/models.py +99 -0
- media_engine/batch/processor.py +1131 -0
- media_engine/batch/queue.py +232 -0
- media_engine/batch/state.py +30 -0
- media_engine/batch/timing.py +321 -0
- media_engine/cli.py +17 -0
- media_engine/config.py +674 -0
- media_engine/extractors/__init__.py +75 -0
- media_engine/extractors/clip.py +401 -0
- media_engine/extractors/faces.py +459 -0
- media_engine/extractors/frame_buffer.py +351 -0
- media_engine/extractors/frames.py +402 -0
- media_engine/extractors/metadata/__init__.py +127 -0
- media_engine/extractors/metadata/apple.py +169 -0
- media_engine/extractors/metadata/arri.py +118 -0
- media_engine/extractors/metadata/avchd.py +208 -0
- media_engine/extractors/metadata/avchd_gps.py +270 -0
- media_engine/extractors/metadata/base.py +688 -0
- media_engine/extractors/metadata/blackmagic.py +139 -0
- media_engine/extractors/metadata/camera_360.py +276 -0
- media_engine/extractors/metadata/canon.py +290 -0
- media_engine/extractors/metadata/dji.py +371 -0
- media_engine/extractors/metadata/dv.py +121 -0
- media_engine/extractors/metadata/ffmpeg.py +76 -0
- media_engine/extractors/metadata/generic.py +119 -0
- media_engine/extractors/metadata/gopro.py +256 -0
- media_engine/extractors/metadata/red.py +305 -0
- media_engine/extractors/metadata/registry.py +114 -0
- media_engine/extractors/metadata/sony.py +442 -0
- media_engine/extractors/metadata/tesla.py +157 -0
- media_engine/extractors/motion.py +765 -0
- media_engine/extractors/objects.py +245 -0
- media_engine/extractors/objects_qwen.py +754 -0
- media_engine/extractors/ocr.py +268 -0
- media_engine/extractors/scenes.py +82 -0
- media_engine/extractors/shot_type.py +217 -0
- media_engine/extractors/telemetry.py +262 -0
- media_engine/extractors/transcribe.py +579 -0
- media_engine/extractors/translate.py +121 -0
- media_engine/extractors/vad.py +263 -0
- media_engine/main.py +68 -0
- media_engine/py.typed +0 -0
- media_engine/routers/__init__.py +15 -0
- media_engine/routers/batch.py +78 -0
- media_engine/routers/health.py +93 -0
- media_engine/routers/models.py +211 -0
- media_engine/routers/settings.py +87 -0
- media_engine/routers/utils.py +135 -0
- media_engine/schemas.py +581 -0
- media_engine/utils/__init__.py +5 -0
- media_engine/utils/logging.py +54 -0
- media_engine/utils/memory.py +49 -0
- media_engine-0.1.0.dist-info/METADATA +276 -0
- media_engine-0.1.0.dist-info/RECORD +70 -0
- media_engine-0.1.0.dist-info/WHEEL +4 -0
- media_engine-0.1.0.dist-info/entry_points.txt +11 -0
- media_engine-0.1.0.dist-info/licenses/LICENSE +21 -0
|
@@ -0,0 +1,232 @@
|
|
|
1
|
+
"""Queue management for batch processing."""
|
|
2
|
+
|
|
3
|
+
from __future__ import annotations
|
|
4
|
+
|
|
5
|
+
import logging
|
|
6
|
+
import threading
|
|
7
|
+
from datetime import datetime, timezone
|
|
8
|
+
from typing import TYPE_CHECKING
|
|
9
|
+
|
|
10
|
+
if TYPE_CHECKING:
|
|
11
|
+
from media_engine.batch.models import BatchRequest
|
|
12
|
+
|
|
13
|
+
from media_engine.batch.models import JOB_TTL_SECONDS
|
|
14
|
+
from media_engine.batch.state import (
|
|
15
|
+
batch_jobs,
|
|
16
|
+
batch_jobs_lock,
|
|
17
|
+
batch_queue,
|
|
18
|
+
batch_queue_lock,
|
|
19
|
+
set_batch_running,
|
|
20
|
+
)
|
|
21
|
+
|
|
22
|
+
logger = logging.getLogger(__name__)
|
|
23
|
+
|
|
24
|
+
|
|
25
|
+
def cleanup_expired_batch_jobs() -> int:
    """Drop completed/failed batch jobs whose TTL has elapsed.

    A job is expired when its status is terminal ("completed" or "failed"),
    it has a completion timestamp, and more than JOB_TTL_SECONDS have passed
    since that timestamp.

    Returns:
        Number of batch jobs removed.
    """
    reference_time = datetime.now(timezone.utc)
    stale_ids: list[str] = []

    with batch_jobs_lock:
        for job_id, job in batch_jobs.items():
            if job.status not in ("completed", "failed"):
                continue
            if job.completed_at is None:
                continue
            if (reference_time - job.completed_at).total_seconds() > JOB_TTL_SECONDS:
                stale_ids.append(job_id)
        for job_id in stale_ids:
            del batch_jobs[job_id]

    removed = len(stale_ids)
    if removed > 0:
        logger.info(f"Cleaned up {removed} expired batch jobs")

    return removed
|
|
48
|
+
|
|
49
|
+
|
|
50
|
+
def update_queue_positions() -> None:
    """Refresh the 1-based queue_position of every batch still in the queue."""
    # Lock order is queue -> jobs. Callers must not already hold either lock:
    # threading.Lock is not reentrant.
    with batch_queue_lock, batch_jobs_lock:
        for position, (queued_id, _request) in enumerate(batch_queue, start=1):
            job = batch_jobs.get(queued_id)
            if job is not None:
                job.queue_position = position
|
|
57
|
+
|
|
58
|
+
|
|
59
|
+
def start_next_batch() -> None:
    """Start the next batch from the queue if one exists.

    Called when a batch completes or fails. Sets batch_running = False
    if no more batches in queue.
    """
    # Imported lazily — processor imports from this package, so a top-level
    # import would presumably create a cycle (TODO confirm).
    from media_engine.batch.processor import run_batch_job

    with batch_queue_lock:
        if not batch_queue:
            # Nothing left to run; clear the running flag so the next
            # create_batch_sync() starts immediately.
            set_batch_running(False)
            logger.info("Batch queue empty, no more batches to run")
            return

        # Pop the next batch from queue
        next_batch_id, next_request = batch_queue.pop(0)
        logger.info(f"Starting next batch from queue: {next_batch_id}")

    # Update queue positions for remaining batches.
    # Must run after batch_queue_lock is released: update_queue_positions()
    # re-acquires it and threading.Lock is not reentrant.
    update_queue_positions()

    # Update batch status from queued to pending.
    # The id may legitimately be missing if the job record was deleted or
    # not yet registered; in that case the status update is skipped.
    with batch_jobs_lock:
        if next_batch_id in batch_jobs:
            batch_jobs[next_batch_id].status = "pending"
            batch_jobs[next_batch_id].queue_position = None

    # Start the batch in a new thread
    thread = threading.Thread(target=run_batch_job, args=(next_batch_id, next_request))
    thread.start()
|
|
89
|
+
|
|
90
|
+
|
|
91
|
+
def create_batch_sync(batch_id: str, request: BatchRequest) -> tuple[bool, int | None, str]:
    """Synchronous helper to create batch (runs in thread pool).

    Registers the batch in batch_jobs and either marks it startable (no batch
    currently running) or appends it to batch_queue.

    Args:
        batch_id: Unique id for the new batch.
        request: Batch request describing files and enabled extractors.

    Returns:
        (should_start, queue_position, status)
    """
    from pathlib import Path

    from media_engine.batch.models import BatchFileStatus, BatchJobStatus
    from media_engine.batch.state import is_batch_running, set_batch_running

    # Cleanup expired batch jobs
    cleanup_expired_batch_jobs()

    # Check if we should start immediately or queue.
    # The check-and-set of the running flag happens under batch_queue_lock so
    # two concurrent creates cannot both decide to start.
    with batch_queue_lock:
        should_start = not is_batch_running()
        if should_start:
            set_batch_running(True)
            queue_position = None
            status = "pending"
            logger.info(f"Starting batch {batch_id} immediately (no batch running)")
        else:
            # Add to queue
            batch_queue.append((batch_id, request))
            queue_position = len(batch_queue)  # 1-based position
            status = "queued"
            logger.info(f"Queued batch {batch_id} at position {queue_position}")

    # Build initial extractor status for each file
    # Order matches processing order in run_batch_job
    # frame_decode is enabled if any visual extractor needs it
    frame_decode_needed = any(
        [
            request.enable_objects,
            request.enable_faces,
            request.enable_ocr,
            request.enable_clip,
        ]
    )
    extractor_flags = [
        ("metadata", request.enable_metadata),
        ("telemetry", True),  # Always runs
        ("vad", request.enable_vad),
        ("motion", request.enable_motion),
        ("scenes", request.enable_scenes),
        ("frame_decode", frame_decode_needed),
        ("objects", request.enable_objects),
        ("faces", request.enable_faces),
        ("ocr", request.enable_ocr),
        ("clip", request.enable_clip),
        ("visual", request.enable_visual),
        ("transcript", request.enable_transcript),
    ]
    initial_extractor_status = {name: "pending" if enabled else "skipped" for name, enabled in extractor_flags}

    # NOTE(review): when queued, the id is appended to batch_queue above but
    # only registered in batch_jobs below. start_next_batch() tolerates a
    # popped id that is not yet in batch_jobs, but then skips its status
    # update — confirm this window is acceptable.
    batch = BatchJobStatus(
        batch_id=batch_id,
        status=status,
        queue_position=queue_position,
        files=[
            BatchFileStatus(
                file=f,
                filename=Path(f).name,
                status="pending",
                # Per-file copy so files can progress independently.
                extractor_status=initial_extractor_status.copy(),
            )
            for f in request.files
        ],
        created_at=datetime.now(timezone.utc),
    )

    with batch_jobs_lock:
        batch_jobs[batch_id] = batch

    return should_start, queue_position, status
|
|
167
|
+
|
|
168
|
+
|
|
169
|
+
def get_batch_sync(batch_id: str, status_only: bool = False):
    """Synchronous helper to get batch status (runs in thread pool).

    Args:
        batch_id: The batch ID to look up
        status_only: If True, return status/progress without large result data

    Returns:
        None if the batch is unknown; a stripped copy (empty per-file
        ``results``) when ``status_only`` is True; otherwise the live, shared
        BatchJobStatus object — callers must treat it as read-only.
    """
    # Imported inside the function; presumably to defer loading the models
    # module — confirm before hoisting to module level.
    from media_engine.batch.models import BatchFileStatus, BatchJobStatus

    with batch_jobs_lock:
        batch = batch_jobs.get(batch_id)
        if batch is None:
            return None

        if status_only:
            # Return a copy with results stripped out (keep status, progress, timings)
            return BatchJobStatus(
                batch_id=batch.batch_id,
                status=batch.status,
                queue_position=batch.queue_position,
                current_extractor=batch.current_extractor,
                progress=batch.progress,
                files=[
                    BatchFileStatus(
                        file=f.file,
                        filename=f.filename,
                        status=f.status,
                        results={},  # Empty - no large data
                        error=f.error,
                        timings=f.timings,
                        extractor_status=f.extractor_status,
                    )
                    for f in batch.files
                ],
                created_at=batch.created_at,
                completed_at=batch.completed_at,
                extractor_timings=batch.extractor_timings,
                elapsed_seconds=batch.elapsed_seconds,
                memory_mb=batch.memory_mb,
                peak_memory_mb=batch.peak_memory_mb,
            )

        return batch
|
|
212
|
+
|
|
213
|
+
|
|
214
|
+
def delete_batch_sync(batch_id: str) -> tuple[bool, bool]:
    """Synchronous helper to delete batch (runs in thread pool).

    Returns:
        (found, was_queued) - whether batch was found and if it was queued
    """
    with batch_jobs_lock:
        if batch_id not in batch_jobs:
            return False, False
        # Capture the queued flag before the record is gone.
        was_queued = batch_jobs[batch_id].status == "queued"
        del batch_jobs[batch_id]

    # If it was queued, remove from queue and update positions
    if was_queued:
        with batch_queue_lock:
            # Rebuild in place (slice assignment) so other references to the
            # shared list stay valid.
            batch_queue[:] = [(bid, req) for bid, req in batch_queue if bid != batch_id]
        # Must run after batch_queue_lock is released:
        # update_queue_positions() re-acquires it and threading.Lock is not
        # reentrant.
        update_queue_positions()

    return True, was_queued
|
|
@@ -0,0 +1,30 @@
|
|
|
1
|
+
"""Global state for batch processing."""
|
|
2
|
+
|
|
3
|
+
from __future__ import annotations
|
|
4
|
+
|
|
5
|
+
import threading
|
|
6
|
+
from typing import TYPE_CHECKING
|
|
7
|
+
|
|
8
|
+
if TYPE_CHECKING:
|
|
9
|
+
from media_engine.batch.models import BatchJobStatus, BatchRequest
|
|
10
|
+
|
|
11
|
+
# In-memory batch store.
# Maps batch_id -> BatchJobStatus; guard all access with batch_jobs_lock.
batch_jobs: dict[str, BatchJobStatus] = {}
batch_jobs_lock = threading.Lock()

# Batch queue - only one batch runs at a time, others wait in queue.
# Guard all access with batch_queue_lock.
batch_queue: list[tuple[str, BatchRequest]] = []  # (batch_id, request) tuples
batch_queue_lock = threading.Lock()

# Use mutable container for batch_running state:
# `from ... import name` copies the binding, so rebinding a plain module-level
# bool here would not be visible to modules that imported it. Mutating this
# dict via is_batch_running()/set_batch_running() keeps all importers in sync.
_batch_state = {"running": False}
|
|
21
|
+
|
|
22
|
+
|
|
23
|
+
def is_batch_running() -> bool:
    """Report whether a batch is currently being processed."""
    running = _batch_state["running"]
    return running
|
|
26
|
+
|
|
27
|
+
|
|
28
|
+
def set_batch_running(value: bool) -> None:
    """Record whether a batch is currently being processed."""
    _batch_state.update(running=value)
|
|
@@ -0,0 +1,321 @@
|
|
|
1
|
+
"""ETA prediction system for batch processing."""
|
|
2
|
+
|
|
3
|
+
from __future__ import annotations
|
|
4
|
+
|
|
5
|
+
import json
|
|
6
|
+
import logging
|
|
7
|
+
import threading
|
|
8
|
+
import time
|
|
9
|
+
from pathlib import Path
|
|
10
|
+
from typing import TYPE_CHECKING
|
|
11
|
+
|
|
12
|
+
if TYPE_CHECKING:
|
|
13
|
+
from media_engine.batch.models import BatchRequest
|
|
14
|
+
|
|
15
|
+
logger = logging.getLogger(__name__)
|
|
16
|
+
|
|
17
|
+
# Historical timing data for ETA predictions.
# Key: (extractor, resolution_bucket) -> list of processing times in seconds.
# record_timing() stores either raw seconds or seconds-per-unit rates,
# depending on the extractor. Guard all access with _timing_history_lock.
_timing_history: dict[tuple[str, str], list[float]] = {}
_timing_history_lock = threading.Lock()
_timing_history_dirty = False  # Track if we need to save
_timing_history_last_save = 0.0  # Last save timestamp (time.time())

# Keep last N samples per bucket for rolling average
_MAX_TIMING_SAMPLES = 20

# Timing history persistence
_TIMING_HISTORY_FILE = Path.home() / ".config" / "polybos" / "timing_history.json"
_TIMING_SAVE_INTERVAL = 30.0  # Save at most every 30 seconds
|
|
30
|
+
|
|
31
|
+
|
|
32
|
+
def load_timing_history() -> None:
    """Load timing history from disk on startup."""
    global _timing_history
    if not _TIMING_HISTORY_FILE.exists():
        return
    try:
        with open(_TIMING_HISTORY_FILE) as handle:
            raw = json.load(handle)
        with _timing_history_lock:
            for flat_key, samples in raw.items():
                # Keys were flattened to "extractor|resolution" for JSON;
                # anything not matching that shape is ignored.
                pieces = flat_key.split("|")
                if len(pieces) != 2:
                    continue
                extractor, resolution = pieces
                _timing_history[(extractor, resolution)] = samples[-_MAX_TIMING_SAMPLES:]
        logger.info(f"Loaded timing history: {len(_timing_history)} buckets")
    except Exception as e:
        logger.warning(f"Failed to load timing history: {e}")
|
|
50
|
+
|
|
51
|
+
|
|
52
|
+
def save_timing_history() -> None:
    """Save timing history to disk."""
    global _timing_history_dirty, _timing_history_last_save
    # NOTE(review): disk I/O happens with the lock held, so writers in
    # record_timing() block for the duration of the save.
    with _timing_history_lock:
        if not _timing_history:
            return
        # JSON cannot encode tuple keys, so flatten to "extractor|resolution".
        serializable = {f"{extractor}|{resolution}": samples for (extractor, resolution), samples in _timing_history.items()}
        try:
            _TIMING_HISTORY_FILE.parent.mkdir(parents=True, exist_ok=True)
            with open(_TIMING_HISTORY_FILE, "w") as handle:
                json.dump(serializable, handle, indent=2)
            _timing_history_dirty = False
            _timing_history_last_save = time.time()
            logger.debug(f"Saved timing history: {len(serializable)} buckets")
        except Exception as e:
            logger.warning(f"Failed to save timing history: {e}")
|
|
69
|
+
|
|
70
|
+
|
|
71
|
+
def get_resolution_bucket(width: int | None, height: int | None) -> str:
    """Get resolution bucket for timing predictions."""
    if width is None or height is None:
        return "unknown"
    pixel_count = width * height
    # Upper pixel bounds per named bucket (720p=1280x720, 1080p=1920x1080,
    # 1440p=2560x1440, 4k=3840x2160, 5k=5120x2880).
    thresholds = (
        (921600, "720p"),
        (2073600, "1080p"),
        (3686400, "1440p"),
        (8294400, "4k"),
        (14745600, "5k"),
    )
    for limit, bucket in thresholds:
        if pixel_count <= limit:
            return bucket
    return "8k+"
|
|
88
|
+
|
|
89
|
+
|
|
90
|
+
def record_timing(
    extractor: str,
    resolution_bucket: str,
    seconds: float,
    units: float | None = None,
) -> None:
    """Record processing rate for future ETA predictions.

    Args:
        extractor: Name of the extractor (transcript, visual, objects, etc.)
        resolution_bucket: Resolution category (720p, 1080p, 4k, etc.)
        seconds: Wall clock time to process
        units: Normalization units - depends on extractor:
            - transcript: duration in minutes (stores seconds per minute)
            - visual: number of timestamps (stores seconds per timestamp)
            - objects/faces/ocr/clip: number of frames (stores seconds per frame)
            - If None, stores raw seconds (for metadata, telemetry, etc.)
    """
    global _timing_history_dirty

    # Calculate rate (seconds per unit) or use raw seconds.
    # Falsy units (None or 0) fall back to raw seconds, which also avoids a
    # division by zero.
    if units and units > 0:
        rate = seconds / units
    else:
        rate = seconds

    key = (extractor, resolution_bucket)
    with _timing_history_lock:
        if key not in _timing_history:
            _timing_history[key] = []
        _timing_history[key].append(rate)
        # Keep only recent samples (rolling window of _MAX_TIMING_SAMPLES)
        if len(_timing_history[key]) > _MAX_TIMING_SAMPLES:
            _timing_history[key] = _timing_history[key][-_MAX_TIMING_SAMPLES:]
        sample_count = len(_timing_history[key])
        avg = sum(_timing_history[key]) / sample_count
        _timing_history_dirty = True

    unit_label = "/unit" if units else "s"
    logger.debug(f"Recorded timing: {extractor}@{resolution_bucket} = {rate:.2f}{unit_label} " f"(avg: {avg:.2f}{unit_label} from {sample_count} samples)")
    # Save periodically (not on every update to reduce disk I/O).
    # _timing_history_last_save is read without the lock; worst case is an
    # occasional extra save.
    if _timing_history_dirty and time.time() - _timing_history_last_save > _TIMING_SAVE_INTERVAL:
        save_timing_history()
|
|
133
|
+
|
|
134
|
+
|
|
135
|
+
def get_predicted_rate(extractor: str, resolution_bucket: str) -> float | None:
    """Get predicted processing rate based on historical data.

    Returns the average rate (seconds per unit) for the given extractor and resolution.
    Multiply by the number of units to get predicted time.
    """
    with _timing_history_lock:
        samples = _timing_history.get((extractor, resolution_bucket))
        if samples:
            return sum(samples) / len(samples)
    return None
|
|
146
|
+
|
|
147
|
+
|
|
148
|
+
# Default processing rates (seconds per unit) when no historical data.
# Used as fallback for ETA predictions in predict_extractor_time().
# Units vary by extractor: per file, per minute of video, per frame, or per
# timestamp — see the inline comments and record_timing() for details.
DEFAULT_RATES: dict[str, float] = {
    "metadata": 1.0,  # ~1 second per file
    "telemetry": 0.5,  # ~0.5 seconds per file
    "vad": 0.5,  # ~0.5 seconds per minute of video
    # Sub-extractors within visual_processing (per frame rates)
    "motion": 0.5,  # ~0.5 seconds per file (analyzes whole video)
    "scenes": 0.3,  # ~0.3 seconds per file
    "frame_decode": 0.05,  # ~0.05 seconds per frame
    "objects": 0.3,  # ~0.3 seconds per frame (YOLO)
    "faces": 0.2,  # ~0.2 seconds per frame
    "ocr": 0.3,  # ~0.3 seconds per frame
    "clip": 0.15,  # ~0.15 seconds per frame
    # Separate stages
    "visual": 5.0,  # ~5 seconds per timestamp (Qwen VLM is slow)
    "transcript": 3.0,  # ~3 seconds per minute of video
}

# Extractor processing order - must match run_batch_job()
EXTRACTOR_ORDER = [
    "metadata",
    "telemetry",
    "vad",
    "visual_processing",  # Combined: motion, scenes, frame_decode, objects, faces, ocr, clip
    "visual",  # Qwen VLM
    "transcript",
]
|
|
176
|
+
|
|
177
|
+
|
|
178
|
+
def _rate_or_default(extractor: str, resolution_bucket: str, fallback: float) -> float:
    """Historical average rate for (extractor, bucket); falls back to
    DEFAULT_RATES, then to *fallback* when neither has data."""
    rate = get_predicted_rate(extractor, resolution_bucket)
    if rate is None:
        rate = DEFAULT_RATES.get(extractor, fallback)
    return rate


def predict_extractor_time(
    extractor: str,
    resolution_bucket: str,
    duration_seconds: float,
    num_frames: int | None = None,
    num_timestamps: int | None = None,
    enabled_sub_extractors: set[str] | None = None,
) -> float:
    """Predict processing time for a single extractor on a single file.

    Args:
        extractor: Name of the extractor
        resolution_bucket: Resolution category (720p, 1080p, 4k, etc.)
        duration_seconds: Video duration in seconds
        num_frames: Number of frames to process (for frame-based extractors)
        num_timestamps: Number of timestamps for visual/VLM analysis
        enabled_sub_extractors: For visual_processing, which sub-extractors are enabled

    Returns:
        Predicted processing time in seconds
    """
    # Duration in minutes for duration-based extractors
    duration_minutes = duration_seconds / 60.0

    # Extractors whose cost scales with video duration
    if extractor in ("vad", "transcript"):
        return _rate_or_default(extractor, resolution_bucket, 1.0) * duration_minutes

    # visual_processing: sum up time for each enabled sub-extractor
    if extractor == "visual_processing":
        total_time = 0.0
        sub_extractors = enabled_sub_extractors or {"motion", "scenes", "frame_decode", "objects", "faces", "ocr", "clip"}

        # Smart sampling typically uses ~20-50 frames, not duration*2.
        # Use a conservative estimate when the caller did not supply a count.
        estimated_frames = num_frames if num_frames else min(50, max(10, int(duration_seconds / 2)))

        for sub in sub_extractors:
            rate = _rate_or_default(sub, resolution_bucket, 0.1)
            # motion/scenes record raw seconds per file; the remaining
            # sub-extractors record seconds per frame.
            if sub in ("motion", "scenes"):
                total_time += rate
            else:
                total_time += rate * estimated_frames

        return total_time

    # Visual/Qwen scales with the number of analyzed timestamps.
    if extractor == "visual":
        # NOTE(review): num_timestamps == 0 also falls back to the default of
        # 5 (truthiness test) — confirm that is intended.
        timestamps = num_timestamps if num_timestamps else 5
        return _rate_or_default(extractor, resolution_bucket, 5.0) * timestamps

    # Fixed-time extractors (metadata, telemetry)
    return _rate_or_default(extractor, resolution_bucket, 1.0)
|
|
245
|
+
|
|
246
|
+
|
|
247
|
+
def get_enabled_extractors_from_request(
    request: BatchRequest,
) -> tuple[set[str], set[str]]:
    """Get the set of enabled extractors from a batch request.

    Returns:
        Tuple of (main_extractors, sub_extractors within visual_processing)
    """
    enabled = {"metadata", "telemetry"}  # Always enabled
    sub_extractors: set[str] = set()

    if request.enable_vad:
        enabled.add("vad")

    # Sub-extractors within visual_processing. The frame-based ones also
    # require the shared frame_decode stage.
    if request.enable_motion:
        sub_extractors.add("motion")
    if request.enable_scenes:
        sub_extractors.add("scenes")
    for flag, frame_based in (
        (request.enable_objects, "objects"),
        (request.enable_faces, "faces"),
        (request.enable_ocr, "ocr"),
        (request.enable_clip, "clip"),
    ):
        if flag:
            sub_extractors.update({"frame_decode", frame_based})

    # visual_processing runs if any sub-extractor is enabled
    if sub_extractors:
        enabled.add("visual_processing")

    if request.enable_visual:
        enabled.add("visual")
    if request.enable_transcript:
        enabled.add("transcript")

    return enabled, sub_extractors
|
|
285
|
+
|
|
286
|
+
|
|
287
|
+
def calculate_queue_eta() -> tuple[float, int]:
    """Calculate total ETA for all queued batches.

    Returns: (total_seconds, batch_count)
    """
    from media_engine.batch.state import batch_queue, batch_queue_lock

    total_seconds = 0.0
    queued_batches = 0

    with batch_queue_lock:
        for _batch_id, queued_request in batch_queue:
            queued_batches += 1
            enabled, sub_extractors = get_enabled_extractors_from_request(queued_request)

            for _path in queued_request.files:
                # Metadata has not run for queued files yet, so assume a
                # typical clip: one minute of 1080p footage.
                assumed_duration = 60.0
                assumed_resolution = "1080p"

                for ext in enabled:
                    if ext not in EXTRACTOR_ORDER:
                        continue
                    total_seconds += predict_extractor_time(
                        ext,
                        assumed_resolution,
                        assumed_duration,
                        enabled_sub_extractors=sub_extractors if ext == "visual_processing" else None,
                    )

    return total_seconds, queued_batches
|
|
318
|
+
|
|
319
|
+
|
|
320
|
+
# Load timing history on module import
|
|
321
|
+
load_timing_history()
|
media_engine/cli.py
ADDED
|
@@ -0,0 +1,17 @@
|
|
|
1
|
+
"""CLI entry point for meng-server."""
|
|
2
|
+
|
|
3
|
+
import uvicorn
|
|
4
|
+
|
|
5
|
+
|
|
6
|
+
def run_server(host: str = "0.0.0.0", port: int = 8001) -> None:
    """Run the Media Engine API server.

    Args:
        host: Interface to bind. Defaults to all interfaces ("0.0.0.0") —
            pass "127.0.0.1" to restrict the API to local access.
        port: TCP port to listen on.
    """
    uvicorn.run(
        "media_engine.main:app",
        host=host,
        port=port,
        reload=False,  # production entry point; no auto-reload
    )
|
|
14
|
+
|
|
15
|
+
|
|
16
|
+
# Allow direct execution (python -m media_engine.cli or running the file).
if __name__ == "__main__":
    run_server()
|