nedo-vision-worker 1.0.0 (nedo_vision_worker-1.0.0-py3-none-any.whl)

This diff shows the content of publicly available package versions released to a supported registry. It is provided for informational purposes only and reflects the changes between package versions as they appear in the public registry.
Files changed (92)
  1. nedo_vision_worker/__init__.py +10 -0
  2. nedo_vision_worker/cli.py +195 -0
  3. nedo_vision_worker/config/ConfigurationManager.py +196 -0
  4. nedo_vision_worker/config/__init__.py +1 -0
  5. nedo_vision_worker/database/DatabaseManager.py +219 -0
  6. nedo_vision_worker/database/__init__.py +1 -0
  7. nedo_vision_worker/doctor.py +453 -0
  8. nedo_vision_worker/initializer/AppInitializer.py +78 -0
  9. nedo_vision_worker/initializer/__init__.py +1 -0
  10. nedo_vision_worker/models/__init__.py +15 -0
  11. nedo_vision_worker/models/ai_model.py +29 -0
  12. nedo_vision_worker/models/auth.py +14 -0
  13. nedo_vision_worker/models/config.py +9 -0
  14. nedo_vision_worker/models/dataset_source.py +30 -0
  15. nedo_vision_worker/models/logs.py +9 -0
  16. nedo_vision_worker/models/ppe_detection.py +39 -0
  17. nedo_vision_worker/models/ppe_detection_label.py +20 -0
  18. nedo_vision_worker/models/restricted_area_violation.py +20 -0
  19. nedo_vision_worker/models/user.py +10 -0
  20. nedo_vision_worker/models/worker_source.py +19 -0
  21. nedo_vision_worker/models/worker_source_pipeline.py +21 -0
  22. nedo_vision_worker/models/worker_source_pipeline_config.py +24 -0
  23. nedo_vision_worker/models/worker_source_pipeline_debug.py +15 -0
  24. nedo_vision_worker/models/worker_source_pipeline_detection.py +14 -0
  25. nedo_vision_worker/protos/AIModelService_pb2.py +46 -0
  26. nedo_vision_worker/protos/AIModelService_pb2_grpc.py +140 -0
  27. nedo_vision_worker/protos/DatasetSourceService_pb2.py +46 -0
  28. nedo_vision_worker/protos/DatasetSourceService_pb2_grpc.py +140 -0
  29. nedo_vision_worker/protos/HumanDetectionService_pb2.py +44 -0
  30. nedo_vision_worker/protos/HumanDetectionService_pb2_grpc.py +140 -0
  31. nedo_vision_worker/protos/PPEDetectionService_pb2.py +46 -0
  32. nedo_vision_worker/protos/PPEDetectionService_pb2_grpc.py +140 -0
  33. nedo_vision_worker/protos/VisionWorkerService_pb2.py +72 -0
  34. nedo_vision_worker/protos/VisionWorkerService_pb2_grpc.py +471 -0
  35. nedo_vision_worker/protos/WorkerSourcePipelineService_pb2.py +64 -0
  36. nedo_vision_worker/protos/WorkerSourcePipelineService_pb2_grpc.py +312 -0
  37. nedo_vision_worker/protos/WorkerSourceService_pb2.py +50 -0
  38. nedo_vision_worker/protos/WorkerSourceService_pb2_grpc.py +183 -0
  39. nedo_vision_worker/protos/__init__.py +1 -0
  40. nedo_vision_worker/repositories/AIModelRepository.py +44 -0
  41. nedo_vision_worker/repositories/DatasetSourceRepository.py +150 -0
  42. nedo_vision_worker/repositories/PPEDetectionRepository.py +112 -0
  43. nedo_vision_worker/repositories/RestrictedAreaRepository.py +88 -0
  44. nedo_vision_worker/repositories/WorkerSourcePipelineDebugRepository.py +90 -0
  45. nedo_vision_worker/repositories/WorkerSourcePipelineDetectionRepository.py +48 -0
  46. nedo_vision_worker/repositories/WorkerSourcePipelineRepository.py +174 -0
  47. nedo_vision_worker/repositories/WorkerSourceRepository.py +46 -0
  48. nedo_vision_worker/repositories/__init__.py +1 -0
  49. nedo_vision_worker/services/AIModelClient.py +362 -0
  50. nedo_vision_worker/services/ConnectionInfoClient.py +57 -0
  51. nedo_vision_worker/services/DatasetSourceClient.py +88 -0
  52. nedo_vision_worker/services/FileToRTMPServer.py +78 -0
  53. nedo_vision_worker/services/GrpcClientBase.py +155 -0
  54. nedo_vision_worker/services/GrpcClientManager.py +141 -0
  55. nedo_vision_worker/services/ImageUploadClient.py +82 -0
  56. nedo_vision_worker/services/PPEDetectionClient.py +108 -0
  57. nedo_vision_worker/services/RTSPtoRTMPStreamer.py +98 -0
  58. nedo_vision_worker/services/RestrictedAreaClient.py +100 -0
  59. nedo_vision_worker/services/SystemUsageClient.py +77 -0
  60. nedo_vision_worker/services/VideoStreamClient.py +161 -0
  61. nedo_vision_worker/services/WorkerSourceClient.py +215 -0
  62. nedo_vision_worker/services/WorkerSourcePipelineClient.py +393 -0
  63. nedo_vision_worker/services/WorkerSourceUpdater.py +134 -0
  64. nedo_vision_worker/services/WorkerStatusClient.py +65 -0
  65. nedo_vision_worker/services/__init__.py +1 -0
  66. nedo_vision_worker/util/HardwareID.py +104 -0
  67. nedo_vision_worker/util/ImageUploader.py +92 -0
  68. nedo_vision_worker/util/Networking.py +94 -0
  69. nedo_vision_worker/util/PlatformDetector.py +50 -0
  70. nedo_vision_worker/util/SystemMonitor.py +299 -0
  71. nedo_vision_worker/util/VideoProbeUtil.py +120 -0
  72. nedo_vision_worker/util/__init__.py +1 -0
  73. nedo_vision_worker/worker/CoreActionWorker.py +125 -0
  74. nedo_vision_worker/worker/DataSenderWorker.py +168 -0
  75. nedo_vision_worker/worker/DataSyncWorker.py +143 -0
  76. nedo_vision_worker/worker/DatasetFrameSender.py +208 -0
  77. nedo_vision_worker/worker/DatasetFrameWorker.py +412 -0
  78. nedo_vision_worker/worker/PPEDetectionManager.py +86 -0
  79. nedo_vision_worker/worker/PipelineActionWorker.py +129 -0
  80. nedo_vision_worker/worker/PipelineImageWorker.py +116 -0
  81. nedo_vision_worker/worker/RabbitMQListener.py +170 -0
  82. nedo_vision_worker/worker/RestrictedAreaManager.py +85 -0
  83. nedo_vision_worker/worker/SystemUsageManager.py +111 -0
  84. nedo_vision_worker/worker/VideoStreamWorker.py +139 -0
  85. nedo_vision_worker/worker/WorkerManager.py +155 -0
  86. nedo_vision_worker/worker/__init__.py +1 -0
  87. nedo_vision_worker/worker_service.py +264 -0
  88. nedo_vision_worker-1.0.0.dist-info/METADATA +563 -0
  89. nedo_vision_worker-1.0.0.dist-info/RECORD +92 -0
  90. nedo_vision_worker-1.0.0.dist-info/WHEEL +5 -0
  91. nedo_vision_worker-1.0.0.dist-info/entry_points.txt +2 -0
  92. nedo_vision_worker-1.0.0.dist-info/top_level.txt +1 -0
nedo_vision_worker/worker/DatasetFrameSender.py
@@ -0,0 +1,208 @@
+import os
+import json
+import logging
+import time
+from pathlib import Path
+from typing import List, Dict, Optional
+from ..services.DatasetSourceClient import DatasetSourceClient
+from ..database.DatabaseManager import _get_storage_paths
+
+logger = logging.getLogger(__name__)
+
+class DatasetFrameSender:
+    """Handles batched sending of saved dataset frames to the backend."""
+
+    def __init__(self, server_host: str, token: str):
+        """
+        Initialize the Dataset Frame Sender.
+
+        Args:
+            server_host (str): Server host for sending frames
+            token (str): Authentication token
+        """
+        self.server_host = server_host
+        self.token = token
+        self.client = DatasetSourceClient(server_host)
+
+        # Get storage paths
+        storage_paths = _get_storage_paths()
+        self.dataset_frames_path = storage_paths["files"] / "dataset_frames"
+
+        # Track sent frames to avoid duplicates
+        self.sent_frames = set()
+
+    def send_pending_frames(self, max_batch_size: int = 10) -> Dict[str, int]:
+        """
+        Send pending dataset frames in batches.
+
+        Args:
+            max_batch_size (int): Maximum number of frames to send in one batch
+
+        Returns:
+            Dict[str, int]: Statistics of sent frames per dataset source
+        """
+        stats = {}
+
+        try:
+            if not self.dataset_frames_path.exists():
+                return stats
+
+            # Find all dataset source directories
+            for dataset_source_dir in self.dataset_frames_path.iterdir():
+                if not dataset_source_dir.is_dir():
+                    continue
+
+                dataset_source_id = dataset_source_dir.name
+                sent_count = self._send_frames_for_dataset_source(
+                    dataset_source_dir,
+                    dataset_source_id,
+                    max_batch_size
+                )
+
+                if sent_count > 0:
+                    stats[dataset_source_id] = sent_count
+
+        except Exception as e:
+            logger.error(f"🚨 [APP] Error sending pending frames: {e}")
+
+        return stats
+
+    def _send_frames_for_dataset_source(self, dataset_source_dir: Path, dataset_source_id: str, max_batch_size: int) -> int:
+        """
+        Send frames for a specific dataset source.
+
+        Args:
+            dataset_source_dir (Path): Directory containing frames for this dataset source
+            dataset_source_id (str): ID of the dataset source
+            max_batch_size (int): Maximum frames to send in one batch
+
+        Returns:
+            int: Number of frames sent
+        """
+        sent_count = 0
+
+        try:
+            # Find all frame files (jpg) that haven't been sent yet
+            frame_files = []
+            for file_path in dataset_source_dir.glob("*.jpg"):
+                frame_uuid = file_path.stem.split('_')[0]  # Extract UUID from filename
+
+                if frame_uuid not in self.sent_frames:
+                    metadata_path = file_path.with_suffix('.json')
+                    if metadata_path.exists():
+                        frame_files.append((file_path, metadata_path, frame_uuid))
+
+            # Sort by the capture timestamp embedded in the filename ({uuid}_{timestamp}.jpg)
+            frame_files.sort(key=lambda x: int(x[0].stem.split('_')[1]))
+
+            # Send frames in batches
+            for i in range(0, len(frame_files), max_batch_size):
+                batch = frame_files[i:i + max_batch_size]
+                if self._send_frame_batch(batch, dataset_source_id):
+                    sent_count += len(batch)
+
+        except Exception as e:
+            logger.error(f"🚨 [APP] Error sending frames for dataset source {dataset_source_id}: {e}")
+
+        return sent_count
+
+    def _send_frame_batch(self, frame_batch: List[tuple], dataset_source_id: str) -> bool:
+        """
+        Send a batch of frames to the backend.
+
+        Args:
+            frame_batch (List[tuple]): List of (file_path, metadata_path, frame_uuid) tuples
+            dataset_source_id (str): ID of the dataset source
+
+        Returns:
+            bool: True if batch was sent successfully
+        """
+        try:
+            for file_path, metadata_path, frame_uuid in frame_batch:
+                # Read frame data
+                with open(file_path, 'rb') as f:
+                    frame_bytes = f.read()
+
+                # Read metadata
+                with open(metadata_path, 'r') as f:
+                    metadata = json.load(f)
+
+                # Send frame to backend
+                response = self.client.send_dataset_frame(
+                    dataset_source_id=metadata["dataset_source_id"],
+                    uuid=metadata["frame_uuid"],
+                    image=frame_bytes,
+                    timestamp=metadata["timestamp"],
+                    token=self.token
+                )
+
+                if response and response.get("success"):
+                    # Mark as sent and clean up local files
+                    self.sent_frames.add(frame_uuid)
+                    self._cleanup_sent_frame(file_path, metadata_path)
+                    logger.debug(f"✅ [APP] Sent frame {frame_uuid} for dataset source {dataset_source_id}")
+                else:
+                    error_message = response.get("message", "Unknown error") if response else "Unknown error"
+
+                    # Handle specific error cases
+                    if "DatasetSource not found" in error_message:
+                        logger.warning(f"🗑️ [APP] Dataset source {dataset_source_id} not found, cleaning up orphaned frame {frame_uuid}")
+                        # Mark as sent to avoid retry loops and clean up
+                        self.sent_frames.add(frame_uuid)
+                        self._cleanup_sent_frame(file_path, metadata_path)
+                    else:
+                        logger.error(f"❌ [APP] Failed to send frame {frame_uuid}: {error_message}")
+                        return False
+
+            return True
+
+        except Exception as e:
+            logger.error(f"🚨 [APP] Error sending frame batch: {e}")
+            return False
+
+    def _cleanup_sent_frame(self, file_path: Path, metadata_path: Path):
+        """
+        Clean up local files after successful send.
+
+        Args:
+            file_path (Path): Path to the frame file
+            metadata_path (Path): Path to the metadata file
+        """
+        try:
+            # Remove frame file
+            if file_path.exists():
+                file_path.unlink()
+
+            # Remove metadata file
+            if metadata_path.exists():
+                metadata_path.unlink()
+
+        except Exception as e:
+            logger.error(f"🚨 [APP] Error cleaning up sent frame: {e}")
+
+    def get_pending_frame_count(self) -> int:
+        """
+        Get the total number of pending frames to be sent.
+
+        Returns:
+            int: Number of pending frames
+        """
+        pending_count = 0
+
+        try:
+            if not self.dataset_frames_path.exists():
+                return 0
+
+            for dataset_source_dir in self.dataset_frames_path.iterdir():
+                if not dataset_source_dir.is_dir():
+                    continue
+
+                for file_path in dataset_source_dir.glob("*.jpg"):
+                    frame_uuid = file_path.stem.split('_')[0]
+                    if frame_uuid not in self.sent_frames:
+                        pending_count += 1
+
+        except Exception as e:
+            logger.error(f"🚨 [APP] Error counting pending frames: {e}")
+
+        return pending_count
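
The sender pairs with the DatasetFrameWorker below through an on-disk contract: each captured frame is written as {frame_uuid}_{timestamp}.jpg with a .json metadata sidecar under files/dataset_frames/<dataset_source_id>/, and the sender drains whatever is on disk. A minimal driver loop might look like the sketch below; the host, token, and 60-second cadence are illustrative assumptions, not values shipped in the wheel.

    import time
    from nedo_vision_worker.worker.DatasetFrameSender import DatasetFrameSender

    # Hypothetical endpoint and token; real values come from the worker configuration.
    sender = DatasetFrameSender(server_host="grpc.example.com:50051", token="<auth-token>")

    while True:
        if sender.get_pending_frame_count() > 0:
            # Returns per-dataset-source counts of frames actually sent.
            stats = sender.send_pending_frames(max_batch_size=10)
            for source_id, count in stats.items():
                print(f"sent {count} frame(s) for dataset source {source_id}")
        time.sleep(60)  # assumed drain cadence; tune to the capture rate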
nedo_vision_worker/worker/DatasetFrameWorker.py
@@ -0,0 +1,412 @@
+import threading
+import time
+import logging
+import uuid
+import json
+import shutil
+from datetime import datetime
+from typing import Dict
+from ..services.WorkerSourcePipelineClient import WorkerSourcePipelineClient
+from ..services.GrpcClientManager import GrpcClientManager
+from ..services.DatasetSourceClient import DatasetSourceClient
+from ..repositories.DatasetSourceRepository import DatasetSourceRepository
+from ..database.DatabaseManager import get_storage_path
+
+logger = logging.getLogger(__name__)
+
+def safe_join_thread(thread, timeout=5):
+    """Safely join a thread, avoiding RuntimeError when joining the current thread."""
+    if thread and thread != threading.current_thread():
+        thread.join(timeout=timeout)
+    elif thread == threading.current_thread():
+        logger.info("🛑 [APP] Thread stopping from within itself, skipping join.")
+
+class DatasetSourceThread:
+    """Individual thread for handling a single dataset source."""
+
+    def __init__(self, dataset_source, pipeline_client, storage_path):
+        self.dataset_source = dataset_source
+        self.pipeline_client = pipeline_client
+        self.storage_path = storage_path
+        self.thread = None
+        self.stop_event = threading.Event()
+        self.last_frame_time = 0
+        self.lock = threading.Lock()
+
+        # Create storage directory for this dataset source
+        self.dataset_storage_path = storage_path / "dataset_frames" / dataset_source.id
+        self.dataset_storage_path.mkdir(parents=True, exist_ok=True)
+
+        # Track consecutive failures
+        self.consecutive_failures = 0
+        self.max_consecutive_failures = 5
+
+    def start(self):
+        """Start the dataset source thread."""
+        if self.thread and self.thread.is_alive():
+            logger.warning(f"⚠️ [APP] Thread for dataset source {self.dataset_source.id} is already running.")
+            return
+
+        self.stop_event.clear()
+        self.consecutive_failures = 0  # Reset failure counter
+        self.thread = threading.Thread(
+            target=self._run,
+            daemon=True,
+            name=f"DatasetSource-{self.dataset_source.id}"
+        )
+        self.thread.start()
+        logger.info(f"🚀 [APP] Started thread for dataset source {self.dataset_source.id} ({self.dataset_source.dataset_name})")
+
+    def stop(self):
+        """Stop the dataset source thread."""
+        if not self.thread or not self.thread.is_alive():
+            return
+
+        self.stop_event.set()
+        safe_join_thread(self.thread)
+        logger.info(f"🛑 [APP] Stopped thread for dataset source {self.dataset_source.id}")
+
+    def _run(self):
+        """Main loop for this dataset source."""
+        try:
+            while not self.stop_event.is_set():
+                current_time = time.time()
+
+                # Check if it's time to capture a frame
+                if (current_time - self.last_frame_time) >= self.dataset_source.sampling_interval:
+                    success = self._capture_frame()
+
+                    with self.lock:
+                        self.last_frame_time = current_time
+                        if success:
+                            self.consecutive_failures = 0  # Reset on success
+                        else:
+                            self.consecutive_failures += 1
+
+                    # If too many consecutive failures, log a warning and pause
+                    if self.consecutive_failures >= self.max_consecutive_failures:
+                        logger.warning(f"⚠️ [APP] Dataset source {self.dataset_source.id} has {self.consecutive_failures} consecutive failures. Pausing for 30 seconds.")
+                        time.sleep(30)  # Pause for 30 seconds
+                        self.consecutive_failures = 0  # Reset after pause
+
+                # Sleep for a shorter interval to be more responsive
+                time.sleep(min(1, self.dataset_source.sampling_interval / 10))
+
+        except Exception as e:
+            logger.error(f"🚨 [APP] Error in dataset source thread {self.dataset_source.id}: {e}", exc_info=True)
+
+    def _capture_frame(self):
+        """Capture and save a frame for this dataset source. Returns True if successful."""
+        try:
+            # Get frame from source
+            frame_bytes = self._get_frame_from_source(self.dataset_source.worker_source_url)
+
+            if frame_bytes:
+                # Generate unique filename
+                timestamp = int(time.time() * 1000)
+                frame_uuid = str(uuid.uuid4())
+                filename = f"{frame_uuid}_{timestamp}.jpg"
+                file_path = self.dataset_storage_path / filename
+
+                # Save frame to local storage
+                with open(file_path, 'wb') as f:
+                    f.write(frame_bytes)
+
+                # Create metadata file
+                metadata = {
+                    "dataset_source_id": self.dataset_source.id,
+                    "dataset_id": self.dataset_source.dataset_id,
+                    "worker_source_id": self.dataset_source.worker_source_id,
+                    "dataset_name": self.dataset_source.dataset_name,
+                    "worker_source_name": self.dataset_source.worker_source_name,
+                    "worker_source_url": self.dataset_source.worker_source_url,
+                    "frame_uuid": frame_uuid,
+                    "timestamp": timestamp,
+                    "captured_at": datetime.utcnow().isoformat()
+                }
+
+                metadata_path = file_path.with_suffix('.json')
+                # Sidecar read back by DatasetFrameSender when draining frames
+                with open(metadata_path, 'w') as f:
+                    json.dump(metadata, f, indent=2)
+
+                logger.info(f"📸 [APP] Captured frame for {self.dataset_source.dataset_name} (ID: {self.dataset_source.id})")
+                return True
+            else:
+                logger.warning(f"⚠️ [APP] Could not get frame from source {self.dataset_source.worker_source_url}")
+                return False
+
+        except Exception as e:
+            logger.error(f"🚨 [APP] Error capturing frame for {self.dataset_source.dataset_name}: {e}", exc_info=True)
+            return False
+
+    def _get_frame_from_source(self, source_url):
+        """Get a frame from the given source URL."""
+        try:
+            stream_type = self.pipeline_client._detect_stream_type(source_url)
+            if stream_type == "video_file":
+                logger.info(f"🎬 [APP] Capturing video frame from {source_url}")
+            elif stream_type == "image_file":
+                logger.info(f"🖼️ [APP] Capturing image frame from {source_url}")
+            elif stream_type in ["rtsp", "hls"]:
+                logger.info(f"📡 [APP] Capturing live stream frame from {source_url}")
+
+            frame_bytes = self.pipeline_client._get_single_frame_bytes(source_url)
+
+            if frame_bytes and stream_type == "video_file":
+                status = self.pipeline_client.get_video_positions_status()
+                for video_path, info in status.items():
+                    if info["duration"]:
+                        logger.info(f"📊 [APP] Video progress: {info['progress_percent']:.1f}% ({info['current_position']:.2f}s / {info['duration']:.2f}s)")
+
+            return frame_bytes
+        except Exception as e:
+            logger.error(f"🚨 [APP] Error getting frame from source {source_url}: {e}", exc_info=True)
+            return None
+
+class DatasetFrameWorker:
+    def __init__(self, config: dict):
+        """
+        Initialize the Dataset Frame Worker.
+
+        Args:
+            config (dict): Configuration object containing settings.
+        """
+        if not isinstance(config, dict):
+            raise ValueError("⚠️ [APP] config must be a dictionary.")
+
+        self.config = config
+        self.worker_id = self.config.get("worker_id")
+        self.server_host = self.config.get("server_host")
+        self.token = self.config.get("token")
+
+        if not self.worker_id:
+            raise ValueError("⚠️ [APP] Configuration is missing 'worker_id'.")
+        if not self.token:
+            raise ValueError("⚠️ [APP] Configuration is missing 'token'.")
+
+        self.dataset_source_repo = DatasetSourceRepository()
+
+        # Get shared client instance from the centralized manager
+        self.client_manager = GrpcClientManager.get_instance()
+        self.worker_source_pipeline_client = self.client_manager.get_client(WorkerSourcePipelineClient)
+
+        self.thread = None
+        self.stop_event = threading.Event()
+        self.lock = threading.Lock()
+
+        # Cache for dataset source threads
+        self.dataset_source_threads: Dict[str, DatasetSourceThread] = {}
+        self.last_sync_time = 0
+        self.sync_interval = 30  # Sync dataset sources every 30 seconds
+
+        # Thread for syncing dataset sources
+        self.sync_thread = None
+
+        # Sync lock to prevent multiple simultaneous sync operations
+        self.sync_lock = threading.Lock()
+
+        # Storage path for dataset frames
+        self.storage_path = get_storage_path("files")
+
+    def start(self):
+        """Start the Dataset Frame Worker."""
+        with self.lock:
+            if self.thread and self.thread.is_alive():
+                logger.warning("⚠️ [APP] Dataset Frame Worker is already running.")
+                return
+
+            self.stop_event.clear()
+
+            # Start sync thread
+            self.sync_thread = threading.Thread(target=self._sync_loop, daemon=True)
+            self.sync_thread.start()
+
+            # Start main worker thread
+            self.thread = threading.Thread(target=self._run, daemon=True)
+            self.thread.start()
+            logger.info(f"🚀 [APP] Dataset Frame Worker started (Device: {self.worker_id}).")
+
+    def stop(self):
+        """Stop the Dataset Frame Worker."""
+        with self.lock:
+            if not self.thread or not self.thread.is_alive():
+                logger.warning("⚠️ [APP] Dataset Frame Worker is not running.")
+                return
+
+            self.stop_event.set()
+
+            # Stop all dataset source threads
+            for thread in self.dataset_source_threads.values():
+                thread.stop()
+
+            # Wait for threads to stop
+            if self.thread:
+                safe_join_thread(self.thread)
+            if self.sync_thread:
+                safe_join_thread(self.sync_thread)
+
+            self.thread = None
+            self.sync_thread = None
+            logger.info(f"🛑 [APP] Dataset Frame Worker stopped (Device: {self.worker_id}).")
+
+    def _run(self):
+        """Main loop for managing dataset source threads."""
+        try:
+            while not self.stop_event.is_set():
+                self._manage_dataset_source_threads()
+                time.sleep(5)  # Check every 5 seconds
+        except Exception as e:
+            logger.error("🚨 [APP] Unexpected error in Dataset Frame Worker main loop.", exc_info=True)
+
+    def _sync_loop(self):
+        """Background thread for syncing dataset sources."""
+        try:
+            while not self.stop_event.is_set():
+                self._sync_dataset_sources()
+                time.sleep(self.sync_interval)
+        except Exception as e:
+            logger.error("🚨 [APP] Error in dataset source sync loop.", exc_info=True)
+
+    def _sync_dataset_sources(self):
+        """Sync dataset sources from the server."""
+        # Prevent multiple simultaneous sync operations
+        if not self.sync_lock.acquire(blocking=False):
+            logger.debug("🔄 [APP] Sync operation already in progress, skipping...")
+            return
+
+        try:
+            # Use the shared client instead of creating a new instance
+            client = self.client_manager.get_client(DatasetSourceClient, "DatasetSourceClient")
+            response = client.get_dataset_source_list(self.token)
+
+            if response and response.get("success"):
+                dataset_sources_data = response.get("data", [])
+                self.dataset_source_repo.sync_dataset_sources(dataset_sources_data)
+                self.last_sync_time = time.time()
+            else:
+                error_message = response.get("message", "Unknown error") if response else "Unknown error"
+                logger.error(f"❌ [APP] Failed to sync dataset sources: {error_message}")
+
+        except Exception as e:
+            logger.error("🚨 [APP] Error syncing dataset sources.", exc_info=True)
+        finally:
+            self.sync_lock.release()
+
+    def _cleanup_orphaned_frames(self, deleted_dataset_source_ids):
+        """Clean up frames for deleted dataset sources."""
+        try:
+            for dataset_source_id in deleted_dataset_source_ids:
+                orphaned_frames_path = self.storage_path / "dataset_frames" / dataset_source_id
+                if orphaned_frames_path.exists():
+                    shutil.rmtree(orphaned_frames_path)
+                    logger.info(f"🗑️ [APP] Cleaned up orphaned frames for deleted dataset source {dataset_source_id}")
+        except Exception as e:
+            logger.error(f"🚨 [APP] Error cleaning up orphaned frames: {e}", exc_info=True)
+
+    def _manage_dataset_source_threads(self):
+        """Manage dataset source threads based on current dataset sources."""
+        try:
+            # Get current dataset sources from the local database
+            dataset_sources = self.dataset_source_repo.get_all_dataset_sources()
+            current_dataset_source_ids = {ds.id for ds in dataset_sources}
+
+            # Stop threads for dataset sources that no longer exist
+            threads_to_remove = []
+            deleted_dataset_source_ids = []
+            for dataset_source_id, thread in self.dataset_source_threads.items():
+                if dataset_source_id not in current_dataset_source_ids:
+                    logger.info(f"🛑 [APP] Stopping thread for deleted dataset source {dataset_source_id}")
+                    thread.stop()
+                    threads_to_remove.append(dataset_source_id)
+                    deleted_dataset_source_ids.append(dataset_source_id)
+
+            for dataset_source_id in threads_to_remove:
+                del self.dataset_source_threads[dataset_source_id]
+
+            # Clean up orphaned frames for deleted dataset sources
+            if deleted_dataset_source_ids:
+                self._cleanup_orphaned_frames(deleted_dataset_source_ids)
+
+            # Process current dataset sources
+            for dataset_source in dataset_sources:
+                if dataset_source.id not in self.dataset_source_threads:
+                    # Create a new thread for a new dataset source
+                    logger.info(f"🆕 [APP] Creating new thread for dataset source {dataset_source.id} ({dataset_source.dataset_name})")
+                    thread = DatasetSourceThread(
+                        dataset_source=dataset_source,
+                        pipeline_client=self.worker_source_pipeline_client,
+                        storage_path=self.storage_path
+                    )
+                    self.dataset_source_threads[dataset_source.id] = thread
+                    thread.start()
+                else:
+                    # Update existing thread with new dataset source data
+                    existing_thread = self.dataset_source_threads[dataset_source.id]
+                    if self._dataset_source_changed(existing_thread.dataset_source, dataset_source):
+                        logger.info(f"🔄 [APP] Updating thread for dataset source {dataset_source.id} ({dataset_source.dataset_name})")
+                        # Stop the old thread
+                        existing_thread.stop()
+                        # Create a new thread with updated data
+                        new_thread = DatasetSourceThread(
+                            dataset_source=dataset_source,
+                            pipeline_client=self.worker_source_pipeline_client,
+                            storage_path=self.storage_path
+                        )
+                        self.dataset_source_threads[dataset_source.id] = new_thread
+                        new_thread.start()
+
+            # Log current status
+            active_threads = len([t for t in self.dataset_source_threads.values() if t.thread and t.thread.is_alive()])
+            logger.debug(f"📊 [APP] Dataset Frame Worker status: {active_threads} active threads, {len(dataset_sources)} total dataset sources")
+
+        except Exception as e:
+            logger.error("🚨 [APP] Error managing dataset source threads.", exc_info=True)
+
+    def _dataset_source_changed(self, old_dataset_source, new_dataset_source):
+        """Check if dataset source data has changed significantly."""
+        try:
+            # Compare relevant fields that would affect thread behavior
+            fields_to_compare = [
+                'worker_source_url',
+                'sampling_interval',
+                'dataset_name',
+                'worker_source_name',
+                'dataset_id',
+                'worker_source_id'
+            ]
+
+            for field in fields_to_compare:
+                old_value = getattr(old_dataset_source, field, None)
+                new_value = getattr(new_dataset_source, field, None)
+                if old_value != new_value:
+                    logger.debug(f"🔄 [APP] Dataset source {new_dataset_source.id} field '{field}' changed: {old_value} -> {new_value}")
+                    return True
+
+            return False
+
+        except Exception as e:
+            logger.error(f"🚨 [APP] Error comparing dataset sources: {e}", exc_info=True)
+            return True  # Assume changed if comparison fails
+
+    def get_status(self):
+        """Get current status of the dataset frame worker."""
+        try:
+            dataset_sources = self.dataset_source_repo.get_all_dataset_sources()
+            active_threads = [t for t in self.dataset_source_threads.values() if t.thread and t.thread.is_alive()]
+
+            return {
+                "total_dataset_sources": len(dataset_sources),
+                "active_threads": len(active_threads),
+                "thread_details": [
+                    {
+                        "dataset_source_id": t.dataset_source.id,
+                        "dataset_name": t.dataset_source.dataset_name,
+                        "is_alive": t.thread.is_alive() if t.thread else False,
+                        "consecutive_failures": t.consecutive_failures
+                    }
+                    for t in self.dataset_source_threads.values()
+                ]
+            }
+        except Exception as e:
+            logger.error(f"🚨 [APP] Error getting dataset frame worker status: {e}", exc_info=True)
+            return {"error": str(e)}