endoreg-db 0.8.4.2__py3-none-any.whl → 0.8.4.3__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of endoreg-db might be problematic. Click here for more details.
- endoreg_db/data/ai_model_meta/default_multilabel_classification.yaml +23 -1
- endoreg_db/data/setup_config.yaml +38 -0
- endoreg_db/management/commands/load_ai_model_data.py +17 -15
- endoreg_db/management/commands/setup_endoreg_db.py +207 -39
- endoreg_db/management/commands/validate_ai_models.py +124 -0
- endoreg_db/models/medical/hardware/endoscopy_processor.py +10 -1
- endoreg_db/models/metadata/model_meta_logic.py +116 -53
- endoreg_db/services/video_import.py +172 -179
- endoreg_db/utils/setup_config.py +177 -0
- {endoreg_db-0.8.4.2.dist-info → endoreg_db-0.8.4.3.dist-info}/METADATA +1 -1
- {endoreg_db-0.8.4.2.dist-info → endoreg_db-0.8.4.3.dist-info}/RECORD +13 -10
- {endoreg_db-0.8.4.2.dist-info → endoreg_db-0.8.4.3.dist-info}/WHEEL +0 -0
- {endoreg_db-0.8.4.2.dist-info → endoreg_db-0.8.4.3.dist-info}/licenses/LICENSE +0 -0
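For orientation, a minimal usage sketch of the reworked service in endoreg_db/services/video_import.py, based on the signatures visible in the diff below; the file path, center name, processor name, and flag values are placeholders, and a configured Django environment is assumed:

# Illustrative sketch only: exercises the reworked video import service.
# The path, center, and processor names are placeholders, not values
# shipped with the package.
from pathlib import Path

from endoreg_db.services.video_import import VideoImportService

service = VideoImportService()
video = service.import_and_anonymize(
    file_path=Path("/data/import/example_case.mp4"),  # hypothetical path
    center_name="example_center",                      # hypothetical center
    processor_name="example_processor",                # hypothetical processor
    save_video=True,
    delete_source=False,
)
if video is None:
    print("Skipped: file already processed or locked by another worker")
else:
    print(f"Imported VideoFile {video.uuid}")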
@@ -8,6 +8,7 @@ Changelog:
 October 14, 2025: Added file locking mechanism to prevent race conditions
 during concurrent video imports (matches PDF import pattern)
 """
+
 from datetime import date
 import logging
 import sys
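The changelog entry above refers to the lock-file guard added to VideoImportService._file_lock further down. A rough, self-contained sketch of that pattern, assuming atomic O_CREAT | O_EXCL creation and the 600 s stale / 90 s wait thresholds named in this diff; the authoritative logic is in the _file_lock hunks below:

# Minimal sketch of the lock-file pattern described in the changelog; the
# helper name and open flags are assumptions, not the package's code.
import os
import time
from contextlib import contextmanager
from pathlib import Path

STALE_LOCK_SECONDS = 600     # "600s timeout" from the class docstring
MAX_LOCK_WAIT_SECONDS = 90   # wait up to 90s for a non-stale lock to clear

@contextmanager
def file_lock(path: Path):
    lock_path = path.with_suffix(path.suffix + ".lock")
    deadline = time.time() + MAX_LOCK_WAIT_SECONDS
    fd = None
    try:
        while True:
            try:
                # O_CREAT | O_EXCL makes creation atomic: only one worker wins.
                fd = os.open(lock_path, os.O_CREAT | os.O_EXCL | os.O_WRONLY)
                break
            except FileExistsError:
                try:
                    age = time.time() - lock_path.stat().st_mtime
                except FileNotFoundError:
                    age = None  # lock vanished between attempts; retry
                if age is not None and age > STALE_LOCK_SECONDS:
                    lock_path.unlink(missing_ok=True)  # reclaim stale lock
                    continue
                if time.time() >= deadline:
                    raise ValueError(f"File already being processed: {path}")
                time.sleep(1.0)
        os.write(fd, b"lock")
        yield
    finally:
        if fd is not None:
            # Only the worker that actually acquired the lock removes it.
            os.close(fd)
            lock_path.unlink(missing_ok=True)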
@@ -18,7 +19,6 @@ from contextlib import contextmanager
 from pathlib import Path
 from typing import Union, Dict, Any, Optional, List, Tuple
 from django.db import transaction
-from lx_anonymizer import FrameCleaner
 from moviepy import video
 from endoreg_db.models import VideoFile, SensitiveMeta
 from endoreg_db.utils.paths import STORAGE_DIR, VIDEO_DIR, ANONYM_VIDEO_DIR
@@ -35,50 +35,58 @@ MAX_LOCK_WAIT_SECONDS = 90 # New: wait up to 90s for a non-stale lock to clear
 logger = logging.getLogger(__name__)


-class VideoImportService():
+class VideoImportService:
     """
     Service for importing and anonymizing video files.
     Uses a central video instance pattern for cleaner state management.
-
+
     Features (October 14, 2025):
     - File locking to prevent concurrent processing of the same video
     - Stale lock detection and reclamation (600s timeout)
     - Hash-based duplicate detection
     - Graceful fallback processing without lx_anonymizer
     """
-
+
     def __init__(self, project_root: Optional[Path] = None):
-
         # Set up project root path
         if project_root:
             self.project_root = Path(project_root)
         else:
             self.project_root = Path(__file__).parent.parent.parent.parent
-
+
         # Track processed files to prevent duplicates
-
-
+        try:
+            # Ensure anonym_video directory exists before listing files
+            anonym_video_dir = Path(ANONYM_VIDEO_DIR)
+            if anonym_video_dir.exists():
+                self.processed_files = set(str(anonym_video_dir / file) for file in os.listdir(ANONYM_VIDEO_DIR))
+            else:
+                logger.info(f"Creating anonym_videos directory: {anonym_video_dir}")
+                anonym_video_dir.mkdir(parents=True, exist_ok=True)
+                self.processed_files = set()
+        except Exception as e:
+            logger.warning(f"Failed to initialize processed files tracking: {e}")
+            self.processed_files = set()
+
         # Central video instance and processing context
         self.current_video: Optional[VideoFile] = None
         self.processing_context: Dict[str, Any] = {}
-
+
         self.delete_source = True
-
+
         self.logger = logging.getLogger(__name__)
-
-        self.cleaner = None # This gets instantiated in the perform_frame_cleaning method

     def _require_current_video(self) -> VideoFile:
         """Return the current VideoFile or raise if it has not been initialized."""
         if self.current_video is None:
             raise RuntimeError("Current video instance is not set")
         return self.current_video
-
+
     @contextmanager
     def _file_lock(self, path: Path):
         """
         Create a file lock to prevent duplicate processing of the same video.
-
+
         This context manager creates a .lock file alongside the video file.
         If the lock file already exists, it checks if it's stale (older than
         STALE_LOCK_SECONDS) and reclaims it if necessary. If it's not stale,
@@ -102,24 +110,21 @@ class VideoImportService():
                     except FileNotFoundError:
                         # Race: lock removed between exists and stat; retry acquire in next loop
                         age = None
-
+
                     if age is not None and age > STALE_LOCK_SECONDS:
                         try:
-                            logger.warning(
-                                "Stale lock detected for %s (age %.0fs). Reclaiming lock...",
-                                path, age
-                            )
+                            logger.warning("Stale lock detected for %s (age %.0fs). Reclaiming lock...", path, age)
                             lock_path.unlink()
                         except Exception as e:
                             logger.warning("Failed to remove stale lock %s: %s", lock_path, e)
                         # Loop continues and retries acquire immediately
                         continue
-
+
                     # Not stale: wait until deadline, then give up gracefully
                     if time.time() >= deadline:
                         raise ValueError(f"File already being processed: {path}")
                     time.sleep(1.0)
-
+
             os.write(fd, b"lock")
             os.close(fd)
             fd = None
@@ -132,11 +137,11 @@ class VideoImportService():
                 lock_path.unlink()
             except OSError:
                 pass
-
+
     def processed(self) -> bool:
         """Indicates if the current file has already been processed."""
-        return getattr(self,
-
+        return getattr(self, "_processed", False)
+
     def import_and_anonymize(
         self,
         file_path: Union[Path, str],
@@ -149,11 +154,13 @@ class VideoImportService():
         High-level helper that orchestrates the complete video import and anonymization process.
         Uses the central video instance pattern for improved state management.
         """
+        # DEFENSIVE: Initialize processing_context immediately to prevent KeyError crashes
+        self.processing_context = {"file_path": Path(file_path)}
+
         try:
             # Initialize processing context
-            self._initialize_processing_context(file_path, center_name, processor_name,
-
-
+            self._initialize_processing_context(file_path, center_name, processor_name, save_video, delete_source)
+
             # Validate and prepare file (may raise ValueError if another worker holds a non-stale lock)
             try:
                 self._validate_and_prepare_file()
@@ -163,115 +170,119 @@ class VideoImportService():
                     self.logger.info(f"Skipping {file_path}: {ve}")
                     return None
                 raise
-
+
             # Create or retrieve video instance
             self._create_or_retrieve_video_instance()
-
+
             # Create sensitive meta file, ensure raw is moved out of processing folder watched by file watcher.
             self._create_sensitive_file()
-
+
             # Setup processing environment
             self._setup_processing_environment()
-
+
             # Process frames and metadata
             self._process_frames_and_metadata()
-
+
             # Finalize processing
             self._finalize_processing()
-
+
             # Move files and cleanup
             self._cleanup_and_archive()
-
+
             return self.current_video
-
+
         except Exception as e:
-
+            # Safe file path access - handles cases where processing_context wasn't initialized
+            safe_file_path = getattr(self, "processing_context", {}).get("file_path", file_path)
+            # Debug: Log context state for troubleshooting
+            context_keys = list(getattr(self, "processing_context", {}).keys())
+            self.logger.debug(f"Context keys during error: {context_keys}")
+            self.logger.error(f"Video import and anonymization failed for {safe_file_path}: {e}")
             self._cleanup_on_error()
             raise
         finally:
             self._cleanup_processing_context()

-    def _initialize_processing_context(self, file_path: Union[Path, str], center_name: str,
-                                       processor_name: str, save_video: bool, delete_source: bool):
+    def _initialize_processing_context(self, file_path: Union[Path, str], center_name: str, processor_name: str, save_video: bool, delete_source: bool):
         """Initialize the processing context for the current video import."""
         self.processing_context = {
-
-
-
-
-
-
-
-
-
+            "file_path": Path(file_path),
+            "center_name": center_name,
+            "processor_name": processor_name,
+            "save_video": save_video,
+            "delete_source": delete_source,
+            "processing_started": False,
+            "frames_extracted": False,
+            "anonymization_completed": False,
+            "error_reason": None,
         }
-
+
         self.logger.info(f"Initialized processing context for: {file_path}")

     def _validate_and_prepare_file(self):
         """
         Validate the video file and prepare for processing.
-
+
         Uses file locking to prevent concurrent processing of the same video file.
         This prevents race conditions where multiple workers might try to process
         the same video simultaneously.
-
+
         The lock is acquired here and held for the entire import process.
         See _file_lock() for lock reclamation logic.
         """
-        file_path = self.processing_context[
-
+        file_path = self.processing_context["file_path"]
+
         # Acquire file lock to prevent concurrent processing
         # Lock will be held until finally block in import_and_anonymize()
         try:
-            self.processing_context[
-            self.processing_context[
+            self.processing_context["_lock_context"] = self._file_lock(file_path)
+            self.processing_context["_lock_context"].__enter__()
         except Exception:
             self._cleanup_processing_context()
             raise
-
+
         self.logger.info("Acquired file lock for: %s", file_path)
-
+
         # Check if already processed (memory-based check)
         if str(file_path) in self.processed_files:
             self.logger.info("File %s already processed, skipping", file_path)
             self._processed = True
             raise ValueError(f"File already processed: {file_path}")
-
+
         # Check file exists
         if not file_path.exists():
             raise FileNotFoundError(f"Video file not found: {file_path}")
-
+
         self.logger.info("File validation completed for: %s", file_path)

     def _create_or_retrieve_video_instance(self):
         """Create or retrieve the VideoFile instance and move to final storage."""
-
+
         self.logger.info("Creating VideoFile instance...")
-
+
         self.current_video = VideoFile.create_from_file_initialized(
-            file_path=self.processing_context[
-            center_name=self.processing_context[
-            processor_name=self.processing_context[
-            delete_source=self.processing_context[
-            save_video_file=self.processing_context[
+            file_path=self.processing_context["file_path"],
+            center_name=self.processing_context["center_name"],
+            processor_name=self.processing_context["processor_name"],
+            delete_source=self.processing_context["delete_source"],
+            save_video_file=self.processing_context["save_video"],
         )
-
+
         if not self.current_video:
             raise RuntimeError("Failed to create VideoFile instance")
-
+
         # Immediately move to final storage locations
         self._move_to_final_storage()
-
+
         self.logger.info("Created VideoFile with UUID: %s", self.current_video.uuid)
-
+
         # Get and mark processing state
         state = VideoFile.get_or_create_state(self.current_video)
         if not state:
             raise RuntimeError("Failed to create VideoFile state")
-
+
         state.mark_processing_started(save=True)
-        self.processing_context[
+        self.processing_context["processing_started"] = True

     def _move_to_final_storage(self):
         """
@@ -348,7 +359,6 @@ class VideoImportService():
         self.processing_context["raw_video_path"] = stored_raw_path
         self.processing_context["video_filename"] = stored_raw_path.name

-
     def _setup_processing_environment(self):
         """Setup the processing environment without file movement."""
         video = self._require_current_video()
@@ -358,38 +368,38 @@ class VideoImportService():

         # Initialize frame objects in database
         video.initialize_frames()
-
+
         # Extract frames BEFORE processing to prevent pipeline 1 conflicts
         self.logger.info("Pre-extracting frames to avoid pipeline conflicts...")
         try:
             frames_extracted = video.extract_frames(overwrite=False)
             if frames_extracted:
-                self.processing_context[
+                self.processing_context["frames_extracted"] = True
                 self.logger.info("Frame extraction completed successfully")
-
+
                 # CRITICAL: Immediately save the frames_extracted state to database
                 # to prevent refresh_from_db() in pipeline 1 from overriding it
                 state = video.get_or_create_state()
                 if not state.frames_extracted:
                     state.frames_extracted = True
-                    state.save(update_fields=[
+                    state.save(update_fields=["frames_extracted"])
                     self.logger.info("Persisted frames_extracted=True to database")
             else:
                 self.logger.warning("Frame extraction failed, but continuing...")
-                self.processing_context[
+                self.processing_context["frames_extracted"] = False
         except Exception as e:
             self.logger.warning(f"Frame extraction failed during setup: {e}, but continuing...")
-            self.processing_context[
-
+            self.processing_context["frames_extracted"] = False
+
         # Ensure default patient data
         self._ensure_default_patient_data(video_instance=video)
-
+
         self.logger.info("Processing environment setup completed")

     def _process_frames_and_metadata(self):
         """Process frames and extract metadata with anonymization."""
         # Check frame cleaning availability
-        frame_cleaning_available, frame_cleaner
+        frame_cleaning_available, frame_cleaner = self._ensure_frame_cleaning_available()
         video = self._require_current_video()

         raw_file_field = video.raw_file
@@ -402,25 +412,25 @@ class VideoImportService():

         try:
             self.logger.info("Starting frame-level anonymization with processor ROI masking...")
-
+
             # Get processor ROI information
             endoscope_data_roi_nested, endoscope_image_roi = self._get_processor_roi_info()
-
+
             # Perform frame cleaning with timeout to prevent blocking
             from concurrent.futures import ThreadPoolExecutor, TimeoutError as FutureTimeoutError
-
+
             with ThreadPoolExecutor(max_workers=1) as executor:
                 future = executor.submit(self._perform_frame_cleaning, endoscope_data_roi_nested, endoscope_image_roi)
                 try:
                     # Increased timeout to better accommodate ffmpeg + OCR
-                    future.result(timeout=
-                    self.processing_context[
+                    future.result(timeout=50000)
+                    self.processing_context["anonymization_completed"] = True
                     self.logger.info("Frame cleaning completed successfully within timeout")
                 except FutureTimeoutError:
                     self.logger.warning("Frame cleaning timed out; entering grace period check for cleaned output")
                     # Grace period: detect if cleaned file appears shortly after timeout
-                    raw_video_path = self.processing_context.get(
-                    video_filename = self.processing_context.get(
+                    raw_video_path = self.processing_context.get("raw_video_path")
+                    video_filename = self.processing_context.get("video_filename", Path(raw_video_path).name if raw_video_path else "video.mp4")
                     grace_seconds = 60
                     expected_cleaned_path: Optional[Path] = None
                     processed_field = video.processed_file
@@ -433,8 +443,8 @@ class VideoImportService():
                     if expected_cleaned_path is not None:
                         for _ in range(grace_seconds):
                             if expected_cleaned_path.exists():
-                                self.processing_context[
-                                self.processing_context[
+                                self.processing_context["cleaned_video_path"] = expected_cleaned_path
+                                self.processing_context["anonymization_completed"] = True
                                 self.logger.info("Detected cleaned video during grace period: %s", expected_cleaned_path)
                                 found = True
                                 break
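The two hunks above run _perform_frame_cleaning in a single-worker executor with a hard timeout and then poll briefly for the cleaned file. A condensed sketch of that timeout-plus-grace-period pattern, with illustrative names and values:

# Sketch of the timeout-plus-grace-period pattern; the worker callable,
# timeout, and expected output path are illustrative, not the service's values.
# Note: leaving the with-block still joins the worker thread (the service code
# shares this behaviour), so a truly hung worker delays the return.
import time
from concurrent.futures import ThreadPoolExecutor, TimeoutError as FutureTimeoutError
from pathlib import Path

def run_with_timeout(work, expected_output: Path, timeout_s: float, grace_s: int = 60) -> bool:
    """Return True if `work` finishes in time, or if its output file appears
    during a short grace period after the timeout."""
    with ThreadPoolExecutor(max_workers=1) as executor:
        future = executor.submit(work)
        try:
            future.result(timeout=timeout_s)
            return True
        except FutureTimeoutError:
            # The worker thread may still be writing; poll briefly for its output.
            for _ in range(grace_s):
                if expected_output.exists():
                    return True
                time.sleep(1.0)
            return False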
@@ -452,11 +462,10 @@ class VideoImportService():
             except Exception as fallback_error:
                 self.logger.error("Fallback anonymization also failed: %s", fallback_error)
                 # If even fallback fails, mark as not anonymized but continue import
-                self.processing_context[
-                self.processing_context[
+                self.processing_context["anonymization_completed"] = False
+                self.processing_context["error_reason"] = f"Frame cleaning failed: {e}, Fallback failed: {fallback_error}"

     def _save_anonymized_video(self):
-
         original_raw_file_path_to_delete = None
         original_raw_frame_dir_to_delete = None
         video = self._require_current_video()
@@ -467,9 +476,7 @@ class VideoImportService():

         new_processed_hash = get_video_hash(anonymized_video_path)
         if video.__class__.objects.filter(processed_video_hash=new_processed_hash).exclude(pk=video.pk).exists():
-            raise ValueError(
-                f"Processed video hash {new_processed_hash} already exists for another video (Video: {video.uuid})."
-            )
+            raise ValueError(f"Processed video hash {new_processed_hash} already exists for another video (Video: {video.uuid}).")

         video.processed_video_hash = new_processed_hash
         video.processed_file.name = anonymized_video_path.relative_to(STORAGE_DIR).as_posix()
@@ -488,11 +495,11 @@ class VideoImportService():

             update_fields.extend(["raw_file", "video_hash"])

-            transaction.on_commit(
-
-
-
-            )
+            transaction.on_commit(
+                lambda: _cleanup_raw_assets(
+                    video_uuid=video.uuid, raw_file_path=original_raw_file_path_to_delete, raw_frame_dir=original_raw_frame_dir_to_delete
+                )
+            )

         video.save(update_fields=update_fields)
         video.state.mark_anonymized(save=True)
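The rewritten transaction.on_commit call above defers deletion of the raw assets until the enclosing database transaction commits, so a rollback cannot leave the row pointing at files that were already deleted. A small illustration of the idiom; the cleanup helper here is a stand-in, not the package's _cleanup_raw_assets:

# Illustrative only: defer filesystem cleanup until the DB transaction commits.
from pathlib import Path
from django.db import transaction

def delete_path(path: Path) -> None:
    path.unlink(missing_ok=True)  # stand-in for the service's raw-asset cleanup

def finalize(video, old_raw_path: Path) -> None:
    with transaction.atomic():
        video.save(update_fields=["raw_file", "video_hash"])
        # Runs only if the enclosing transaction commits; skipped on rollback.
        transaction.on_commit(lambda: delete_path(old_raw_path))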
@@ -510,20 +517,20 @@ class VideoImportService():
             if video is None:
                 self.logger.warning("No VideoFile instance available for fallback anonymization")

-
             # Strategy 2: Simple copy (no processing, just copy raw to processed)
             self.logger.info("Using simple copy fallback (raw video will be used as 'processed' video)")
-            self.processing_context[
-            self.processing_context[
+            self.processing_context["anonymization_completed"] = False
+            self.processing_context["use_raw_as_processed"] = True
             self.logger.warning("Fallback: Video will be imported without anonymization (raw copy used)")
         except Exception as e:
             self.logger.error(f"Error during fallback anonymization: {e}", exc_info=True)
-            self.processing_context[
-            self.processing_context[
+            self.processing_context["anonymization_completed"] = False
+            self.processing_context["error_reason"] = str(e)
+
     def _finalize_processing(self):
         """Finalize processing and update video state."""
         self.logger.info("Updating video processing state...")
-
+
         with transaction.atomic():
             video = self._require_current_video()
             try:
@@ -532,36 +539,33 @@ class VideoImportService():
                 self.logger.warning("Could not refresh VideoFile %s from DB: %s", video.uuid, refresh_error)

             state = video.get_or_create_state()
-
+
             # Only mark frames as extracted if they were successfully extracted
-            if self.processing_context.get(
+            if self.processing_context.get("frames_extracted", False):
                 state.frames_extracted = True
                 self.logger.info("Marked frames as extracted in state")
             else:
                 self.logger.warning("Frames were not extracted, not updating state")
-
+
             # Always mark these as true (metadata extraction attempts were made)
             state.frames_initialized = True
             state.video_meta_extracted = True
             state.text_meta_extracted = True
-
+
             # ✅ FIX: Only mark as processed if anonymization actually completed
-            anonymization_completed = self.processing_context.get(
+            anonymization_completed = self.processing_context.get("anonymization_completed", False)
             if anonymization_completed:
                 state.mark_sensitive_meta_processed(save=False)
                 self.logger.info("Anonymization completed - marking sensitive meta as processed")
             else:
-                self.logger.warning(
-                    "Anonymization NOT completed - NOT marking as processed. "
-                    f"Reason: {self.processing_context.get('error_reason', 'Unknown')}"
-                )
+                self.logger.warning(f"Anonymization NOT completed - NOT marking as processed. Reason: {self.processing_context.get('error_reason', 'Unknown')}")
                 # Explicitly mark as NOT processed
                 state.sensitive_meta_processed = False
-
+
             # Save all state changes
             state.save()
             self.logger.info("Video processing state updated")
-
+
             # Signal completion
             self._signal_completion()

@@ -575,12 +579,12 @@ class VideoImportService():
         video = self._require_current_video()

         processed_video_path = None
-        if
-            processed_video_path = self.processing_context[
+        if "cleaned_video_path" in self.processing_context:
+            processed_video_path = self.processing_context["cleaned_video_path"]
         else:
-            raw_video_path = self.processing_context.get(
+            raw_video_path = self.processing_context.get("raw_video_path")
             if raw_video_path and Path(raw_video_path).exists():
-                video_filename = self.processing_context.get(
+                video_filename = self.processing_context.get("video_filename", Path(raw_video_path).name)
                 processed_filename = f"processed_{video_filename}"
                 processed_video_path = Path(raw_video_path).parent / processed_filename
                 try:
@@ -609,13 +613,13 @@ class VideoImportService():
                 except Exception as exc:
                     self.logger.error("Failed to update processed_file path: %s", exc)
                     video.processed_file.name = f"anonym_videos/{anonym_video_filename}"
-                    video.save(update_fields=[
+                    video.save(update_fields=["processed_file"])
                     self.logger.info(
                         "Updated processed_file path using fallback: %s",
                         f"anonym_videos/{anonym_video_filename}",
                     )

-                self.processing_context[
+                self.processing_context["anonymization_completed"] = True
             else:
                 self.logger.warning("Processed video file not found after move: %s", anonym_target_path)
         except Exception as exc:
@@ -625,13 +629,14 @@ class VideoImportService():

         try:
             from endoreg_db.utils.paths import RAW_FRAME_DIR
+
             shutil.rmtree(RAW_FRAME_DIR, ignore_errors=True)
             self.logger.debug("Cleaned up temporary frames directory: %s", RAW_FRAME_DIR)
         except Exception as exc:
             self.logger.warning("Failed to remove directory %s: %s", RAW_FRAME_DIR, exc)

-        source_path = self.processing_context[
-        if self.processing_context[
+        source_path = self.processing_context["file_path"]
+        if self.processing_context["delete_source"] and Path(source_path).exists():
             try:
                 os.remove(source_path)
                 self.logger.info("Removed remaining source file: %s", source_path)
@@ -642,25 +647,25 @@ class VideoImportService():
             self.logger.warning("No processed_file found after cleanup - video will be unprocessed")
             try:
                 video.anonymize(delete_original_raw=self.delete_source)
-                video.save(update_fields=[
+                video.save(update_fields=["processed_file"])
                 self.logger.info("Late-stage anonymization succeeded")
             except Exception as e:
                 self.logger.error("Late-stage anonymization failed: %s", e)
-                self.processing_context[
+                self.processing_context["anonymization_completed"] = False

         self.logger.info("Cleanup and archiving completed")

-        self.processed_files.add(str(self.processing_context[
+        self.processed_files.add(str(self.processing_context["file_path"]))

         with transaction.atomic():
             video.refresh_from_db()
-            if hasattr(video,
+            if hasattr(video, "state") and self.processing_context.get("anonymization_completed"):
                 video.state.mark_sensitive_meta_processed(save=True)

         self.logger.info("Import and anonymization completed for VideoFile UUID: %s", video.uuid)
         self.logger.info("Raw video stored in: /data/videos")
         self.logger.info("Processed video stored in: /data/anonym_videos")
-
+
     def _create_sensitive_file(
         self,
         video_instance: VideoFile | None = None,
@@ -719,11 +724,10 @@ class VideoImportService():
                 "Updated video.raw_file using fallback method: videos/sensitive/%s",
                 target_file_path.name,
             )
-
+
         self.processing_context["raw_video_path"] = target_file_path
         self.processing_context["video_filename"] = target_file_path.name

-
         self.logger.info("Created sensitive file for %s at %s", video.uuid, target_file_path)
         return target_file_path

@@ -740,7 +744,7 @@ class VideoImportService():
         if processor:
             assert isinstance(processor, EndoscopyProcessor), "Processor is not of type EndoscopyProcessor"
             endoscope_image_roi = processor.get_roi_endoscope_image()
-            endoscope_data_roi_nested = processor.
+            endoscope_data_roi_nested = processor.get_sensitive_rois()
             self.logger.info("Retrieved processor ROI information: endoscope_image_roi=%s", endoscope_image_roi)
         else:
             self.logger.warning(
@@ -810,12 +814,10 @@ class VideoImportService():
         except Exception as exc:
             self.logger.error("Failed to update SensitiveMeta for video %s: %s", video.uuid, exc)

-
-
     def _ensure_frame_cleaning_available(self):
         """
         Ensure frame cleaning modules are available by adding lx-anonymizer to path.
-
+
         Returns:
             Tuple of (availability_flag, FrameCleaner_class, ReportReader_class)
         """
@@ -824,14 +826,12 @@ class VideoImportService():
             from lx_anonymizer import FrameCleaner  # type: ignore[import]

             if FrameCleaner:
-                return True, FrameCleaner
-
+                return True, FrameCleaner
+
         except Exception as e:
             self.logger.warning(f"Frame cleaning not available: {e} Please install or update lx_anonymizer.")
-
-            return False, None

-
+        return False, None

     def _perform_frame_cleaning(self, endoscope_data_roi_nested, endoscope_image_roi):
         """Perform frame cleaning and anonymization."""
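With the module-level "from lx_anonymizer import FrameCleaner" removed in the import hunk near the top of this diff, _ensure_frame_cleaning_available now probes for the optional dependency lazily and returns (False, None) when it is missing. A generic sketch of that guard (not the package's own function):

# Sketch of a lazy optional-dependency probe; mirrors the (flag, class) shape
# returned by _ensure_frame_cleaning_available but is illustrative only.
import logging
from typing import Optional, Tuple, Type

logger = logging.getLogger(__name__)

def ensure_frame_cleaning_available() -> Tuple[bool, Optional[Type]]:
    try:
        from lx_anonymizer import FrameCleaner  # type: ignore[import]
        if FrameCleaner:
            return True, FrameCleaner
    except Exception as e:
        logger.warning("Frame cleaning not available: %s. Please install or update lx_anonymizer.", e)
    return False, None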
@@ -842,8 +842,8 @@ class VideoImportService():
             raise RuntimeError("Frame cleaning not available")

         # Prepare parameters for frame cleaning
-        raw_video_path = self.processing_context.get(
-
+        raw_video_path = self.processing_context.get("raw_video_path")
+
         if not raw_video_path or not Path(raw_video_path).exists():
             try:
                 self.current_video = self._require_current_video()
@@ -851,35 +851,28 @@ class VideoImportService():
             except Exception:
                 raise RuntimeError(f"Raw video path not found: {raw_video_path}")

-
         # Create temporary output path for cleaned video
-        video_filename = self.processing_context.get(
+        video_filename = self.processing_context.get("video_filename", Path(raw_video_path).name)
         cleaned_filename = f"cleaned_{video_filename}"
-        if not raw_video_path:
-            raise RuntimeError("raw_video_path is None after fallback, cannot construct cleaned_video_path")
         cleaned_video_path = Path(raw_video_path).parent / cleaned_filename
-
-
-
-
+
         # Clean video with ROI masking (heavy I/O operation)
         actual_cleaned_path, extracted_metadata = frame_cleaner.clean_video(
             video_path=Path(raw_video_path),
             endoscope_image_roi=endoscope_image_roi,
             endoscope_data_roi_nested=endoscope_data_roi_nested,
             output_path=cleaned_video_path,
-            technique="mask_overlay"
+            technique="mask_overlay",
         )
-
-
+
         # Store cleaned video path for later use in _cleanup_and_archive
-        self.processing_context[
-        self.processing_context[
-
+        self.processing_context["cleaned_video_path"] = actual_cleaned_path
+        self.processing_context["extracted_metadata"] = extracted_metadata
+
         # Update sensitive metadata with extracted information
         self._update_sensitive_metadata(extracted_metadata)
         self.logger.info(f"Extracted metadata from frame cleaning: {extracted_metadata}")
-
+
         self.logger.info(f"Frame cleaning with ROI masking completed: {actual_cleaned_path}")
         self.logger.info("Cleaned video will be moved to anonym_videos during cleanup")

@@ -897,13 +890,13 @@ class VideoImportService():

         sm = sensitive_meta
         updated_fields = []
-
+
         try:
             sm.update_from_dict(extracted_metadata)
             updated_fields = list(extracted_metadata.keys())
         except KeyError as e:
             self.logger.warning(f"Failed to update SensitiveMeta field {e}")
-
+
         if updated_fields:
             sm.save(update_fields=updated_fields)
             self.logger.info("Updated SensitiveMeta fields for video %s: %s", video.uuid, updated_fields)
@@ -927,22 +920,18 @@ class VideoImportService():
             except (ValueError, OSError):
                 raw_exists = False

-            video_processing_complete =
-                video.sensitive_meta is not None and
-                video.video_meta is not None and
-                raw_exists
-            )
+            video_processing_complete = video.sensitive_meta is not None and video.video_meta is not None and raw_exists

             if video_processing_complete:
                 self.logger.info("Video %s processing completed successfully - ready for validation", video.uuid)

                 # Update completion flags if they exist
                 completion_fields = []
-                for field_name in [
+                for field_name in ["import_completed", "processing_complete", "ready_for_validation"]:
                     if hasattr(video, field_name):
                         setattr(video, field_name, True)
                         completion_fields.append(field_name)
-
+
                 if completion_fields:
                     video.save(update_fields=completion_fields)
                     self.logger.info("Updated completion flags: %s", completion_fields)
@@ -951,15 +940,15 @@ class VideoImportService():
                     "Video %s processing incomplete - missing required components",
                     video.uuid,
                 )
-
+
         except Exception as e:
             self.logger.warning(f"Failed to signal completion status: {e}")

     def _cleanup_on_error(self):
         """Cleanup processing context on error."""
-        if self.current_video and hasattr(self.current_video,
+        if self.current_video and hasattr(self.current_video, "state"):
             try:
-                if self.processing_context.get(
+                if self.processing_context.get("processing_started"):
                     self.current_video.state.frames_extracted = False
                     self.current_video.state.frames_initialized = False
                     self.current_video.state.video_meta_extracted = False
@@ -971,29 +960,32 @@ class VideoImportService():
     def _cleanup_processing_context(self):
         """
         Cleanup processing context and release file lock.
-
+
         This method is always called in the finally block of import_and_anonymize()
         to ensure the file lock is released even if processing fails.
         """
+        # DEFENSIVE: Ensure processing_context exists before accessing it
+        if not hasattr(self, "processing_context"):
+            self.processing_context = {}
+
         try:
             # Release file lock if it was acquired
-            lock_context = self.processing_context.get(
+            lock_context = self.processing_context.get("_lock_context")
             if lock_context is not None:
                 try:
                     lock_context.__exit__(None, None, None)
                     self.logger.info("Released file lock")
                 except Exception as e:
                     self.logger.warning(f"Error releasing file lock: {e}")
-
+
             # Remove file from processed set if processing failed
-            file_path = self.processing_context.get(
-            if file_path and not self.processing_context.get(
+            file_path = self.processing_context.get("file_path")
+            if file_path and not self.processing_context.get("anonymization_completed"):
                 file_path_str = str(file_path)
                 if file_path_str in self.processed_files:
                     self.processed_files.remove(file_path_str)
                     self.logger.info(f"Removed {file_path_str} from processed files (failed processing)")
-
-
+
         except Exception as e:
             self.logger.warning(f"Error during context cleanup: {e}")
         finally:
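_validate_and_prepare_file enters the _file_lock context manager by hand and stores it in processing_context["_lock_context"]; the cleanup hunk above then releases it on the finally path. A condensed, illustrative sketch of that hand-driven context-manager lifecycle, with a stand-in lock instead of the real _file_lock:

# Illustrative sketch of holding a context manager open across method calls.
from contextlib import contextmanager

@contextmanager
def fake_lock(path):
    print(f"acquire lock for {path}")  # stand-in for the real file lock
    try:
        yield
    finally:
        print(f"release lock for {path}")

context = {}

def acquire(path):
    lock_ctx = fake_lock(path)
    lock_ctx.__enter__()                 # enter now, release later in cleanup()
    context["_lock_context"] = lock_ctx

def cleanup():
    lock_ctx = context.pop("_lock_context", None)
    if lock_ctx is not None:
        try:
            lock_ctx.__exit__(None, None, None)
        except Exception:
            pass                         # never let lock release mask the real error

acquire("video.mp4")
try:
    pass  # processing would happen here
finally:
    cleanup()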
@@ -1001,6 +993,7 @@ class VideoImportService():
             self.current_video = None
             self.processing_context = {}

+
 # Convenience function for callers/tests that expect a module-level import_and_anonymize
 def import_and_anonymize(
     file_path,
@@ -1019,4 +1012,4 @@ def import_and_anonymize(
         processor_name=processor_name,
         save_video=save_video,
         delete_source=delete_source,
-    )
+    )