OTVision 0.5.3 (py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (50)
  1. OTVision/__init__.py +30 -0
  2. OTVision/application/__init__.py +0 -0
  3. OTVision/application/configure_logger.py +23 -0
  4. OTVision/application/detect/__init__.py +0 -0
  5. OTVision/application/detect/get_detect_cli_args.py +9 -0
  6. OTVision/application/detect/update_detect_config_with_cli_args.py +95 -0
  7. OTVision/application/get_config.py +25 -0
  8. OTVision/config.py +754 -0
  9. OTVision/convert/__init__.py +0 -0
  10. OTVision/convert/convert.py +318 -0
  11. OTVision/dataformat.py +70 -0
  12. OTVision/detect/__init__.py +0 -0
  13. OTVision/detect/builder.py +48 -0
  14. OTVision/detect/cli.py +166 -0
  15. OTVision/detect/detect.py +296 -0
  16. OTVision/detect/otdet.py +103 -0
  17. OTVision/detect/plugin_av/__init__.py +0 -0
  18. OTVision/detect/plugin_av/rotate_frame.py +37 -0
  19. OTVision/detect/yolo.py +277 -0
  20. OTVision/domain/__init__.py +0 -0
  21. OTVision/domain/cli.py +42 -0
  22. OTVision/helpers/__init__.py +0 -0
  23. OTVision/helpers/date.py +26 -0
  24. OTVision/helpers/files.py +538 -0
  25. OTVision/helpers/formats.py +139 -0
  26. OTVision/helpers/log.py +131 -0
  27. OTVision/helpers/machine.py +71 -0
  28. OTVision/helpers/video.py +54 -0
  29. OTVision/track/__init__.py +0 -0
  30. OTVision/track/iou.py +282 -0
  31. OTVision/track/iou_util.py +140 -0
  32. OTVision/track/preprocess.py +451 -0
  33. OTVision/track/track.py +422 -0
  34. OTVision/transform/__init__.py +0 -0
  35. OTVision/transform/get_homography.py +156 -0
  36. OTVision/transform/reference_points_picker.py +462 -0
  37. OTVision/transform/transform.py +352 -0
  38. OTVision/version.py +13 -0
  39. OTVision/view/__init__.py +0 -0
  40. OTVision/view/helpers/OTC.ico +0 -0
  41. OTVision/view/view.py +90 -0
  42. OTVision/view/view_convert.py +128 -0
  43. OTVision/view/view_detect.py +146 -0
  44. OTVision/view/view_helpers.py +417 -0
  45. OTVision/view/view_track.py +131 -0
  46. OTVision/view/view_transform.py +140 -0
  47. otvision-0.5.3.dist-info/METADATA +47 -0
  48. otvision-0.5.3.dist-info/RECORD +50 -0
  49. otvision-0.5.3.dist-info/WHEEL +4 -0
  50. otvision-0.5.3.dist-info/licenses/LICENSE +674 -0
OTVision/detect/detect.py
@@ -0,0 +1,296 @@
+ """
+ OTVision main module to detect objects in single or multiple images or videos.
+ """
+
+ # Copyright (C) 2022 OpenTrafficCam Contributors
+ # <https://github.com/OpenTrafficCam
+ # <team@opentrafficcam.org>
+ #
+ # This program is free software: you can redistribute it and/or modify
+ # it under the terms of the GNU General Public License as published by
+ # the Free Software Foundation, either version 3 of the License, or
+ # (at your option) any later version.
+ #
+ # This program is distributed in the hope that it will be useful,
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+ # GNU General Public License for more details.
+ #
+ # You should have received a copy of the GNU General Public License
+ # along with this program. If not, see <https://www.gnu.org/licenses/>.
+
+ import logging
+ import re
+ from datetime import datetime, timedelta, timezone
+ from pathlib import Path
+
+ from tqdm import tqdm
+
+ from OTVision.config import Config
+ from OTVision.dataformat import DATA, LENGTH, METADATA, RECORDED_START_DATE, VIDEO
+ from OTVision.detect.otdet import OtdetBuilder, OtdetBuilderConfig
+ from OTVision.detect.yolo import create_model
+ from OTVision.helpers.date import parse_date_string_to_utc_datime
+ from OTVision.helpers.files import (
+     FILE_NAME_PATTERN,
+     START_DATE,
+     InproperFormattedFilename,
+     get_files,
+     write_json,
+ )
+ from OTVision.helpers.log import LOGGER_NAME
+ from OTVision.helpers.video import get_duration, get_fps, get_video_dimensions
+ from OTVision.track.preprocess import OCCURRENCE
+
+ log = logging.getLogger(LOGGER_NAME)
+
+
+ class OTVisionDetect:
+     @property
+     def config(self) -> Config:
+         if self._config is None:
+             raise ValueError("Config is missing!")
+         return self._config
+
+     def __init__(self, otdet_builder: OtdetBuilder) -> None:
+         self._config: Config | None = None
+         self._otdet_builder = otdet_builder
+
+     def update_config(self, config: Config) -> None:
+         self._config = config
+
+     def start(self) -> None:
+         """Starts the detection of objects in multiple videos and/or images.
+
+         Writes detections to one file per video/object.
+
+         """
+         filetypes = self.config.filetypes.video_filetypes.to_list()
+         video_files = get_files(paths=self.config.detect.paths, filetypes=filetypes)
+
+         start_msg = f"Start detection of {len(video_files)} video files"
+         log.info(start_msg)
+         print(start_msg)
+
+         if not video_files:
+             log.warning(f"No videos of type '{filetypes}' found to detect!")
+             return
+
+         model = create_model(
+             weights=self.config.detect.yolo_config.weights,
+             confidence=self.config.detect.yolo_config.conf,
+             iou=self.config.detect.yolo_config.iou,
+             img_size=self.config.detect.yolo_config.img_size,
+             half_precision=self.config.detect.half_precision,
+             normalized=self.config.detect.yolo_config.normalized,
+         )
+         for video_file in tqdm(video_files, desc="Detected video files", unit=" files"):
+             detections_file = derive_filename(
+                 video_file=video_file,
+                 detect_start=self.config.detect.detect_start,
+                 detect_end=self.config.detect.detect_end,
+                 detect_suffix=self.config.filetypes.detect,
+             )
+
+             if not self.config.detect.overwrite and detections_file.is_file():
+                 log.warning(
+                     f"{detections_file} already exists. To overwrite, set overwrite "
+                     "to True"
+                 )
+                 continue
+
+             log.info(f"Detect {video_file}")
+
+             video_fps = get_fps(video_file)
+             detect_start_in_frames = convert_seconds_to_frames(
+                 self.config.detect.detect_start, video_fps
+             )
+             detect_end_in_frames = convert_seconds_to_frames(
+                 self.config.detect.detect_end, video_fps
+             )
+             detections = model.detect(
+                 file=video_file,
+                 detect_start=detect_start_in_frames,
+                 detect_end=detect_end_in_frames,
+             )
+
+             video_width, video_height = get_video_dimensions(video_file)
+             actual_duration = get_duration(video_file)
+             actual_frames = len(detections)
+             if (expected_duration := self.config.detect.expected_duration) is not None:
+                 actual_fps = actual_frames / expected_duration.total_seconds()
+             else:
+                 actual_fps = actual_frames / actual_duration.total_seconds()
+             otdet = self._otdet_builder.add_config(
+                 OtdetBuilderConfig(
+                     conf=model.confidence,
+                     iou=model.iou,
+                     video=video_file,
+                     video_width=video_width,
+                     video_height=video_height,
+                     expected_duration=expected_duration,
+                     recorded_fps=video_fps,
+                     actual_fps=actual_fps,
+                     actual_frames=actual_frames,
+                     detection_img_size=model.img_size,
+                     normalized=model.normalized,
+                     detection_model=model.weights,
+                     half_precision=model.half_precision,
+                     chunksize=1,
+                     classifications=model.classifications,
+                 )
+             ).build(detections)
+
+             stamped_detections = add_timestamps(otdet, video_file, expected_duration)
+             write_json(
+                 stamped_detections,
+                 file=detections_file,
+                 filetype=self.config.filetypes.detect,
+                 overwrite=self.config.detect.overwrite,
+             )
+
+             log.info(f"Successfully detected and wrote {detections_file}")
+
+         finished_msg = "Finished detection"
+         log.info(finished_msg)
+         print(finished_msg)
+
+
+ def derive_filename(
+     video_file: Path,
+     detect_suffix: str,
+     detect_start: int | None = None,
+     detect_end: int | None = None,
+ ) -> Path:
+     """
+     Generates a filename for detection files by appending specified start and end
+     markers and a suffix to the stem of the input video file.
+
+     Args:
+         video_file (Path): The input video file whose filename is to be modified.
+         detect_start (int | None): The starting marker to append to the filename.
+             If None, no starting marker will be appended.
+         detect_end (int | None): The ending marker to append to the filename. If None,
+             no ending marker will be appended.
+         detect_suffix (str): The file suffix to apply to the derived filename.
+
+     Returns:
+         Path: The modified video file path with the updated stem and suffix applied.
+     """
+     cutout = ""
+     if detect_start is not None:
+         cutout += f"_start_{detect_start}"
+     if detect_end is not None:
+         cutout += f"_end_{detect_end}"
+     new_stem = f"{video_file.stem}{cutout}"
+     return video_file.with_stem(new_stem).with_suffix(detect_suffix)
+
+
+ def convert_seconds_to_frames(seconds: int | None, fps: float) -> int | None:
+     if seconds is None:
+         return None
+     return round(seconds * fps)
+
+
+ class FormatNotSupportedError(Exception):
+     pass
+
+
+ def add_timestamps(
+     detections: dict, video_file: Path, expected_duration: timedelta | None
+ ) -> dict:
+     return Timestamper().stamp(detections, video_file, expected_duration)
+
+
+ class Timestamper:
+     def stamp(
+         self, detections: dict, video_file: Path, expected_duration: timedelta | None
+     ) -> dict:
+         """This method adds timestamps when the frame occurred in real time to each
+         frame.
+
+         Args:
+             detections (dict): dictionary containing all frames
+             video_file (Path): path to video file
+             expected_duration (timedelta | None): expected duration of the video used to
+                 calculate the number of actual frames per second
+
+         Returns:
+             dict: input dictionary with additional occurrence per frame
+         """
+         start_time = self._get_start_time_from(video_file)
+         actual_duration = get_duration(video_file)
+         if expected_duration:
+             time_per_frame = self._get_time_per_frame(detections, expected_duration)
+         else:
+             time_per_frame = self._get_time_per_frame(detections, actual_duration)
+         self._update_metadata(detections, start_time, actual_duration)
+         return self._stamp(detections, start_time, time_per_frame)
+
+     @staticmethod
+     def _get_start_time_from(video_file: Path) -> datetime:
+         """Parse the given filename and retrieve the start date of the video.
+
+         Args:
+             video_file (Path): path to video file
+
+         Raises:
+             InproperFormattedFilename: if the filename is not formatted as expected, an
+                 exception will be raised
+
+         Returns:
+             datetime: start date of the video
+         """
+         match = re.search(
+             FILE_NAME_PATTERN,
+             video_file.name,
+         )
+         if match:
+             start_date: str = match.group(START_DATE)
+             return parse_date_string_to_utc_datime(
+                 start_date, "%Y-%m-%d_%H-%M-%S"
+             ).replace(tzinfo=timezone.utc)
+
+         raise InproperFormattedFilename(f"Could not parse {video_file.name}.")
+
+     @staticmethod
+     def _get_time_per_frame(detections: dict, duration: timedelta) -> timedelta:
+         """Calculates the duration for each frame. This is done using the total
+         duration of the video and the number of frames.
+
+         Args:
+             detections (dict): dictionary containing all frames
+             video_file (Path): path to video file
+
+         Returns:
+             timedelta: duration per frame
+         """
+         number_of_frames = len(detections[DATA].keys())
+         return duration / number_of_frames
+
+     @staticmethod
+     def _update_metadata(
+         detections: dict, start_time: datetime, duration: timedelta
+     ) -> dict:
+         detections[METADATA][VIDEO][RECORDED_START_DATE] = start_time.timestamp()
+         detections[METADATA][VIDEO][LENGTH] = str(duration)
+         return detections
+
+     def _stamp(
+         self, detections: dict, start_date: datetime, time_per_frame: timedelta
+     ) -> dict:
+         """Add a timestamp (occurrence in real time) to each frame.
+
+         Args:
+             detections (dict): dictionary containing all frames
+             start_date (datetime): start date of the video recording
+             time_per_frame (timedelta): duration per frame
+
+         Returns:
+             dict: dictionary containing all frames with their occurrence in real time
+         """
+         data: dict = detections[DATA]
+         for key, value in data.items():
+             occurrence = start_date + (int(key) - 1) * time_per_frame
+             value[OCCURRENCE] = occurrence.timestamp()
+         return detections
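
The Timestamper above spreads the video duration evenly over the frames and stamps frame k with start_time + (k - 1) * time_per_frame, where time_per_frame is the (expected or actual) duration divided by the number of frames. A minimal standalone sketch of that arithmetic, using plain datetime/timedelta and made-up example values rather than the package's own objects:

    from datetime import datetime, timedelta, timezone

    # Hypothetical values for illustration only.
    start_time = datetime(2022, 5, 4, 12, 0, 0, tzinfo=timezone.utc)
    duration = timedelta(seconds=10)  # expected or actual video duration
    number_of_frames = 5              # len(detections[DATA]) in the module above

    time_per_frame = duration / number_of_frames  # Timestamper._get_time_per_frame
    for frame in range(1, number_of_frames + 1):
        # Timestamper._stamp: the first frame occurs at the start date itself.
        occurrence = start_time + (frame - 1) * time_per_frame
        print(frame, occurrence.timestamp())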
OTVision/detect/otdet.py
@@ -0,0 +1,103 @@
+ from dataclasses import dataclass
+ from datetime import timedelta
+ from pathlib import Path
+ from typing import Self
+
+ from OTVision import dataformat, version
+ from OTVision.track.preprocess import Detection
+
+
+ @dataclass
+ class OtdetBuilderConfig:
+     conf: float
+     iou: float
+     video: Path
+     video_width: int
+     video_height: int
+     expected_duration: timedelta | None
+     recorded_fps: float
+     actual_fps: float
+     actual_frames: int
+     detection_img_size: int
+     normalized: bool
+     detection_model: str | Path
+     half_precision: bool
+     chunksize: int
+     classifications: dict[int, str]
+
+
+ class OtdetBuilderError(Exception):
+     pass
+
+
+ class OtdetBuilder:
+     @property
+     def config(self) -> OtdetBuilderConfig:
+         if self._config is None:
+             raise OtdetBuilderError("Otdet builder config is not set")
+         return self._config
+
+     def __init__(self) -> None:
+         self._config: OtdetBuilderConfig | None = None
+
+     def add_config(self, config: OtdetBuilderConfig) -> Self:
+         self._config = config
+         return self
+
+     def reset(self) -> Self:
+         self._config = None
+         return self
+
+     def build(self, detections: list[list[Detection]]) -> dict:
+         result = {
+             dataformat.METADATA: self._build_metadata(),
+             dataformat.DATA: self._build_data(detections),
+         }
+         self.reset()
+         return result
+
+     def _build_metadata(self) -> dict:
+         return {
+             dataformat.OTDET_VERSION: version.otdet_version(),
+             dataformat.VIDEO: self._build_video_config(),
+             dataformat.DETECTION: self._build_detection_config(),
+         }
+
+     def _build_data(self, frames: list[list[Detection]]) -> dict:
+         data = {}
+         for frame, detections in enumerate(frames, start=1):
+             converted_detections = [detection.to_otdet() for detection in detections]
+             data[str(frame)] = {dataformat.DETECTIONS: converted_detections}
+         return data
+
+     def _build_video_config(self) -> dict:
+         video_config = {
+             dataformat.FILENAME: str(self.config.video.stem),
+             dataformat.FILETYPE: str(self.config.video.suffix),
+             dataformat.WIDTH: self.config.video_width,
+             dataformat.HEIGHT: self.config.video_height,
+             dataformat.RECORDED_FPS: self.config.recorded_fps,
+             dataformat.ACTUAL_FPS: self.config.actual_fps,
+             dataformat.NUMBER_OF_FRAMES: self.config.actual_frames,
+         }
+         if self.config.expected_duration is not None:
+             video_config[dataformat.EXPECTED_DURATION] = int(
+                 self.config.expected_duration.total_seconds()
+             )
+         return video_config
+
+     def _build_detection_config(self) -> dict:
+         return {
+             dataformat.OTVISION_VERSION: version.otvision_version(),
+             dataformat.MODEL: {
+                 dataformat.NAME: "YOLOv8",
+                 dataformat.WEIGHTS: str(self.config.detection_model),
+                 dataformat.IOU_THRESHOLD: self.config.iou,
+                 dataformat.IMAGE_SIZE: self.config.detection_img_size,
+                 dataformat.MAX_CONFIDENCE: self.config.conf,
+                 dataformat.HALF_PRECISION: self.config.half_precision,
+                 dataformat.CLASSES: self.config.classifications,
+             },
+             dataformat.CHUNKSIZE: self.config.chunksize,
+             dataformat.NORMALIZED_BBOX: self.config.normalized,
+         }
OTVision/detect/plugin_av/__init__.py
File without changes
OTVision/detect/plugin_av/rotate_frame.py
@@ -0,0 +1,37 @@
+ from av import VideoFrame
+ from numpy import ndarray, rot90
+
+ DISPLAYMATRIX = "DISPLAYMATRIX"
+
+
+ class AvVideoFrameRotator:
+     def __init__(self, img_format: str = "rgb24"):
+         self._img_format = img_format
+
+     def rotate(self, frame: VideoFrame, side_data: dict) -> ndarray:
+         array = frame.to_ndarray(format=self._img_format)
+         rotated_image = rotate(array, side_data)
+         return rotated_image
+
+
+ def rotate(array: ndarray, side_data: dict) -> ndarray:
+     """
+     Rotate a numpy array using the DISPLAYMATRIX rotation angle defined in side_data.
+
+     Args:
+         array: to rotate
+         side_data: metadata dictionary to read the angle from
+
+     Returns: rotated array
+
+     """
+     if DISPLAYMATRIX in side_data:
+         angle = side_data[DISPLAYMATRIX]
+         if angle % 90 != 0:
+             raise ValueError(
+                 f"Rotation angle must be multiple of 90 degrees, but is {angle}"
+             )
+         rotation = angle / 90
+         rotated_image = rot90(array, rotation)
+         return rotated_image
+     return array
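
rotate() is a no-op unless the frame's side data contains a DISPLAYMATRIX entry; the angle must be a multiple of 90 degrees and is converted into the number of quarter turns passed to numpy's rot90. A short sketch of that behaviour using numpy directly, with a hand-made side_data dict standing in for the metadata PyAV attaches to a frame:

    import numpy as np

    DISPLAYMATRIX = "DISPLAYMATRIX"

    frame = np.zeros((1080, 1920, 3), dtype=np.uint8)  # height x width x channels
    side_data = {DISPLAYMATRIX: 90}  # stand-in for PyAV frame side data

    if DISPLAYMATRIX in side_data:
        angle = side_data[DISPLAYMATRIX]
        assert angle % 90 == 0, "only right-angle rotations are supported"
        frame = np.rot90(frame, angle // 90)

    print(frame.shape)  # (1920, 1080, 3): a quarter turn swaps width and height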