OTVision 0.6.0__py3-none-any.whl → 0.6.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1,140 +0,0 @@
1
- """
2
- Utils for using iou tracker
3
- """
4
-
5
- # ---------------------------------------------------------
6
- # IOU Tracker
7
- # Copyright (c) 2017 TU Berlin, Communication Systems Group
8
- # Licensed under The MIT License, see
9
- # https://github.com/bochinski/iou-tracker/blob/master/LICENSE
10
- # for details.
11
- # Written by Erik Bochinski
12
- # ---------------------------------------------------------
13
-
14
- from typing import Union
15
-
16
- import numpy as np
17
-
18
-
19
- # TODO: Remove if not needed
20
def nms(
    boxes: np.ndarray,
    scores: np.ndarray,
    overlapThresh: float,
    classes: Union[np.ndarray, None] = None,
) -> Union[tuple[np.ndarray, np.ndarray, np.ndarray], tuple[np.ndarray, np.ndarray]]:
    """Perform non-maximum suppression, based on Malisiewicz et al.

    Args:
        boxes (numpy.ndarray): boxes to process, one [x1, y1, x2, y2] row each.
        scores (numpy.ndarray): corresponding score for each box.
        overlapThresh (float): overlap threshold for boxes to merge.
        classes (numpy.ndarray, optional): class ids for each box.

    Returns:
        (tuple): tuple containing:

            boxes: suppressed boxes
            scores: suppressed scores
            classes: suppressed classes, only if specified
    """
    # Work in floats: the overlap computation below divides box areas.
    if boxes.dtype.kind == "i":
        boxes = boxes.astype("float")
    if scores.dtype.kind == "i":
        scores = scores.astype("float")

    kept: list = []

    # Box corner coordinates, one vector per corner component.
    left = boxes[:, 0]
    top = boxes[:, 1]
    right = boxes[:, 2]
    bottom = boxes[:, 3]

    # +1 convention: boxes are treated as inclusive pixel ranges.
    areas = (right - left + 1) * (bottom - top + 1)

    # Candidate indices sorted by ascending score; the best remaining
    # candidate therefore always sits at the end of this array.
    order = np.argsort(scores)

    while order.size > 0:
        # Keep the highest-scoring remaining box.
        tail = order.size - 1
        best = order[tail]
        kept.append(best)

        rest = order[:tail]

        # Intersection rectangle of the kept box with every other candidate.
        ix1 = np.maximum(left[best], left[rest])
        iy1 = np.maximum(top[best], top[rest])
        ix2 = np.minimum(right[best], right[rest])
        iy2 = np.minimum(bottom[best], bottom[rest])

        inter_w = np.maximum(0, ix2 - ix1 + 1)
        inter_h = np.maximum(0, iy2 - iy1 + 1)

        # NOTE: ratio of intersection to the *other* box's area
        # (not symmetric IoU) — this matches the original implementation.
        ratio = (inter_w * inter_h) / areas[rest]

        # Drop the kept box and everything overlapping it too strongly.
        drop = np.concatenate(
            (np.array([tail]), np.where(ratio > overlapThresh)[0])
        )
        order = np.delete(order, drop)

    if classes is not None:
        return boxes[kept], scores[kept], classes[kept]
    return boxes[kept], scores[kept]
101
-
102
-
103
def iou(
    bbox1: Union[list[float], tuple[float, float, float, float]],
    bbox2: Union[list[float], tuple[float, float, float, float]],
) -> float:
    """Calculate the intersection-over-union of two bounding boxes.

    Args:
        bbox1 (list or tuple of floats): bounding box in format x1,y1,x2,y2.
        bbox2 (list or tuple of floats): bounding box in format x1,y1,x2,y2.

    Returns:
        float: intersection-over-union of bbox1 and bbox2 in [0.0, 1.0];
            0.0 if the boxes do not overlap.
    """
    # Coerce coordinates to float without rebinding the parameters.
    (x0_1, y0_1, x1_1, y1_1) = (float(value) for value in bbox1)
    (x0_2, y0_2, x1_2, y1_2) = (float(value) for value in bbox2)

    # Overlap rectangle (degenerate if the boxes are disjoint).
    overlap_x0 = max(x0_1, x0_2)
    overlap_y0 = max(y0_1, y0_2)
    overlap_x1 = min(x1_1, x1_2)
    overlap_y1 = min(y1_1, y1_2)

    # No overlap: return a float to honor the declared return type
    # (previously returned int 0).
    if overlap_x1 - overlap_x0 <= 0 or overlap_y1 - overlap_y0 <= 0:
        return 0.0

    # Ratio of the overlap area to the unified area of both boxes.
    size_1 = (x1_1 - x0_1) * (y1_1 - y0_1)
    size_2 = (x1_2 - x0_2) * (y1_2 - y0_2)
    size_intersection = (overlap_x1 - overlap_x0) * (overlap_y1 - overlap_y0)
    size_union = size_1 + size_2 - size_intersection

    return size_intersection / size_union
@@ -1,453 +0,0 @@
1
- import re
2
- from dataclasses import dataclass
3
- from datetime import datetime, timedelta
4
- from pathlib import Path
5
- from typing import Any
6
-
7
- from OTVision import dataformat, version
8
- from OTVision.dataformat import (
9
- CLASS,
10
- CONFIDENCE,
11
- DATA,
12
- DATE_FORMAT,
13
- DETECTIONS,
14
- EXPECTED_DURATION,
15
- FILENAME,
16
- FRAME,
17
- INPUT_FILE_PATH,
18
- INTERPOLATED_DETECTION,
19
- OCCURRENCE,
20
- OTTRACK_VERSION,
21
- RECORDED_START_DATE,
22
- TRACK_ID,
23
- VIDEO,
24
- H,
25
- W,
26
- X,
27
- Y,
28
- )
29
- from OTVision.helpers.date import (
30
- parse_date_string_to_utc_datime,
31
- parse_timestamp_string_to_utc_datetime,
32
- )
33
- from OTVision.helpers.files import (
34
- FULL_FILE_NAME_PATTERN,
35
- HOSTNAME,
36
- InproperFormattedFilename,
37
- read_json,
38
- read_json_bz2_metadata,
39
- )
40
-
41
# Fallback recording start date when the metadata lacks RECORDED_START_DATE.
# NOTE(review): this datetime is naive, while parse_datetime returns
# UTC-aware datetimes — sorting or subtracting groups that mix both would
# raise TypeError; confirm callers never compare the two.
MISSING_START_DATE = datetime(1900, 1, 1)
# Fallback recording length when the metadata lacks EXPECTED_DURATION.
MISSING_EXPECTED_DURATION = timedelta(minutes=15)
43
-
44
-
45
def parse_datetime(date: str | float) -> datetime:
    """Parse a date string or timestamp to a datetime with UTC as timezone.

    Args:
        date (str | float): the date to parse

    Returns:
        datetime: the parsed datetime object with UTC set as timezone
    """
    # A "-" inside a string marks a formatted date; everything else is
    # treated as a UNIX timestamp.
    is_formatted_date = isinstance(date, str) and "-" in date
    if is_formatted_date:
        return parse_date_string_to_utc_datime(date, DATE_FORMAT)
    return parse_timestamp_string_to_utc_datetime(date)
57
-
58
-
59
@dataclass(frozen=True, repr=True)
class Detection:
    """Single detection: classified label, confidence and bounding box."""

    label: str  # classified object type
    conf: float  # detection confidence
    x: float  # bounding box x coordinate
    y: float  # bounding box y coordinate
    w: float  # bounding box width
    h: float  # bounding box height

    def to_dict(self, frame: int, occurrence: datetime, input_file_path: str) -> dict:
        """Serialize for a tracked frame: box data plus frame context."""
        serialized = self.to_otdet()
        serialized.update(
            {
                FRAME: frame,
                OCCURRENCE: occurrence.timestamp(),
                INPUT_FILE_PATH: input_file_path,
                INTERPOLATED_DETECTION: False,
            }
        )
        return serialized

    def to_otdet(self) -> dict:
        """Serialize only the otdet detection attributes."""
        return {
            CLASS: self.label,
            CONFIDENCE: self.conf,
            X: self.x,
            Y: self.y,
            W: self.w,
            H: self.h,
        }
95
-
96
-
97
@dataclass(frozen=True)
class Frame:
    """All detections of a single video frame plus their provenance."""

    frame: int  # frame number within the input file
    occurrence: datetime  # time the frame occurred
    input_file_path: Path  # otdet file the frame was read from
    detections: list[Detection]

    def to_dict(self) -> dict:
        """Serialize the frame and every contained detection."""
        posix_path = self.input_file_path.as_posix()
        return {
            FRAME: self.frame,
            OCCURRENCE: self.occurrence.timestamp(),
            INPUT_FILE_PATH: posix_path,
            DETECTIONS: [
                current.to_dict(self.frame, self.occurrence, posix_path)
                for current in self.detections
            ],
        }

    def derive_frame_number(self, new_frame_number: int) -> "Frame":
        """Copy of this frame carrying a new frame number."""
        return Frame(
            new_frame_number,
            self.occurrence,
            self.input_file_path,
            self.detections,
        )

    def get_output_file(self, with_suffix: str) -> Path:
        """Path of the corresponding output file with the given suffix."""
        return self.input_file_path.with_suffix(with_suffix)
124
-
125
-
126
class FrameGroup:
    """Groups otdet files that belong to one continuous recording.

    Keeps the covered time interval, the recording hostname and per-file
    metadata keyed by the file's POSIX path.
    """

    def __init__(
        self,
        start_date: datetime,
        end_date: datetime,
        hostname: str,
        file: Path | None,
        metadata: dict | None,
    ) -> None:
        # Metadata per file, keyed by the file's POSIX path.
        self._files_metadata: dict[str, dict] = dict()
        self._files: list[Path] = []
        # Both file and metadata must be given to register the file;
        # _merge() creates an empty group by passing None for both.
        if (file is not None) and (metadata is not None):
            self._files_metadata[file.as_posix()] = metadata
            self._files.append(file)

        self.hostname = hostname
        self._start_date = start_date
        self._end_date = end_date

    @property
    def files(self) -> list[Path]:
        # Files contained in this group, in insertion (merge) order.
        return self._files

    def metadata_for(self, file: Path | str) -> dict:
        """Return metadata of the given file (Path or POSIX path string).

        Raises:
            KeyError: if the file is not part of this group.
        """
        if isinstance(file, str):
            return self._files_metadata[file]
        else:
            return self._files_metadata[file.as_posix()]

    def start_date(self) -> datetime:
        # Start of the covered recording interval.
        return self._start_date

    def end_date(self) -> datetime:
        # End of the covered recording interval.
        return self._end_date

    def merge(self, other: "FrameGroup") -> "FrameGroup":
        """Merge this group with another into a new, chronologically
        ordered group; neither input group is modified."""
        if self.start_date() < other.start_date():
            return self._merge(self, other)
        else:
            return self._merge(other, self)

    def _merge(self, first: "FrameGroup", second: "FrameGroup") -> "FrameGroup":
        """Merge two groups, assuming `first` starts no later than `second`.

        Raises:
            ValueError: if the hostnames of both groups differ.
        """
        if first.hostname != second.hostname:
            raise ValueError("Hostname of FrameGroups does not match")
        # Interval spans from the earlier start to the later end.
        merged = FrameGroup(
            start_date=first._start_date,
            end_date=second._end_date,
            hostname=self.hostname,
            file=None,
            metadata=None,
        )

        # Copy file registrations of both inputs into the fresh group.
        merged._files_metadata.update(first._files_metadata)
        merged._files_metadata.update(second._files_metadata)
        merged._files += first.files
        merged._files += second.files

        return merged

    def __repr__(self) -> str:
        return self.__str__()

    def __str__(self) -> str:
        return f"{self._start_date} - {self._end_date}"

    def update_metadata(self, tracker_data: dict[str, dict]) -> None:
        """Write ottrack version and tracking info into each file's metadata.

        Mutates the stored metadata dicts in place.
        """
        for filepath in self.files:
            metadata = self.metadata_for(filepath)
            metadata[OTTRACK_VERSION] = version.ottrack_version()
            metadata[dataformat.TRACKING] = {
                dataformat.OTVISION_VERSION: version.otvision_version(),
                dataformat.FIRST_TRACKED_VIDEO_START: self.start_date().timestamp(),
                dataformat.LAST_TRACKED_VIDEO_END: self.end_date().timestamp(),
                dataformat.TRACKER: tracker_data,
            }
201
-
202
-
203
@dataclass(frozen=True)
class FrameChunk:
    """A parsed otdet file: its path and the frames it contains."""

    file: Path
    frames: list[Frame]

    def start_date(self) -> datetime:
        """Occurrence of the first frame."""
        return self.frames[0].occurrence

    def end_date(self) -> datetime:
        """Occurrence of the last frame."""
        return self.frames[-1].occurrence

    def last_frame_id(self) -> int:
        """Frame number of the last frame."""
        return self.frames[-1].frame

    def get_existing_output_files(self, with_suffix: str) -> list[Path]:
        """Distinct output files with the given suffix that exist on disk."""
        candidates = {
            frame.get_output_file(with_suffix=with_suffix) for frame in self.frames
        }
        return [candidate for candidate in candidates if candidate.is_file()]

    def to_dict(self) -> dict:
        """Serialize as a mapping of frame number to frame data."""
        return {
            DATA: {frame.frame: frame.to_dict() for frame in self.frames},
        }

    def __repr__(self) -> str:
        return self.__str__()

    def __str__(self) -> str:
        return str(self.file)
234
-
235
-
236
class FrameIndexer:
    """Flattens tracked detections and rebases their frame numbers."""

    def reindex(self, frames: dict[str, dict], frame_offset: int) -> list[dict]:
        """Flatten per-track detections, shift frame numbers and sort.

        Consecutive tracks over more than one video must have their frame
        numbers reset to one when splitting; subtracting frame_offset from
        each detection (in place) achieves this.

        Args:
            frames (dict[str, dict]): detections grouped by track.
            frame_offset (int): offset to subtract from every frame number.

        Returns:
            list[dict]: detections sorted by file path, frame and track id.
        """
        flattened = [
            detection
            for track in frames.values()
            for detection in track.values()
        ]
        for detection in flattened:
            detection[FRAME] = detection[FRAME] - frame_offset

        if not flattened:
            return []

        # All detections are expected to stem from a single input file.
        assert len({detection[INPUT_FILE_PATH] for detection in flattened}) == 1

        flattened.sort(
            key=lambda detection: (
                detection[INPUT_FILE_PATH],
                detection[FRAME],
                detection[TRACK_ID],
            )
        )

        return flattened
261
-
262
-
263
class DetectionParser:
    """Converts raw detection dictionaries into Detection instances."""

    def convert(self, data_detections: list[dict[str, str]]) -> list[Detection]:
        """Build one Detection per input dict, coercing numbers to float."""
        return [
            Detection(
                entry[CLASS],
                float(entry[CONFIDENCE]),
                float(entry[X]),
                float(entry[Y]),
                float(entry[W]),
                float(entry[H]),
            )
            for entry in data_detections
        ]
277
-
278
-
279
class FrameChunkParser:
    """Reads otdet files and converts their data section to FrameChunks."""

    @staticmethod
    def parse(
        file_path: Path,
        frame_offset: int = 0,
    ) -> FrameChunk:
        """Read the given otdet file and convert its data section."""
        file_data: dict[int, dict[str, Any]] = read_json(file_path)[DATA]
        return FrameChunkParser.convert(file_data, file_path, frame_offset)

    @staticmethod
    def convert(
        input: dict[int, dict[str, Any]],
        file_path: Path,
        frame_offset: int = 0,
    ) -> FrameChunk:
        """Convert raw frame data into a FrameChunk.

        Frame numbers are shifted by frame_offset and the resulting frames
        are sorted by occurrence, then frame number.
        """
        parser = DetectionParser()
        frames = [
            Frame(
                int(frame_key) + frame_offset,
                occurrence=parse_datetime(frame_value[OCCURRENCE]),
                input_file_path=file_path,
                detections=parser.convert(frame_value[DETECTIONS]),
            )
            for frame_key, frame_value in input.items()
        ]

        frames.sort(key=lambda frame: (frame.occurrence, frame.frame))
        return FrameChunk(file_path, frames)
310
-
311
-
312
class Preprocess:
    """Preprocess otdet file metadata (recording time interval) before running track.
    Input files belonging to the same recording will be merged together.
    The time gap to separate two recordings from each other is defined by
    `self.time_without_frames`.

    Returns:
        Preprocess: preprocessor for tracking
    """

    def __init__(self, time_without_frames: timedelta = timedelta(minutes=1)) -> None:
        # Maximum gap between two files still considered one recording.
        self.time_without_frames = time_without_frames

    def run(self, files: list[Path]) -> list[FrameGroup]:
        """Read metadata of all input files,
        parse the content and merge the frame groups belonging together.

        Args:
            files (list[Path]): list of input files

        Returns:
            list[FrameGroup]: merged frame groups sorted by start date
        """

        groups = self.process(self._read_input(files))
        return sorted(groups, key=lambda r: r.start_date())

    def process(self, input: dict[Path, dict]) -> list[FrameGroup]:
        """Process given otdet files:
        Create FrameGroup for each file then merge frame groups belonging together.

        Args:
            input (dict[Path, dict]): metadata per otdet file path

        Returns:
            list[FrameGroup]: parsed and merged frame groups
        """
        all_groups = [
            self._parse_frame_group(path, metadata) for path, metadata in input.items()
        ]
        if len(all_groups) == 0:
            return []
        return self._merge_groups(all_groups)

    def _read_input(self, files: list[Path]) -> dict[Path, dict]:
        # Only the (bz2-compressed) metadata section is read per file.
        return {path: read_json_bz2_metadata(path) for path in files}

    def _parse_frame_group(self, file_path: Path, metadata: dict) -> FrameGroup:
        """Read and parse metadata of the given file to a FrameGroup
        covering the recording time interval defined by:
        - the recorded start date and
        - the expected duration given in the metadata

        Args:
            file_path (Path): path of otdet file
            metadata (dict): metadata of otdet file

        Returns:
            FrameGroup: parsed input and metadata of the file
        """

        start_date: datetime = self.extract_start_date_from(metadata)
        duration: timedelta = self.extract_expected_duration_from(metadata)
        end_date: datetime = start_date + duration
        hostname = self.get_hostname(metadata)

        return FrameGroup(
            start_date=start_date,
            end_date=end_date,
            file=file_path,
            metadata=metadata,
            hostname=hostname,
        )

    @staticmethod
    def get_hostname(file_metadata: dict) -> str:
        """Retrieve hostname from the given file metadata.

        The hostname is extracted from the recorded video's file name.

        Args:
            file_metadata (dict): metadata content.

        Raises:
            InproperFormattedFilename: if the filename is not formatted as expected, an
                exception will be raised.

        Returns:
            str: the hostname
        """
        video_name = Path(file_metadata[VIDEO][FILENAME]).name
        match = re.search(
            FULL_FILE_NAME_PATTERN,
            video_name,
        )
        if match:
            return match.group(HOSTNAME)

        raise InproperFormattedFilename(
            f"Could not parse {video_name} with pattern: {FULL_FILE_NAME_PATTERN}."
        )

    def _merge_groups(self, all_groups: list[FrameGroup]) -> list[FrameGroup]:
        """Merge frame groups whose start and end times are close to each other. Close
        is defined by `self.time_without_frames`.

        Args:
            all_groups (list[FrameGroup]): list of frame groups to merge

        Returns:
            list[FrameGroup]: list of merged frame groups
        """
        assert len(all_groups) >= 1

        merged_groups = []
        # Process chronologically so only adjacent groups need comparing.
        sorted_groups = sorted(all_groups, key=lambda group: group.start_date())
        last_group = sorted_groups[0]
        for current_group in sorted_groups[1:]:
            if last_group.hostname != current_group.hostname:
                # Different recording device: never merge.
                merged_groups.append(last_group)
                last_group = current_group
            elif (
                timedelta(seconds=0)
                <= (current_group.start_date() - last_group.end_date())
                <= self.time_without_frames
            ):
                # Gap is non-negative and small enough: same recording.
                last_group = last_group.merge(current_group)
            else:
                merged_groups.append(last_group)
                last_group = current_group
        merged_groups.append(last_group)
        return merged_groups

    def extract_start_date_from(self, metadata: dict) -> datetime:
        # Falls back to MISSING_START_DATE if no start date was recorded.
        if RECORDED_START_DATE in metadata[VIDEO].keys():
            recorded_start_date = metadata[VIDEO][RECORDED_START_DATE]
            return parse_datetime(recorded_start_date)
        return MISSING_START_DATE

    def extract_expected_duration_from(self, metadata: dict) -> timedelta:
        # Falls back to MISSING_EXPECTED_DURATION if no duration is given.
        if EXPECTED_DURATION in metadata[VIDEO].keys():
            expected_duration = metadata[VIDEO][EXPECTED_DURATION]
            return timedelta(seconds=int(expected_duration))
        return MISSING_EXPECTED_DURATION