supervisely-6.73.321-py3-none-any.whl → supervisely-6.73.322-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
--- a/supervisely/convert/base_converter.py
+++ b/supervisely/convert/base_converter.py
@@ -65,6 +65,7 @@ class AvailablePointcloudEpisodesConverters:
     SLY = "supervisely"
     BAG = "rosbag"
     LYFT = "lyft"
+    KITTI360 = "kitti360"
 
 
 class AvailableVolumeConverters:
--- a/supervisely/convert/pointcloud_episodes/__init__.py
+++ b/supervisely/convert/pointcloud_episodes/__init__.py
@@ -7,3 +7,4 @@ from supervisely.convert.pointcloud_episodes.lyft.lyft_converter import LyftEpis
 from supervisely.convert.pointcloud_episodes.nuscenes_conv.nuscenes_converter import (
     NuscenesEpisodesConverter,
 )
+from supervisely.convert.pointcloud_episodes.kitti_360.kitti_360_converter import KITTI360Converter
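
The two hunks above wire the new format into the SDK: a registry string in AvailablePointcloudEpisodesConverters and a package-level import of the converter class. A minimal sketch of the relationship (only the import below is taken from the diff; the rest is illustration):

```python
# The registry entry is a plain string constant; the converter identifies
# itself with the same value via __str__ (defined in the next hunk).
from supervisely.convert.base_converter import AvailablePointcloudEpisodesConverters

print(AvailablePointcloudEpisodesConverters.KITTI360)  # -> "kitti360"
# For any KITTI360Converter instance `conv`:
#     str(conv) == AvailablePointcloudEpisodesConverters.KITTI360  # True
```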
--- /dev/null
+++ b/supervisely/convert/pointcloud_episodes/kitti_360/kitti_360_converter.py
@@ -0,0 +1,242 @@
+import os
+from pathlib import Path
+from typing import Optional, List
+from supervisely import PointcloudEpisodeAnnotation, ProjectMeta, is_development, logger, ObjClass, ObjClassCollection
+from supervisely.geometry.cuboid_3d import Cuboid3d
+from supervisely.api.api import Api, ApiField
+from supervisely.convert.base_converter import AvailablePointcloudEpisodesConverters
+from supervisely.convert.pointcloud_episodes.kitti_360.kitti_360_helper import *
+from supervisely.convert.pointcloud_episodes.pointcloud_episodes_converter import PointcloudEpisodeConverter
+from supervisely.io.fs import (
+    file_exists,
+    get_file_name,
+    get_file_name_with_ext,
+    list_files_recursively,
+    silent_remove,
+)
+from supervisely.pointcloud_annotation.pointcloud_episode_frame_collection import PointcloudEpisodeFrameCollection
+from supervisely.pointcloud_annotation.pointcloud_episode_object_collection import PointcloudEpisodeObjectCollection
+from supervisely.pointcloud_annotation.pointcloud_episode_object import PointcloudEpisodeObject
+from supervisely.pointcloud_annotation.pointcloud_episode_frame import PointcloudEpisodeFrame
+from supervisely.pointcloud_annotation.pointcloud_figure import PointcloudFigure
+
+class KITTI360Converter(PointcloudEpisodeConverter):
+
+    class Item:
+
+        def __init__(
+            self,
+            scene_name: str,
+            frame_paths: List[str],
+            ann_data: Annotation3D,
+            poses_path: str,
+            related_images: Optional[tuple] = None,
+            custom_data: Optional[dict] = None,
+        ):
+            self._scene_name = scene_name
+            self._frame_paths = frame_paths
+            self._ann_data = ann_data
+            self._poses_path = poses_path
+            self._related_images = related_images or []
+
+            self._type = "point_cloud_episode"
+            self._custom_data = custom_data if custom_data is not None else {}
+
+    def __init__(self, *args, **kwargs):
+        self._calib_path = None
+        super().__init__(*args, **kwargs)
+
+    def __str__(self) -> str:
+        return AvailablePointcloudEpisodesConverters.KITTI360
+
+    @property
+    def key_file_ext(self) -> str:
+        return ".bin"
+
+    def validate_format(self) -> bool:
+        try:
+            import kitti360scripts
+        except ImportError:
+            logger.warn("Please run 'pip install kitti360Scripts' to import KITTI-360 data.")
+            return False
+
+        self._items = []
+        subdirs = os.listdir(self._input_data)
+        if len(subdirs) == 1:
+            self._input_data = os.path.join(self._input_data, subdirs[0])
+
+        # * Get calibration path
+        calib_dir = next(iter([(Path(path).parent).as_posix() for path in list_files_recursively(self._input_data, [".txt"], None, True) if Path(path).stem.startswith("calib")]), None)
+        if calib_dir is None:
+            return False
+        self._calib_path = calib_dir
+
+        # * Get pointcloud files paths
+        velodyne_files = list_files_recursively(self._input_data, [".bin"], None, True)
+        if len(velodyne_files) == 0:
+            return False
+
+        # * Get annotation files paths and related images
+        boxes_ann_files = list_files_recursively(self._input_data, [".xml"], None, True)
+        if len(boxes_ann_files) == 0:
+            return False
+        rimage_files = list_files_recursively(self._input_data, [".png"], None, True)
+
+        kitti_anns = []
+        for ann_file in boxes_ann_files:
+            key_name = Path(ann_file).stem
+
+            # * Get pointcloud files
+            frame_paths = []
+            for path in velodyne_files:
+                if key_name in Path(path).parts:
+                    frame_paths.append(path)
+            if len(frame_paths) == 0:
+                logger.warn("No frames found for name: %s", key_name)
+                continue
+
+            # * Get related images
+            rimages = []
+            for rimage in rimage_files:
+                path = Path(rimage)
+                if key_name in path.parts:
+                    cam_name = path.parts[-3]
+                    rimages.append((cam_name, rimage))
+
+            # * Get poses
+            poses_filter = (
+                lambda x: x.endswith("cam0_to_world.txt") and key_name in Path(x).parts
+            )
+            poses_path = next(
+                (path for path in list_files_recursively(self._input_data, [".txt"], None, True)
+                 if poses_filter(path)),
+                None,
+            )
+            if poses_path is None:
+                logger.warn("No poses found for name: %s", key_name)
+                continue
+
+            # * Parse annotation
+            ann = Annotation3D(ann_file)
+            kitti_anns.append(ann)
+
+            self._items.append(
+                self.Item(key_name, frame_paths, ann, poses_path, rimages)
+            )
+
+        # * Get object class names for meta
+        obj_class_names = set()
+        for ann in kitti_anns:
+            for obj in ann.get_objects():
+                obj_class_names.add(obj.name)
+        obj_classes = [ObjClass(obj_class, Cuboid3d) for obj_class in obj_class_names]
+        self._meta = ProjectMeta(obj_classes=ObjClassCollection(obj_classes))
+        return self.items_count > 0
+
+    def to_supervisely(
+        self,
+        item,
+        meta: ProjectMeta,
+        renamed_classes: dict = {},
+        renamed_tags: dict = {},
+        static_transformations: StaticTransformations = None,
+    ) -> PointcloudEpisodeAnnotation:
+        static_transformations.set_cam2world(item._poses_path)
+
+        frame_cnt = len(item._frame_paths)
+        objs, frames = [], []
+
+        frame_idx_to_figures = {idx: [] for idx in range(frame_cnt)}
+        for obj in item._ann_data.get_objects():
+            pcd_obj = PointcloudEpisodeObject(meta.get_obj_class(obj.name))
+            objs.append(pcd_obj)
+
+            for idx in range(frame_cnt):
+                if obj.start_frame <= idx <= obj.end_frame:
+                    tr_matrix = static_transformations.world_to_velo_transformation(obj, idx)
+                    geom = convert_kitti_cuboid_to_supervisely_geometry(tr_matrix)
+                    frame_idx_to_figures[idx].append(PointcloudFigure(pcd_obj, geom, idx))
+        for idx, figures in frame_idx_to_figures.items():
+            frame = PointcloudEpisodeFrame(idx, figures)
+            frames.append(frame)
+        obj_collection = PointcloudEpisodeObjectCollection(objs)
+        frame_collection = PointcloudEpisodeFrameCollection(frames)
+        return PointcloudEpisodeAnnotation(
+            frame_cnt, objects=obj_collection, frames=frame_collection
+        )
+
+    def upload_dataset(self, api: Api, dataset_id: int, batch_size: int = 1, log_progress=True):
+        meta, renamed_classes, renamed_tags = self.merge_metas_with_conflicts(api, dataset_id)
+
+        dataset_info = api.dataset.get_info_by_id(dataset_id)
+        if log_progress:
+            progress, progress_cb = self.get_progress(sum([len(item._frame_paths) for item in self._items]), "Converting pointcloud episodes...")
+        else:
+            progress_cb = None
+        static_transformations = StaticTransformations(self._calib_path)
+        scene_ds = dataset_info
+        multiple_items = self.items_count > 1
+        for item in self._items:
+            scene_ds = api.dataset.create(dataset_info.project_id, item._scene_name, parent_id=dataset_id) if multiple_items else dataset_info
+            frame_to_pcd_ids = {}
+            for idx, frame_path in enumerate(item._frame_paths):
+                # * Convert pointcloud from ".bin" to ".pcd"
+                pcd_path = str(Path(frame_path).with_suffix(".pcd"))
+                if file_exists(pcd_path):
+                    logger.warning(f"Overwriting file with path: {pcd_path}")
+                convert_bin_to_pcd(frame_path, pcd_path)
+
+                # * Upload pointcloud
+                pcd_name = get_file_name_with_ext(pcd_path)
+                info = api.pointcloud_episode.upload_path(scene_ds.id, pcd_name, pcd_path, {"frame": idx})
+                pcd_id = info.id
+                frame_to_pcd_ids[idx] = pcd_id
+
+                # * Clean up
+                silent_remove(pcd_path)
+
+                if log_progress:
+                    progress_cb(1)
+
+            # * Upload photocontext
+            rimage_jsons = []
+            cam_names = []
+            hashes = api.pointcloud_episode.upload_related_images(
+                [rimage_path for _, rimage_path in item._related_images]
+            )
+            for (cam_name, rimage_path), img, pcd_id in zip(
+                item._related_images, hashes, list(frame_to_pcd_ids.values())
+            ):
+                cam_num = int(cam_name[-1])
+                rimage_info = convert_calib_to_image_meta(
+                    get_file_name(rimage_path), static_transformations, cam_num
+                )
+                image_json = {
+                    ApiField.ENTITY_ID: pcd_id,
+                    ApiField.NAME: cam_name,
+                    ApiField.HASH: img,
+                    ApiField.META: rimage_info[ApiField.META],
+                }
+                rimage_jsons.append(image_json)
+                cam_names.append(cam_name)
+            if rimage_jsons:
+                api.pointcloud_episode.add_related_images(rimage_jsons, cam_names)
+
+            # * Convert annotation and upload
+            try:
+                ann = self.to_supervisely(
+                    item, meta, renamed_classes, renamed_tags, static_transformations
+                )
+                api.pointcloud_episode.annotation.append(scene_ds.id, ann, frame_to_pcd_ids)
+            except Exception as e:
+                logger.error(
+                    f"Failed to upload annotation for scene: {scene_ds.name}. Error: {repr(e)}",
+                    stack_info=False,
+                )
+                continue
+
+            logger.info(f"Dataset ID:{scene_ds.id} has been successfully uploaded.")
+
+        if log_progress:
+            if is_development():
+                progress.close()
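
A hypothetical end-to-end run of the converter added above. The constructor is inherited from the base PointcloudEpisodeConverter and is not shown in this diff, so the positional input-directory argument and the dataset id below are assumptions; in practice the SDK's import tooling discovers and instantiates converters itself:

```python
# Sketch only, not the SDK's documented entry point.
import supervisely as sly
from supervisely.convert.pointcloud_episodes.kitti_360.kitti_360_converter import KITTI360Converter

api = sly.Api.from_env()
converter = KITTI360Converter("/data/KITTI-360")  # assumed base-class signature

# validate_format() checks for calib*.txt, .bin frames, .xml boxes and
# cam0_to_world.txt poses, then builds self._items and self._meta.
if converter.validate_format():
    # Converts each .bin frame to .pcd, uploads frames, photo context and
    # Cuboid3d episode annotations, one nested dataset per scene.
    converter.upload_dataset(api, dataset_id=123)  # hypothetical dataset id
```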
--- /dev/null
+++ b/supervisely/convert/pointcloud_episodes/kitti_360/kitti_360_helper.py
@@ -0,0 +1,386 @@
+from supervisely import logger
+from supervisely.io.fs import get_file_name
+from supervisely.geometry.cuboid_3d import Cuboid3d
+from supervisely.geometry.point_3d import Vector3d
+from supervisely.geometry.point import Point
+
+from collections import defaultdict
+import os
+import numpy as np
+
+
+MAX_N = 1000
+
+
+def local2global(semanticId, instanceId):
+    globalId = semanticId * MAX_N + instanceId
+    if isinstance(globalId, np.ndarray):
+        return globalId.astype(int)
+    else:
+        return int(globalId)
+
+
+def global2local(globalId):
+    semanticId = globalId // MAX_N
+    instanceId = globalId % MAX_N
+    if isinstance(globalId, np.ndarray):
+        return semanticId.astype(int), instanceId.astype(int)
+    else:
+        return int(semanticId), int(instanceId)
+
+
+annotation2global = defaultdict()
+
+
+# Abstract base class for annotation objects
+class KITTI360Object:
+    from abc import ABCMeta
+
+    __metaclass__ = ABCMeta
+
+    def __init__(self):
+        from matplotlib import cm
+
+        # the label
+        self.label = ""
+
+        # colormap
+        self.cmap = cm.get_cmap("Set1")
+        self.cmap_length = 9
+
+    def getColor(self, idx):
+        if idx == 0:
+            return np.array([0, 0, 0])
+        return np.asarray(self.cmap(idx % self.cmap_length)[:3]) * 255.0
+
+    # def assignColor(self):
+    #     from kitti360scripts.helpers.labels import id2label  # pylint: disable=import-error
+
+    #     if self.semanticId >= 0:
+    #         self.semanticColor = id2label[self.semanticId].color
+    #         if self.instanceId > 0:
+    #             self.instanceColor = self.getColor(self.instanceId)
+    #         else:
+    #             self.instanceColor = self.semanticColor
+
+
+# Class that contains the information of a single annotated object as a 3D bounding box
+class KITTI360Bbox3D(KITTI360Object):
+    # Constructor
+    def __init__(self):
+        KITTI360Object.__init__(self)
+        # the polygon as list of points
+        self.vertices = []
+        self.faces = []
+        self.lines = [
+            [0, 5],
+            [1, 4],
+            [2, 7],
+            [3, 6],
+            [0, 1],
+            [1, 3],
+            [3, 2],
+            [2, 0],
+            [4, 5],
+            [5, 7],
+            [7, 6],
+            [6, 4],
+        ]
+
+        # the ID of the corresponding object
+        self.semanticId = -1
+        self.instanceId = -1
+        self.annotationId = -1
+
+        # the window that contains the bbox
+        self.start_frame = -1
+        self.end_frame = -1
+
+        # timestamp of the bbox (-1 if static)
+        self.timestamp = -1
+
+        # projected vertices
+        self.vertices_proj = None
+        self.meshes = []
+
+        # name
+        self.name = ""
+
+    def __str__(self):
+        return self.name
+
+    # def generateMeshes(self):
+    #     self.meshes = []
+    #     if self.vertices_proj:
+    #         for fidx in range(self.faces.shape[0]):
+    #             self.meshes.append(
+    #                 [
+    #                     Point(self.vertices_proj[0][int(x)], self.vertices_proj[1][int(x)])
+    #                     for x in self.faces[fidx]
+    #                 ]
+    #             )
+
+    def parseOpencvMatrix(self, node):
+        rows = int(node.find("rows").text)
+        cols = int(node.find("cols").text)
+        data = node.find("data").text.split(" ")
+
+        mat = []
+        for d in data:
+            d = d.replace("\n", "")
+            if len(d) < 1:
+                continue
+            mat.append(float(d))
+        mat = np.reshape(mat, [rows, cols])
+        return mat
+
+    def parseVertices(self, child):
+        transform = self.parseOpencvMatrix(child.find("transform"))
+        R = transform[:3, :3]
+        T = transform[:3, 3]
+        vertices = self.parseOpencvMatrix(child.find("vertices"))
+        faces = self.parseOpencvMatrix(child.find("faces"))
+
+        vertices = np.matmul(R, vertices.transpose()).transpose() + T
+        self.vertices = vertices
+        self.faces = faces
+        self.R = R
+        self.T = T
+
+        self.transform = transform
+
+    def parseBbox(self, child):
+        from kitti360scripts.helpers.labels import kittiId2label  # pylint: disable=import-error
+
+        semanticIdKITTI = int(child.find("semanticId").text)
+        self.semanticId = kittiId2label[semanticIdKITTI].id
+        self.instanceId = int(child.find("instanceId").text)
+        # self.name = str(child.find('label').text)
+        self.name = kittiId2label[semanticIdKITTI].name
+
+        self.start_frame = int(child.find("start_frame").text)
+        self.end_frame = int(child.find("end_frame").text)
+
+        self.timestamp = int(child.find("timestamp").text)
+
+        self.annotationId = int(child.find("index").text) + 1
+
+        global annotation2global
+        annotation2global[self.annotationId] = local2global(self.semanticId, self.instanceId)
+        self.parseVertices(child)
+
+    def parseStuff(self, child):
+        from kitti360scripts.helpers.labels import name2label  # pylint: disable=import-error
+
+        classmap = {
+            "driveway": "parking",
+            "ground": "terrain",
+            "unknownGround": "ground",
+            "railtrack": "rail track",
+        }
+        label = child.find("label").text
+        if label in classmap.keys():
+            label = classmap[label]
+
+        self.start_frame = int(child.find("start_frame").text)
+        self.end_frame = int(child.find("end_frame").text)
+
+        self.semanticId = name2label[label].id
+        self.instanceId = 0
+        self.parseVertices(child)
+
+
+# Class that contains the information of the point cloud of a single frame
+class KITTI360Point3D(KITTI360Object):
+    # Constructor
+    def __init__(self):
+        KITTI360Object.__init__(self)
+
+        self.vertices = []
+
+        self.vertices_proj = None
+
+        # the ID of the corresponding object
+        self.semanticId = -1
+        self.instanceId = -1
+        self.annotationId = -1
+
+        # name
+        self.name = ""
+
+        # color
+        self.semanticColor = None
+        self.instanceColor = None
+
+    def __str__(self):
+        return self.name
+
+    # def generateMeshes(self):
+    #     pass
+
+
+# Container class for the KITTI360Bbox3D objects of one annotation file
+class Annotation3D:
+    def __init__(self, labelPath):
+        from kitti360scripts.helpers.labels import labels  # pylint: disable=import-error
+        import xml.etree.ElementTree as ET
+
+        key_name = get_file_name(labelPath)
+        # load annotation
+        tree = ET.parse(labelPath)
+        root = tree.getroot()
+
+        self.objects = defaultdict(dict)
+
+        self.num_bbox = 0
+        for child in root:
+            if child.find("transform") is None:
+                continue
+            obj = KITTI360Bbox3D()
+            obj.parseBbox(child)
+            globalId = local2global(obj.semanticId, obj.instanceId)
+            self.objects[globalId][obj.timestamp] = obj
+            self.num_bbox += 1
+
+        globalIds = np.asarray(list(self.objects.keys()))
+        semanticIds, instanceIds = global2local(globalIds)
+        for label in labels:
+            if label.hasInstances:
+                print(f"{label.name:<30}:\t {(semanticIds==label.id).sum()}")
+        print(f"Loaded {len(globalIds)} instances")
+        print(f"Loaded {self.num_bbox} boxes")
+
+    def __call__(self, semanticId, instanceId, timestamp=None):
+        globalId = local2global(semanticId, instanceId)
+        if globalId in self.objects.keys():
+            # static object
+            if len(self.objects[globalId].keys()) == 1:
+                if -1 in self.objects[globalId].keys():
+                    return self.objects[globalId][-1]
+                else:
+                    return None
+            # dynamic object
+            else:
+                return self.objects[globalId][timestamp]
+        else:
+            return None
+
+    def get_objects(self):
+        return [list(obj.values())[0] for obj in self.objects.values()]
+
+class StaticTransformations:
+    def __init__(self, calibrations_path):
+        import kitti360scripts.devkits.commons.loadCalibration as lc  # pylint: disable=import-error
+
+        cam2velo_path = os.path.join(calibrations_path, "calib_cam_to_velo.txt")
+        self.cam2velo = lc.loadCalibrationRigid(cam2velo_path)
+        perspective_path = os.path.join(calibrations_path, "perspective.txt")
+        self.intrinsic_calibrations = lc.loadPerspectiveIntrinsic(perspective_path)
+        self.cam2world = None
+
+    def set_cam2world(self, cam2world_path):
+        if not os.path.isfile(cam2world_path):
+            logger.warn("Camera to world calibration file was not found")
+            return
+
+        cam2world_rows = np.loadtxt(cam2world_path)
+        cam2world_rigid = np.reshape(cam2world_rows[:, 1:], (-1, 4, 4))
+        frames_numbers = list(np.reshape(cam2world_rows[:, :1], (-1)).astype(int))
+        cam2world = {}
+
+        current_rigid = cam2world_rigid[0]
+
+        for frame_index in range(0, frames_numbers[-1]):
+            if frame_index in frames_numbers:
+                mapped_index = frames_numbers.index(frame_index)
+                current_rigid = cam2world_rigid[mapped_index]
+
+            # (Tr(cam -> world))
+            cam2world[frame_index] = current_rigid
+        self.cam2world = cam2world
+
+    def world_to_velo_transformation(self, obj, frame_index):
+        # rotate_z = Rotation.from_rotvec(np.pi * np.array([0, 0, 1])).as_matrix()
+        # rotate_z = np.hstack((rotate_z, np.asarray([[0, 0, 0]]).T))
+
+        # tr0(local -> fixed_coordinates_local)
+        tr0 = np.asarray([[0, -1, 0, 0], [1, 0, 0, 0], [0, 0, 1, 0], [0, 0, 0, 1]])
+
+        # tr1(fixed_coordinates_local -> world)
+        tr1 = obj.transform
+
+        # tr2(world -> cam)
+        tr2 = np.linalg.inv(self.cam2world[frame_index])
+
+        # tr3(cam -> velo)
+        tr3 = self.cam2velo
+
+        return tr3 @ tr2 @ tr1 @ tr0
+
+    def get_extrinsic_matrix(self):
+        return np.linalg.inv(self.cam2velo)[:3, :4]
+
+    def get_intrinsics_matrix(self, camera_num):
+        try:
+            matrix = self.intrinsic_calibrations[f"P_rect_0{camera_num}"][:3, :3]
+            return matrix
+        except KeyError:
+            logger.warn(f"Camera {camera_num} intrinsic matrix was not found")
+            return
+
+def convert_kitti_cuboid_to_supervisely_geometry(tr_matrix):
+    import transforms3d  # pylint: disable=import-error
+    from scipy.spatial.transform.rotation import Rotation
+
+    Tdash, Rdash, Zdash, _ = transforms3d.affines.decompose44(tr_matrix)
+
+    x, y, z = Tdash[0], Tdash[1], Tdash[2]
+    position = Vector3d(x, y, z)
+
+    rotation_angles = Rotation.from_matrix(Rdash).as_euler("xyz", degrees=False)
+    r_x, r_y, r_z = rotation_angles[0], rotation_angles[1], rotation_angles[2]
+
+    # Flip the bbox heading by adding π to the yaw while keeping its pose relative to the world
+    rotation = Vector3d(r_x, r_y, r_z + np.pi)
+
+    w, h, l = Zdash[0], Zdash[1], Zdash[2]
+    dimension = Vector3d(w, h, l)
+
+    return Cuboid3d(position, rotation, dimension)
+
+def convert_bin_to_pcd(src, dst):
+    import open3d as o3d  # pylint: disable=import-error
+
+    try:
+        bin = np.fromfile(src, dtype=np.float32).reshape(-1, 4)
+    except ValueError as e:
+        raise Exception(
+            f"Incorrect data in the KITTI 3D pointcloud file: {src}. "
+            f"There was an error while trying to reshape the data into a 4-column matrix: {e}. "
+            "Please ensure that the binary file contains a multiple of 4 elements to be "
+            "successfully reshaped into a (N, 4) array.\n"
+        )
+    points = bin[:, 0:3]
+    intensity = bin[:, -1]
+    intensity_fake_rgb = np.zeros((intensity.shape[0], 3))
+    intensity_fake_rgb[:, 0] = intensity
+    pc = o3d.geometry.PointCloud(o3d.utility.Vector3dVector(points))
+    pc.colors = o3d.utility.Vector3dVector(intensity_fake_rgb)
+    o3d.io.write_point_cloud(dst, pc)
+
+
+def convert_calib_to_image_meta(image_name, static, cam_num):
+    intrinsic_matrix = static.get_intrinsics_matrix(cam_num)
+    extrinsic_matrix = static.get_extrinsic_matrix()
+
+    data = {
+        "name": image_name,
+        "meta": {
+            "deviceId": cam_num,
+            "sensorsData": {
+                "extrinsicMatrix": list(extrinsic_matrix.flatten().astype(float)),
+                "intrinsicMatrix": list(intrinsic_matrix.flatten().astype(float)),
+            },
+        },
+    }
+    return data
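
The helper's id packing is worth a quick check: local2global packs a semantic id and an instance id into one integer as semanticId * MAX_N + instanceId, and global2local inverts it, so the encoding is lossless only while instanceId < MAX_N (1000). A self-contained verification using the same formulas as the helpers above:

```python
import numpy as np

MAX_N = 1000  # same constant as in kitti_360_helper.py

def local2global(semanticId, instanceId):
    return semanticId * MAX_N + instanceId

def global2local(globalId):
    return globalId // MAX_N, globalId % MAX_N

gid = local2global(26, 14)            # e.g. semantic class 26, instance 14
assert gid == 26014
assert global2local(gid) == (26, 14)  # round trip

# Vectorized form, matching the np.ndarray branches in the helpers:
gids = local2global(np.array([26, 26, 11]), np.array([14, 15, 0]))
sem, inst = global2local(gids)
assert sem.tolist() == [26, 26, 11] and inst.tolist() == [14, 15, 0]
```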
--- a/supervisely/nn/inference/inference.py
+++ b/supervisely/nn/inference/inference.py
@@ -1347,6 +1347,7 @@ class Inference:
             source=images_np,
             settings=settings,
         )
+        anns = self._exclude_duplicated_predictions(api, anns, settings, dataset_id, ids)
         results.extend(self._format_output(anns, slides_data))
         return results
 
@@ -1395,6 +1396,10 @@ class Inference:
             )
             self.cache.set_project_meta(output_project_id, output_project_meta)
 
+            ann = self._exclude_duplicated_predictions(
+                api, anns, settings, ds_info.id, [image_id], output_project_meta
+            )[0]
+
             logger.debug(
                 "Uploading annotation...",
                 extra={
@@ -1404,6 +1409,10 @@ class Inference:
                 },
             )
             api.annotation.upload_ann(image_id, ann)
+        else:
+            ann = self._exclude_duplicated_predictions(
+                api, anns, settings, image_info.dataset_id, [image_id]
+            )[0]
 
         result = self._format_output(anns, slides_data)[0]
         if async_inference_request_uuid is not None and ann is not None:
@@ -1786,6 +1795,15 @@ class Inference:
         batch_results = []
         for i, ann in enumerate(anns):
             image_info: ImageInfo = images_infos_dict[image_ids_batch[i]]
+            ds_info = dataset_infos_dict[image_info.dataset_id]
+            meta = output_project_metas_dict.get(ds_info.project_id, None)
+            iou = settings.get("existing_objects_iou_thresh")
+            if meta is None and isinstance(iou, float) and iou > 0:
+                meta = ProjectMeta.from_json(api.project.get_meta(ds_info.project_id))
+                output_project_metas_dict[ds_info.project_id] = meta
+            ann = self._exclude_duplicated_predictions(
+                api, [ann], settings, ds_info.id, [image_info.id], meta
+            )[0]
             batch_results.append(
                 {
                     "annotation": ann.to_json(),
@@ -2086,6 +2104,19 @@ class Inference:
                 source=images_nps,
                 settings=settings,
             )
+            iou = settings.get("existing_objects_iou_thresh")
+            if output_project_meta is None and isinstance(iou, float) and iou > 0:
+                output_project_meta = ProjectMeta.from_json(
+                    api.project.get_meta(project_info.id)
+                )
+            anns = self._exclude_duplicated_predictions(
+                api,
+                anns,
+                settings,
+                dataset_info.id,
+                [ii.id for ii in images_infos_batch],
+                output_project_meta,
+            )
             batch_results = []
             for i, ann in enumerate(anns):
                 batch_results.append(
@@ -2935,7 +2966,9 @@ class Inference:
         parser = argparse.ArgumentParser(description="Run Inference Serving")
 
         # Positional args
-        parser.add_argument("mode", nargs="?", type=str, help="Mode of operation: 'deploy' or 'predict'")
+        parser.add_argument(
+            "mode", nargs="?", type=str, help="Mode of operation: 'deploy' or 'predict'"
+        )
         parser.add_argument("input", nargs="?", type=str, help="Local path to input data")
 
         # Deploy args
@@ -3459,6 +3492,127 @@ class Inference:
                 f"Checkpoint {checkpoint_url} not found in Team Files. Cannot set workflow input"
             )
 
+    def _exclude_duplicated_predictions(
+        self,
+        api: Api,
+        pred_anns: List[Annotation],
+        settings: dict,
+        dataset_id: int,
+        gt_image_ids: List[int],
+        meta: Optional[ProjectMeta] = None,
+    ):
+        """
+        Filter out predictions that significantly overlap with ground truth (GT) objects.
+
+        This is a wrapper around the `_filter_duplicated_predictions_from_ann` method that does the following:
+            - Checks inference settings for the IoU threshold (`existing_objects_iou_thresh`)
+            - Gets ProjectMeta object if not provided
+            - Downloads GT annotations for the specified image IDs
+            - Filters out predictions that have an IoU greater than or equal to the specified threshold with any GT object
+
+        :param api: Supervisely API object
+        :type api: Api
+        :param pred_anns: List of Annotation objects containing predictions
+        :type pred_anns: List[Annotation]
+        :param settings: Inference settings
+        :type settings: dict
+        :param dataset_id: ID of the dataset containing the images
+        :type dataset_id: int
+        :param gt_image_ids: List of image IDs to filter predictions. All images should belong to the same dataset
+        :type gt_image_ids: List[int]
+        :param meta: ProjectMeta object
+        :type meta: Optional[ProjectMeta]
+        :return: List of Annotation objects containing filtered predictions
+        :rtype: List[Annotation]
+
+        Notes:
+        ------
+        - Requires PyTorch and torchvision for IoU calculations
+        - This method is useful for identifying new objects that aren't already annotated in the ground truth
+        """
+        iou = settings.get("existing_objects_iou_thresh")
+        if isinstance(iou, float) and 0 < iou <= 1:
+            if meta is None:
+                ds = api.dataset.get_info_by_id(dataset_id)
+                meta = ProjectMeta.from_json(api.project.get_meta(ds.project_id))
+            gt_anns = api.annotation.download_json_batch(dataset_id, gt_image_ids)
+            gt_anns = [Annotation.from_json(ann, meta) for ann in gt_anns]
+            for i in range(0, len(pred_anns)):
+                before = len(pred_anns[i].labels)
+                with Timer() as timer:
+                    pred_anns[i] = self._filter_duplicated_predictions_from_ann(
+                        gt_anns[i], pred_anns[i], iou
+                    )
+                after = len(pred_anns[i].labels)
+                logger.debug(
+                    f"{[i]}: applied NMS with IoU={iou}. Before: {before}, After: {after}. Time: {timer.get_time():.3f}ms"
+                )
+        return pred_anns
+
+    def _filter_duplicated_predictions_from_ann(
+        self, gt_ann: Annotation, pred_ann: Annotation, iou_threshold: float
+    ) -> Annotation:
+        """
+        Filter out predictions that significantly overlap with ground truth annotations.
+
+        This function compares each prediction with ground truth annotations of the same class
+        and removes predictions that have an IoU (Intersection over Union) greater than or equal
+        to the specified threshold with any ground truth annotation. This is useful for identifying
+        new objects that aren't already annotated in the ground truth.
+
+        :param gt_ann: Annotation object containing ground truth labels
+        :type gt_ann: Annotation
+        :param pred_ann: Annotation object containing prediction labels to be filtered
+        :type pred_ann: Annotation
+        :param iou_threshold: IoU threshold (0.0-1.0). Predictions with IoU >= threshold with any
+                              ground truth box of the same class will be removed
+        :type iou_threshold: float
+        :return: A new annotation object containing only predictions that don't significantly
+                 overlap with ground truth annotations
+        :rtype: Annotation
+
+
+        Notes:
+        ------
+        - Predictions with classes not present in ground truth will be kept
+        - Requires PyTorch and torchvision for IoU calculations
+        """
+
+        try:
+            import torch
+            from torchvision.ops import box_iou
+
+        except ImportError:
+            raise ImportError("Please install PyTorch and torchvision to use this feature.")
+
+        def _to_tensor(geom):
+            return torch.tensor([geom.left, geom.top, geom.right, geom.bottom]).float()
+
+        new_labels = []
+        pred_cls_bboxes = defaultdict(list)
+        for label in pred_ann.labels:
+            pred_cls_bboxes[label.obj_class.name].append(label)
+
+        gt_cls_bboxes = defaultdict(list)
+        for label in gt_ann.labels:
+            if label.obj_class.name not in pred_cls_bboxes:
+                continue
+            gt_cls_bboxes[label.obj_class.name].append(label)
+
+        for name, pred in pred_cls_bboxes.items():
+            gt = gt_cls_bboxes[name]
+            if len(gt) == 0:
+                new_labels.extend(pred)
+                continue
+            pred_bboxes = torch.stack([_to_tensor(l.geometry.to_bbox()) for l in pred]).float()
+            gt_bboxes = torch.stack([_to_tensor(l.geometry.to_bbox()) for l in gt]).float()
+            iou_matrix = box_iou(pred_bboxes, gt_bboxes)
+            iou_matrix = iou_matrix.cpu().numpy()
+            keep_indices = np.where(np.all(iou_matrix < iou_threshold, axis=1))[0]
+            new_labels.extend([pred[i] for i in keep_indices])
+
+        return pred_ann.clone(labels=new_labels)
+
 
 
 def _get_log_extra_for_inference_request(inference_request_uuid, inference_request: dict):
     log_extra = {
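
The filtering rule in _filter_duplicated_predictions_from_ann can be demonstrated without any Supervisely objects: a prediction is dropped as soon as its IoU with any ground-truth box of the same class reaches the threshold. A toy, self-contained version of that core step (the boxes are made up; torch and torchvision are the same dependencies the method itself imports):

```python
import numpy as np
import torch
from torchvision.ops import box_iou

iou_threshold = 0.5  # corresponds to the existing_objects_iou_thresh setting
gt_boxes = torch.tensor([[10.0, 10.0, 50.0, 50.0]])  # one GT box of some class
pred_boxes = torch.tensor([
    [12.0, 11.0, 49.0, 52.0],      # near-duplicate of the GT box -> removed
    [200.0, 200.0, 260.0, 240.0],  # no overlap with GT -> kept as a new object
])

# box_iou returns an [N_pred, N_gt] matrix; keep predictions whose IoU with
# every GT box stays below the threshold, exactly as in the SDK method.
iou_matrix = box_iou(pred_boxes, gt_boxes).numpy()
keep_indices = np.where(np.all(iou_matrix < iou_threshold, axis=1))[0]
print(keep_indices.tolist())  # [1]
```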
--- a/supervisely-6.73.321.dist-info/METADATA
+++ b/supervisely-6.73.322.dist-info/METADATA
@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: supervisely
-Version: 6.73.321
+Version: 6.73.322
 Summary: Supervisely Python SDK.
 Home-page: https://github.com/supervisely/supervisely
 Author: Supervisely
--- a/supervisely-6.73.321.dist-info/RECORD
+++ b/supervisely-6.73.322.dist-info/RECORD
@@ -565,7 +565,7 @@ supervisely/collection/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3
 supervisely/collection/key_indexed_collection.py,sha256=x2UVlkprspWhhae9oLUzjTWBoIouiWY9UQSS_MozfH0,37643
 supervisely/collection/str_enum.py,sha256=Zp29yFGvnxC6oJRYNNlXhO2lTSdsriU1wiGHj6ahEJE,1250
 supervisely/convert/__init__.py,sha256=ropgB1eebG2bfLoJyf2jp8Vv9UkFujaW3jVX-71ho1g,1353
-supervisely/convert/base_converter.py,sha256=eCFnvyoMI96rWjB5amFPZX2fI_TSdr__ruqxwQIbfFo,18537
+supervisely/convert/base_converter.py,sha256=rRMIxY3h7cX5WAu_qn7w9vzRBcDB_jLZm5u_XQh7QG4,18563
 supervisely/convert/converter.py,sha256=tWxTDfFv7hwzQhUQrBxzfr6WP8FUGFX_ewg5T2HbUYo,8959
 supervisely/convert/image/__init__.py,sha256=JEuyaBiiyiYmEUYqdn8Mog5FVXpz0H1zFubKkOOm73I,1395
 supervisely/convert/image/image_converter.py,sha256=8vak8ZoKTN1ye2ZmCTvCZ605-Rw1AFLIEo7bJMfnR68,10426
@@ -634,10 +634,13 @@ supervisely/convert/pointcloud/ply/ply_helper.py,sha256=YfLiV9m6a4NNEMs0J32dmMTL
 supervisely/convert/pointcloud/sly/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 supervisely/convert/pointcloud/sly/sly_pointcloud_converter.py,sha256=r56Rwil-55cRnd0sIePFGrf_xXa-lKQSfwhEUrjOquk,5070
 supervisely/convert/pointcloud/sly/sly_pointcloud_helper.py,sha256=kOluL97FfCFfIvnUE_FeN8iQLMlwdiMR5gayorOGDXw,3968
-supervisely/convert/pointcloud_episodes/__init__.py,sha256=tzrN8kKCpa-0PNp6s1uVIoGse_VKGb45KzCCUSYlH5Y,457
+supervisely/convert/pointcloud_episodes/__init__.py,sha256=LePLQFEjXwhXap2zOY9SVTbW_NMbxKYZKBjBdRLimKE,557
 supervisely/convert/pointcloud_episodes/pointcloud_episodes_converter.py,sha256=qULUzO96BvWgNVmyxSQ0pUPBPG3WHgUJuK_U7Z8NM-g,9428
 supervisely/convert/pointcloud_episodes/bag/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 supervisely/convert/pointcloud_episodes/bag/bag_converter.py,sha256=jzWKXoFUWu11d5WlPfT1hphCubYpq_lhQZmhh07xZdQ,1659
+supervisely/convert/pointcloud_episodes/kitti_360/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+supervisely/convert/pointcloud_episodes/kitti_360/kitti_360_converter.py,sha256=ls3Pgf9WYTtaTzf6nLCL3gMjG6zZ_EAVKE5OJSFAOPc,10033
+supervisely/convert/pointcloud_episodes/kitti_360/kitti_360_helper.py,sha256=EHyJTRfIpUC3lETJOCTI_OY4ddmT0eTFLMMhOvSeCm0,12372
 supervisely/convert/pointcloud_episodes/lyft/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 supervisely/convert/pointcloud_episodes/lyft/lyft_converter.py,sha256=QXreWUJ-QhoWgLPqRxCayatYCCCuSV6Z2XCZKScrD3o,10419
 supervisely/convert/pointcloud_episodes/nuscenes_conv/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
@@ -876,7 +879,7 @@ supervisely/nn/benchmark/visualization/widgets/table/__init__.py,sha256=47DEQpj8
 supervisely/nn/benchmark/visualization/widgets/table/table.py,sha256=atmDnF1Af6qLQBUjLhK18RMDKAYlxnsuVHMSEa5a-e8,4319
 supervisely/nn/inference/__init__.py,sha256=QFukX2ip-U7263aEPCF_UCFwj6EujbMnsgrXp5Bbt8I,1623
 supervisely/nn/inference/cache.py,sha256=q4F7ZRzZghNWSVFClXEIHNMNW4PK6xddYckCFUgyhCo,32027
-supervisely/nn/inference/inference.py,sha256=RJPTCd-y5FtQ234Zdbj7D6stsR3ZpVo8GLpiXXAr2Bg,158665
+supervisely/nn/inference/inference.py,sha256=SqfIgohv0U3USQpHerzkrnfIeC7JKGeQA49Tocliu1k,165877
 supervisely/nn/inference/session.py,sha256=jmkkxbe2kH-lEgUU6Afh62jP68dxfhF5v6OGDfLU62E,35757
 supervisely/nn/inference/video_inference.py,sha256=8Bshjr6rDyLay5Za8IB8Dr6FURMO2R_v7aELasO8pR4,5746
 supervisely/nn/inference/gui/__init__.py,sha256=wCxd-lF5Zhcwsis-wScDA8n1Gk_1O00PKgDviUZ3F1U,221
@@ -1075,9 +1078,9 @@ supervisely/worker_proto/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZ
 supervisely/worker_proto/worker_api_pb2.py,sha256=VQfi5JRBHs2pFCK1snec3JECgGnua3Xjqw_-b3aFxuM,59142
 supervisely/worker_proto/worker_api_pb2_grpc.py,sha256=3BwQXOaP9qpdi0Dt9EKG--Lm8KGN0C5AgmUfRv77_Jk,28940
 supervisely_lib/__init__.py,sha256=7-3QnN8Zf0wj8NCr2oJmqoQWMKKPKTECvjH9pd2S5vY,159
-supervisely-6.73.321.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
-supervisely-6.73.321.dist-info/METADATA,sha256=yVJfg3OU_JHg5N-hBOHneb0i5S2tBLYZsVQ9sdn67Co,33596
-supervisely-6.73.321.dist-info/WHEEL,sha256=P9jw-gEje8ByB7_hXoICnHtVCrEwMQh-630tKvQWehc,91
-supervisely-6.73.321.dist-info/entry_points.txt,sha256=U96-5Hxrp2ApRjnCoUiUhWMqijqh8zLR03sEhWtAcms,102
-supervisely-6.73.321.dist-info/top_level.txt,sha256=kcFVwb7SXtfqZifrZaSE3owHExX4gcNYe7Q2uoby084,28
-supervisely-6.73.321.dist-info/RECORD,,
+supervisely-6.73.322.dist-info/LICENSE,sha256=xx0jnfkXJvxRnG63LTGOxlggYnIysveWIZ6H3PNdCrQ,11357
+supervisely-6.73.322.dist-info/METADATA,sha256=tXlMoMRbbXrc18yQVTx6Ti09xSaTCC4TyKgLUoNIC_U,33596
+supervisely-6.73.322.dist-info/WHEEL,sha256=P9jw-gEje8ByB7_hXoICnHtVCrEwMQh-630tKvQWehc,91
+supervisely-6.73.322.dist-info/entry_points.txt,sha256=U96-5Hxrp2ApRjnCoUiUhWMqijqh8zLR03sEhWtAcms,102
+supervisely-6.73.322.dist-info/top_level.txt,sha256=kcFVwb7SXtfqZifrZaSE3owHExX4gcNYe7Q2uoby084,28
+supervisely-6.73.322.dist-info/RECORD,,