datamint 1.6.3.post1__py3-none-any.whl → 1.7.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release: this version of datamint has been flagged by the registry as possibly problematic.

@@ -15,9 +15,12 @@ import torch
 from torch import Tensor
 from datamint.apihandler.base_api_handler import DatamintException
 from medimgkit.dicom_utils import is_dicom
-import cv2
 from medimgkit.io_utils import read_array_normalized
 from datetime import datetime
+from pathlib import Path
+from mimetypes import guess_extension
+from datamint.dataset.annotation import Annotation
+import cv2
 
 _LOGGER = logging.getLogger(__name__)
 
@@ -27,12 +30,11 @@ class DatamintDatasetException(DatamintException):
 
 
 class DatamintBaseDataset:
-    """
-    Class to download and load datasets from the Datamint API.
+    """Class to download and load datasets from the Datamint API.
 
     Args:
-        root: Root directory of dataset where data already exists or will be downloaded.
         project_name: Name of the project to download.
+        root: Root directory of dataset where data already exists or will be downloaded.
         auto_update: If True, the dataset will be checked for updates and downloaded if necessary.
         api_key: API key to access the Datamint API. If not provided, it will look for the
             environment variable 'DATAMINT_API_KEY'. Not necessary if
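
The docstring reorder mirrors the new signature: `project_name` is now documented first, matching its position as the only required argument. Below is a minimal construction sketch based on the documented parameters; the import path, project name, and filter value are placeholders, not values taken from this diff:

```python
# Hypothetical usage sketch; the import path is assumed and
# "my-project" / "fracture" are placeholder values.
from datamint import DatamintBaseDataset  # import path assumed

dataset = DatamintBaseDataset(
    project_name="my-project",   # required, now the first argument
    root=None,                   # defaults to ~/.datamint/datasets
    auto_update=True,
    return_frame_by_frame=False,
    include_frame_label_names=["fracture"],  # placeholder filter
)
print(len(dataset))
```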
@@ -41,68 +43,114 @@ class DatamintBaseDataset:
         return_metainfo: If True, the metainfo of the image will be returned.
         return_annotations: If True, the annotations of the image will be returned.
         return_frame_by_frame: If True, each frame of a video/DICOM/3d-image will be returned separately.
-        include_unannotated: If True, images without annotations will be included. If False, images without annotations will be discarded.
+        include_unannotated: If True, images without annotations will be included.
         all_annotations: If True, all annotations will be downloaded, including the ones that are not set as closed/done.
         server_url: URL of the Datamint server. If not provided, it will use the default server.
-        include_annotators: List of annotators to include. If None, all annotators will be included. See parameter ``exclude_annotators``.
-        exclude_annotators: List of annotators to exclude. If None, no annotators will be excluded. See parameter ``include_annotators``.
+        include_annotators: List of annotators to include. If None, all annotators will be included.
+        exclude_annotators: List of annotators to exclude. If None, no annotators will be excluded.
         include_segmentation_names: List of segmentation names to include. If None, all segmentations will be included.
         exclude_segmentation_names: List of segmentation names to exclude. If None, no segmentations will be excluded.
         include_image_label_names: List of image label names to include. If None, all image labels will be included.
         exclude_image_label_names: List of image label names to exclude. If None, no image labels will be excluded.
         include_frame_label_names: List of frame label names to include. If None, all frame labels will be included.
         exclude_frame_label_names: List of frame label names to exclude. If None, no frame labels will be excluded.
-
     """
 
     DATAMINT_DEFAULT_DIR = ".datamint"
     DATAMINT_DATASETS_DIR = "datasets"
 
-    def __init__(self,
-                 project_name: str,
-                 root: str | None = None,
-                 auto_update: bool = True,
-                 api_key: Optional[str] = None,
-                 server_url: Optional[str] = None,
-                 return_dicom: bool = False,
-                 return_metainfo: bool = True,
-                 return_annotations: bool = True,
-                 return_frame_by_frame: bool = False,
-                 include_unannotated: bool = True,
-                 all_annotations: bool = False,
-                 # filtering parameters
-                 include_annotators: Optional[list[str]] = None,
-                 exclude_annotators: Optional[list[str]] = None,
-                 include_segmentation_names: Optional[list[str]] = None,
-                 exclude_segmentation_names: Optional[list[str]] = None,
-                 include_image_label_names: Optional[list[str]] = None,
-                 exclude_image_label_names: Optional[list[str]] = None,
-                 include_frame_label_names: Optional[list[str]] = None,
-                 exclude_frame_label_names: Optional[list[str]] = None
-                 ):
-        from datamint.apihandler.api_handler import APIHandler
+    def __init__(
+        self,
+        project_name: str,
+        root: str | None = None,
+        auto_update: bool = True,
+        api_key: Optional[str] = None,
+        server_url: Optional[str] = None,
+        return_dicom: bool = False,
+        return_metainfo: bool = True,
+        return_annotations: bool = True,
+        return_frame_by_frame: bool = False,
+        include_unannotated: bool = True,
+        all_annotations: bool = False,
+        # Filtering parameters
+        include_annotators: Optional[list[str]] = None,
+        exclude_annotators: Optional[list[str]] = None,
+        include_segmentation_names: Optional[list[str]] = None,
+        exclude_segmentation_names: Optional[list[str]] = None,
+        include_image_label_names: Optional[list[str]] = None,
+        exclude_image_label_names: Optional[list[str]] = None,
+        include_frame_label_names: Optional[list[str]] = None,
+        exclude_frame_label_names: Optional[list[str]] = None,
+    ):
+        self._validate_inputs(project_name, include_annotators, exclude_annotators,
+                              include_segmentation_names, exclude_segmentation_names,
+                              include_image_label_names, exclude_image_label_names,
+                              include_frame_label_names, exclude_frame_label_names)
+
+        self._initialize_config(
+            project_name, auto_update, all_annotations, return_dicom,
+            return_metainfo, return_annotations, return_frame_by_frame,
+            include_unannotated, include_annotators, exclude_annotators,
+            include_segmentation_names, exclude_segmentation_names,
+            include_image_label_names, exclude_image_label_names,
+            include_frame_label_names, exclude_frame_label_names
+        )
 
+        self._setup_api_handler(server_url, api_key, auto_update)
+        self._setup_directories(root)
+        self._setup_dataset()
+        self._post_process_data()
+
+    def _validate_inputs(
+        self,
+        project_name: str,
+        include_annotators: Optional[list[str]],
+        exclude_annotators: Optional[list[str]],
+        include_segmentation_names: Optional[list[str]],
+        exclude_segmentation_names: Optional[list[str]],
+        include_image_label_names: Optional[list[str]],
+        exclude_image_label_names: Optional[list[str]],
+        include_frame_label_names: Optional[list[str]],
+        exclude_frame_label_names: Optional[list[str]],
+    ) -> None:
+        """Validate input parameters."""
         if project_name is None:
             raise ValueError("project_name is required.")
 
+        # Validate mutually exclusive filtering parameters
+        filter_pairs = [
+            (include_annotators, exclude_annotators, "annotators"),
+            (include_segmentation_names, exclude_segmentation_names, "segmentation_names"),
+            (include_image_label_names, exclude_image_label_names, "image_label_names"),
+            (include_frame_label_names, exclude_frame_label_names, "frame_label_names"),
+        ]
+
+        for include_param, exclude_param, param_name in filter_pairs:
+            if include_param is not None and exclude_param is not None:
+                raise ValueError(f"Cannot set both include_{param_name} and exclude_{param_name} at the same time")
+
+    def _initialize_config(
+        self,
+        project_name: str,
+        auto_update: bool,
+        all_annotations: bool,
+        return_dicom: bool,
+        return_metainfo: bool,
+        return_annotations: bool,
+        return_frame_by_frame: bool,
+        include_unannotated: bool,
+        include_annotators: Optional[list[str]],
+        exclude_annotators: Optional[list[str]],
+        include_segmentation_names: Optional[list[str]],
+        exclude_segmentation_names: Optional[list[str]],
+        include_image_label_names: Optional[list[str]],
+        exclude_image_label_names: Optional[list[str]],
+        include_frame_label_names: Optional[list[str]],
+        exclude_frame_label_names: Optional[list[str]],
+    ) -> None:
+        """Initialize configuration parameters."""
+        self.project_name = project_name
         self.all_annotations = all_annotations
-        self.api_handler = APIHandler(root_url=server_url, api_key=api_key,
-                                      check_connection=auto_update)
-        self.server_url = self.api_handler.root_url
-        if root is None:
-            # store them in the home directory
-            root = os.path.join(os.path.expanduser("~"),
-                                DatamintBaseDataset.DATAMINT_DEFAULT_DIR)
-            root = os.path.join(root, DatamintBaseDataset.DATAMINT_DATASETS_DIR)
-            if not os.path.exists(root):
-                os.makedirs(root)
-        elif isinstance(root, str):
-            root = os.path.expanduser(root)
-            if not os.path.isdir(root):
-                raise NotADirectoryError(f"Root directory not found: {root}")
-
-        self.root = root
-
         self.return_dicom = return_dicom
         self.return_metainfo = return_metainfo
         self.return_frame_by_frame = return_frame_by_frame
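
The four copy-pasted include/exclude checks of 1.6.3 are collapsed here into one loop over `filter_pairs`. A standalone sketch of that pattern (a re-implementation for illustration, not the package API) showing the error it raises:

```python
# Minimal sketch of the mutually-exclusive filter check, assuming the
# same error message format as the diff above.
def check_filter_pair(include, exclude, name: str) -> None:
    # Either list may be None; setting both is rejected.
    if include is not None and exclude is not None:
        raise ValueError(f"Cannot set both include_{name} and exclude_{name} at the same time")

check_filter_pair(["alice"], None, "annotators")   # OK
check_filter_pair(None, ["bob"], "annotators")     # OK
try:
    check_filter_pair(["alice"], ["bob"], "annotators")
except ValueError as e:
    print(e)  # Cannot set both include_annotators and exclude_annotators at the same time
```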
@@ -120,108 +168,153 @@ class DatamintBaseDataset:
         self.include_frame_label_names = include_frame_label_names
         self.exclude_frame_label_names = exclude_frame_label_names
 
-        # Validate filtering parameters
-        if include_annotators is not None and exclude_annotators is not None:
-            raise ValueError("Cannot set both include_annotators and exclude_annotators at the same time")
-
-        if include_segmentation_names is not None and exclude_segmentation_names is not None:
-            raise ValueError("Cannot set both include_segmentation_names and exclude_segmentation_names at the same time")
-
-        if include_image_label_names is not None and exclude_image_label_names is not None:
-            raise ValueError("Cannot set both include_image_label_names and exclude_image_label_names at the same time")
-
-        if include_frame_label_names is not None and exclude_frame_label_names is not None:
-            raise ValueError("Cannot set both include_frame_label_names and exclude_frame_label_names at the same time")
+        # Internal state
+        self.__logged_uint16_conversion = False
+        self.auto_update = auto_update
 
-        self.project_name = project_name
-        dataset_name = project_name
+    def _setup_api_handler(self, server_url: Optional[str], api_key: Optional[str], auto_update: bool) -> None:
+        """Setup API handler and validate connection."""
+        from datamint.apihandler.api_handler import APIHandler
 
-        self.dataset_dir = os.path.join(root, dataset_name)
-        self.dataset_zippath = os.path.join(root, f'{dataset_name}.zip')
+        self.api_handler = APIHandler(
+            root_url=server_url,
+            api_key=api_key,
+            check_connection=auto_update
+        )
+        self.server_url = self.api_handler.root_url
+        self.api_key = self.api_handler.api_key
 
-        local_dataset_exists = os.path.exists(os.path.join(self.dataset_dir, 'dataset.json'))
+        if self.api_key is None:
+            _LOGGER.warning(
+                "API key not provided. If you want to download data, please provide an API key, "
+                f"either by passing it as an argument, "
+                f"setting environment variable {configs.ENV_VARS[configs.APIKEY_KEY]} or "
+                "using datamint-config command line tool."
+            )
 
-        if local_dataset_exists and auto_update == False:
-            # In this case, we don't need to check the API, so we don't need the id.
-            self.dataset_id = None
+    def _setup_directories(self, root: str | None) -> None:
+        """Setup root and dataset directories."""
+        if root is None:
+            root = os.path.join(
+                os.path.expanduser("~"),
+                self.DATAMINT_DEFAULT_DIR,
+                self.DATAMINT_DATASETS_DIR
+            )
+            os.makedirs(root, exist_ok=True)
         else:
-            self.project_info = self.get_info()
-            self.dataset_id = self.project_info['dataset_id']
+            root = os.path.expanduser(root)
+            if not os.path.isdir(root):
+                raise NotADirectoryError(f"Root directory not found: {root}")
 
-        self.api_key = self.api_handler.api_key
-        if self.api_key is None:
-            _LOGGER.warning("API key not provided. If you want to download data, please provide an API key, " +
-                            f"either by passing it as an argument," +
-                            f"setting environment variable {configs.ENV_VARS[configs.APIKEY_KEY]} or " +
-                            "using datamint-config command line tool."
-                            )
-
-        # Download/Updates the dataset, if necessary.
-        if local_dataset_exists:
-            _LOGGER.info(f"Dataset directory already exists: {self.dataset_dir}")
-            if auto_update:
+        self.root = root
+        self.dataset_dir = os.path.join(root, self.project_name)
+        self.dataset_zippath = os.path.join(root, f'{self.project_name}.zip')
+
+        if not os.path.exists(self.dataset_dir):
+            os.makedirs(self.dataset_dir, exist_ok=True)
+            os.makedirs(os.path.join(self.dataset_dir, 'images'), exist_ok=True)
+            os.makedirs(os.path.join(self.dataset_dir, 'masks'), exist_ok=True)
+
+    def _setup_dataset(self) -> None:
+        """Setup dataset by downloading or loading existing data."""
+        self._server_dataset_info = None
+        local_load_success = self._load_metadata()
+        self._handle_dataset_download_or_update(local_load_success)
+        self._apply_annotation_filters()
+
+    def _handle_dataset_download_or_update(self, local_load_success: bool) -> None:
+        """Handle dataset download or update logic."""
+
+        if local_load_success:
+            _LOGGER.debug(f"Dataset directory already exists: {self.dataset_dir}")
+            # Check for updates if auto_update is enabled and we have API access
+            if self.auto_update:
                 _LOGGER.info("Checking for updates...")
                 self._check_version()
         else:
-            if self.api_key is None:
-                raise DatamintDatasetException("API key is required to download the dataset.")
-            _LOGGER.info(f"No data found at {self.dataset_dir}. Downloading...")
-            self.download_project()
-
-        # Loads the metadata
-        if not hasattr(self, 'metainfo'):
-            with open(os.path.join(self.dataset_dir, 'dataset.json'), 'r') as file:
+            self._check_version()
+
+    def _load_metadata(self) -> bool:
+        """Load and process dataset metadata."""
+        if hasattr(self, 'metainfo'):
+            _LOGGER.warning("Metadata already loaded.")
+        metadata_path = os.path.join(self.dataset_dir, 'dataset.json')
+        if not os.path.isfile(metadata_path):
+            # get the server info
+            self.project_info = self.get_info()
+            self.metainfo = self._get_datasetinfo().copy()
+            self.metainfo['updated_at'] = None
+            self.metainfo['resources'] = []
+            self.metainfo['all_annotations'] = self.all_annotations
+            self.images_metainfo = self.metainfo['resources']
+            return False
+        else:
+            with open(metadata_path, 'r') as file:
                 self.metainfo = json.load(file)
             self.images_metainfo = self.metainfo['resources']
+            # Convert annotations from dict to Annotation objects
+            self._convert_metainfo_to_clsobj()
+            return True
 
-        # filter annotations
+    def _convert_metainfo_to_clsobj(self):
+        for imginfo in self.images_metainfo:
+            if 'annotations' in imginfo:
+                for ann in imginfo['annotations']:
+                    if 'resource_id' not in ann:
+                        ann['resource_id'] = imginfo['id']
+                    if 'id' not in ann:
+                        ann['id'] = None
+                imginfo['annotations'] = [Annotation.from_dict(ann) if isinstance(ann, dict) else ann
+                                          for ann in imginfo['annotations']]
+
+    def _apply_annotation_filters(self) -> None:
+        """Apply annotation filters and remove unannotated images if needed."""
+        # Filter annotations for each image
         for imginfo in self.images_metainfo:
             imginfo['annotations'] = self._filter_annotations(imginfo['annotations'])
 
-        # filter out images with no annotations.
+        # Filter out images with no annotations if needed
         if self.discard_without_annotations:
             original_count = len(self.images_metainfo)
             self.images_metainfo = self._filter_items(self.images_metainfo)
             _LOGGER.info(f"Discarded {original_count - len(self.images_metainfo)} images without annotations.")
 
+    def _post_process_data(self) -> None:
+        """Post-process data after loading metadata."""
         self._check_integrity()
+        self._calculate_dataset_length()
+        self._precompute_frame_data()
+        self._setup_labels()
 
-        # fix images_metainfo labels
-        # TODO: check tags
-        # for imginfo in self.images_metainfo:
-        #     if imginfo['frame_labels'] is not None:
-        #         for flabels in imginfo['frame_labels']:
-        #             if flabels['label'] is None:
-        #                 flabels['label'] = []
-        #             elif isinstance(flabels['label'], str):
-        #                 flabels['label'] = flabels['label'].split(',')
+        if self.discard_without_annotations and self.return_frame_by_frame:
+            self._filter_unannotated()
 
+    def _calculate_dataset_length(self) -> None:
+        """Calculate the total dataset length based on frame-by-frame setting."""
         if self.return_frame_by_frame:
-            self.dataset_length = 0
-            for imginfo in self.images_metainfo:
-                filepath = os.path.join(self.dataset_dir, imginfo['file'])
-                self.dataset_length += self.read_number_of_frames(filepath)
+            self.dataset_length = sum(
+                self.read_number_of_frames(os.path.join(self.dataset_dir, imginfo['file']))
+                for imginfo in self.images_metainfo
+            )
         else:
             self.dataset_length = len(self.images_metainfo)
 
+    def _precompute_frame_data(self) -> None:
+        """Precompute frame-related data for efficient indexing."""
         self.num_frames_per_resource = self.__compute_num_frames_per_resource()
-
-        # Precompute cumulative frame counts for faster index lookup
         self._cumulative_frames = np.cumsum([0] + self.num_frames_per_resource)
-
         self.subset_indices = list(range(self.dataset_length))
-        # self.labels_set, self.label2code, self.segmentation_labels, self.segmentation_label2code = self.get_labels_set()
+
+    def _setup_labels(self) -> None:
+        """Setup label sets and mappings."""
         self.frame_lsets, self.frame_lcodes = self._get_labels_set(framed=True)
         self.image_lsets, self.image_lcodes = self._get_labels_set(framed=False)
-        self.__logged_uint16_conversion = False
-        if self.discard_without_annotations and self.return_frame_by_frame:
-            # If we are returning frame by frame, we need to filter out frames without segmentations
-            self._filter_unannotated()
 
     def _filter_items(self, images_metainfo: list[dict]) -> list[dict]:
+        """Filter items that have annotations."""
         return [img for img in images_metainfo if len(img.get('annotations', []))]
 
-    def _filter_unannotated(self):
+    def _filter_unannotated(self) -> None:
         """Filter out frames that don't have any segmentations."""
         filtered_indices = []
         for i in range(len(self.subset_indices)):
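
`_precompute_frame_data` pairs `np.cumsum` with the binary search in the private `__find_index` helper (see the later hunk) to map a global frame index to a (resource, frame) pair. A self-contained sketch of that mapping, with invented frame counts:

```python
# Standalone illustration of the cumulative-frames indexing; the
# per-resource frame counts are made up for the example.
import numpy as np

num_frames_per_resource = [10, 1, 25]                  # e.g. a CT series, a PNG, a video
cumulative = np.cumsum([0] + num_frames_per_resource)  # array([ 0, 10, 11, 36])

def find_index(global_index: int) -> tuple[int, int]:
    # Locate the resource whose cumulative range contains the index,
    # then offset into that resource.
    resource_index = int(np.searchsorted(cumulative[1:], global_index, side='right'))
    return resource_index, global_index - int(cumulative[resource_index])

print(find_index(0))   # (0, 0)  -> first frame of the first resource
print(find_index(10))  # (1, 0)  -> the single-frame image
print(find_index(12))  # (2, 1)  -> second frame of the video
```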
@@ -229,124 +322,125 @@ class DatamintBaseDataset:
             annotations = item_meta.get('annotations', [])
 
             # Check if there are any segmentation annotations
-            has_segmentations = any(ann['type'] == 'segmentation' for ann in annotations)
+            has_segmentations = any(ann.type == 'segmentation' for ann in annotations)
 
             if has_segmentations:
                 filtered_indices.append(self.subset_indices[i])
 
         self.subset_indices = filtered_indices
-        print(f"Filtered dataset: {len(self.subset_indices)} frames with segmentations")
+        _LOGGER.debug(f"Filtered dataset: {len(self.subset_indices)} frames with segmentations")
 
     def __compute_num_frames_per_resource(self) -> list[int]:
-        num_frames_per_dicom = []
-        for imginfo in self.images_metainfo:
-            filepath = os.path.join(self.dataset_dir, imginfo['file'])
-            num_frames_per_dicom.append(self.read_number_of_frames(filepath))
-        return num_frames_per_dicom
+        """Compute number of frames for each resource."""
+        return [
+            self.read_number_of_frames(os.path.join(self.dataset_dir, imginfo['file']))
+            for imginfo in self.images_metainfo
+        ]
 
     @property
     def frame_labels_set(self) -> list[str]:
-        """
-        Returns the set of independent labels in the dataset.
-        This is more related to multi-label tasks.
-        """
+        """Returns the set of independent labels in the dataset (multi-label tasks)."""
         return self.frame_lsets['multilabel']
 
     @property
     def frame_categories_set(self) -> list[tuple[str, str]]:
-        """
-        Returns the set of categories in the dataset.
-        This is more related to multi-class tasks.
-        """
+        """Returns the set of categories in the dataset (multi-class tasks)."""
         return self.frame_lsets['multiclass']
 
     @property
     def image_labels_set(self) -> list[str]:
-        """
-        Returns the set of independent labels in the dataset.
-        This is more related to multi-label tasks.
-        """
+        """Returns the set of independent labels in the dataset (multi-label tasks)."""
         return self.image_lsets['multilabel']
 
     @property
     def image_categories_set(self) -> list[tuple[str, str]]:
-        """
-        Returns the set of categories in the dataset.
-        This is more related to multi-class tasks.
-        """
+        """Returns the set of categories in the dataset (multi-class tasks)."""
         return self.image_lsets['multiclass']
 
     @property
     def segmentation_labels_set(self) -> list[str]:
-        """
-        Returns the set of segmentation labels in the dataset.
-        """
+        """Returns the set of segmentation labels in the dataset."""
         return self.frame_lsets['segmentation']
 
-    def _get_annotations_internal(self,
-                                  annotations: list[dict],
-                                  type: Literal['label', 'category', 'segmentation', 'all'] = 'all',
-                                  scope: Literal['frame', 'image', 'all'] = 'all') -> list[dict]:
-        # check parameters
+    def _get_annotations_internal(
+        self,
+        annotations: list[Annotation],
+        type: Literal['label', 'category', 'segmentation', 'all'] = 'all',
+        scope: Literal['frame', 'image', 'all'] = 'all'
+    ) -> list[Annotation]:
+        """Internal method to filter annotations by type and scope."""
         if type not in ['label', 'category', 'segmentation', 'all']:
             raise ValueError(f"Invalid value for 'type': {type}")
         if scope not in ['frame', 'image', 'all']:
             raise ValueError(f"Invalid value for 'scope': {scope}")
 
-        annots = []
+        filtered_annotations = []
         for ann in annotations:
-            ann_scope = 'image' if ann.get('index', None) is None else 'frame'
-            if (type == 'all' or ann['type'] == type) and (scope == 'all' or scope == ann_scope):
-                annots.append(ann)
-        return annots
-
-    def get_annotations(self,
-                        index: int,
-                        type: Literal['label', 'category', 'segmentation', 'all'] = 'all',
-                        scope: Literal['frame', 'image', 'all'] = 'all') -> list[dict]:
-        """
-        Returns the annotations of the image at the given index.
+            ann_scope = 'image' if ann.index is None else 'frame'
+
+            type_matches = type == 'all' or ann.type == type
+            scope_matches = scope == 'all' or scope == ann_scope
+
+            if type_matches and scope_matches:
+                filtered_annotations.append(ann)
+
+        return filtered_annotations
+
+    def get_annotations(
+        self,
+        index: int,
+        type: Literal['label', 'category', 'segmentation', 'all'] = 'all',
+        scope: Literal['frame', 'image', 'all'] = 'all'
+    ) -> list[Annotation]:
+        """Returns the annotations of the image at the given index.
 
         Args:
-            index (int): Index of the image.
-            type (str): The type of the annotations. It can be 'label', 'category', 'segmentation' or 'all'.
-            scope (str): The scope of the annotations. It can be 'frame', 'image' or 'all'.
+            index: Index of the image.
+            type: The type of the annotations. Can be 'label', 'category', 'segmentation' or 'all'.
+            scope: The scope of the annotations. Can be 'frame', 'image' or 'all'.
 
         Returns:
-            list[dict]: The annotations of the image.
+            The annotations of the image.
         """
         if index >= len(self):
             raise IndexError(f"Index {index} out of bounds for dataset of length {len(self)}")
+
         imginfo = self._get_image_metainfo(index)
         return self._get_annotations_internal(imginfo['annotations'], type=type, scope=scope)
 
     @staticmethod
     def read_number_of_frames(filepath: str) -> int:
-        # if is dicom
+        """Read the number of frames in a file."""
         if is_dicom(filepath):
             ds = pydicom.dcmread(filepath)
-            return ds.NumberOfFrames if hasattr(ds, 'NumberOfFrames') else 1
-        # if is a video
-        elif filepath.endswith('.mp4') or filepath.endswith('.avi'):
+            return getattr(ds, 'NumberOfFrames', 1)
+        elif filepath.lower().endswith(('.mp4', '.avi')):
             cap = cv2.VideoCapture(filepath)
-            return int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
-        # if is a image
-        elif filepath.endswith('.png') or filepath.endswith('.jpg') or filepath.endswith('.jpeg'):
+            try:
+                return int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
+            finally:
+                cap.release()
+        elif filepath.lower().endswith(('.png', '.jpg', '.jpeg')):
             return 1
         else:
             raise ValueError(f"Unsupported file type: {filepath}")
 
     def get_resources_ids(self) -> list[str]:
-        return [self.__getitem_internal(i, only_load_metainfo=True)['metainfo']['id'] for i in self.subset_indices]
+        """Get list of resource IDs."""
+        return [
+            self.__getitem_internal(i, only_load_metainfo=True)['metainfo']['id']
+            for i in self.subset_indices
+        ]
 
     def _get_labels_set(self, framed: bool) -> tuple[dict, dict[str, dict[str, int]]]:
-        """
-        Returns the set of labels and a dictionary that maps labels to integers.
+        """Returns the set of labels and mappings to integers.
+
+        Args:
+            framed: If True, get frame-level labels, otherwise image-level labels.
 
         Returns:
-            Tuple[List[str], Dict[str, int]]: The set of labels and the dictionary that maps labels to integers
+            Tuple containing label sets and label-to-code mappings.
         """
-
         scope = 'frame' if framed else 'image'
 
         multilabel_set = set()
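
A notable fix in this hunk: `read_number_of_frames` now releases the OpenCV capture handle in a `finally` block instead of leaking it on every call. The pattern in isolation (requires opencv-python; the path below is a placeholder):

```python
# Minimal sketch of the new try/finally pattern; "some_video.mp4" is
# a placeholder path, not a file from this package.
import cv2

def count_video_frames(filepath: str) -> int:
    cap = cv2.VideoCapture(filepath)
    try:
        # CAP_PROP_FRAME_COUNT may be approximate for some containers.
        return int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
    finally:
        cap.release()  # previously the handle was never released
```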
@@ -354,100 +448,113 @@ class DatamintBaseDataset:
         multiclass_set = set()
 
         for i in range(len(self)):
-            anns = self.get_annotations(i, type='label', scope=scope)
-            multilabel_set.update([ann['name'] for ann in anns])
+            # Collect labels by type
+            label_anns = self.get_annotations(i, type='label', scope=scope)
+            multilabel_set.update(ann.name for ann in label_anns)
 
-            anns = self.get_annotations(i, type='segmentation', scope=scope)
-            segmentation_labels.update([ann['name'] for ann in anns])
+            seg_anns = self.get_annotations(i, type='segmentation', scope=scope)
+            segmentation_labels.update(ann.name for ann in seg_anns)
 
-            anns = self.get_annotations(i, type='category', scope=scope)
-            multiclass_set.update([(ann['name'], ann['value']) for ann in anns])
+            cat_anns = self.get_annotations(i, type='category', scope=scope)
+            multiclass_set.update((ann.name, ann.value) for ann in cat_anns)
 
-        multilabel_set = sorted(list(multilabel_set))
-        multiclass_set = sorted(list(multiclass_set))
-        segmentation_labels = sorted(list(segmentation_labels))
+        # Sort and create mappings
+        multilabel_list = sorted(multilabel_set)
+        multiclass_list = sorted(multiclass_set)
+        segmentation_list = sorted(segmentation_labels)
 
-        multilabel2code = {label: idx for idx, label in enumerate(multilabel_set)}
-        segmentation_label2code = {label: idx+1 for idx, label in enumerate(segmentation_labels)}
-        multiclass2code = {label: idx for idx, label in enumerate(multiclass_set)}
+        sets = {
+            'multilabel': multilabel_list,
+            'segmentation': segmentation_list,
+            'multiclass': multiclass_list
+        }
+
+        codes_map = {
+            'multilabel': {label: idx for idx, label in enumerate(multilabel_list)},
+            'segmentation': {label: idx + 1 for idx, label in enumerate(segmentation_list)},
+            'multiclass': {label: idx for idx, label in enumerate(multiclass_list)}
+        }
 
-        sets = {'multilabel': multilabel_set,
-                'segmentation': segmentation_labels,
-                'multiclass': multiclass_set}
-        codes_map = {'multilabel': multilabel2code,
-                     'segmentation': segmentation_label2code,
-                     'multiclass': multiclass2code}
         return sets, codes_map
 
-    def get_framelabel_distribution(self, normalize=False) -> dict[str, float]:
-        """
-        Returns the distribution of labels in the dataset.
+    def get_framelabel_distribution(self, normalize: bool = False) -> dict[str, float]:
+        """Returns the distribution of frame labels in the dataset."""
+        return self._get_label_distribution('label', 'frame', normalize)
 
-        Returns:
-            Dict[str, int]: The distribution of labels in the dataset.
-        """
-        label_distribution = {label: 0 for label in self.frame_labels_set}
-        for imginfo in self.images_metainfo:
-            for ann in imginfo['annotations']:
-                if ann['type'] == 'label' and ann['index'] is not None:
-                    label_distribution[ann['name']] += 1
+    def get_segmentationlabel_distribution(self, normalize: bool = False) -> dict[str, float]:
+        """Returns the distribution of segmentation labels in the dataset."""
+        return self._get_label_distribution('segmentation', 'all', normalize)
 
-        if normalize:
-            total = sum(label_distribution.values())
-            if total == 0:
-                return label_distribution
-            label_distribution = {k: v/total for k, v in label_distribution.items()}
-        return label_distribution
+    def _get_label_distribution(self, ann_type: str, scope: str, normalize: bool) -> dict[str, float]:
+        """Helper method to calculate label distributions."""
+        if ann_type == 'label' and scope == 'frame':
+            labels = self.frame_labels_set
+        elif ann_type == 'segmentation':
+            labels = self.segmentation_labels_set
+        else:
+            raise ValueError(f"Unsupported combination: type={ann_type}, scope={scope}")
 
-    def get_segmentationlabel_distribution(self, normalize=False) -> dict[str, float]:
-        """
-        Returns the distribution of segmentation labels in the dataset.
+        distribution = {label: 0 for label in labels}
 
-        Returns:
-            Dict[str, int]: The distribution of segmentation labels in the dataset.
-        """
-        label_distribution = {label: 0 for label in self.segmentation_labels_set}
         for imginfo in self.images_metainfo:
-            if 'annotations' in imginfo and imginfo['annotations'] is not None:
-                for ann in imginfo['annotations']:
-                    if ann['type'] == 'segmentation':
-                        label_distribution[ann['name']] += 1
+            for ann in imginfo.get('annotations', []):
+                condition_met = (
+                    ann.type == ann_type and
+                    (scope == 'all' or
+                     (scope == 'frame' and ann.index is not None) or
+                     (scope == 'image' and ann.index is None))
+                )
+                if condition_met and ann.name in distribution:
+                    distribution[ann.name] += 1
 
         if normalize:
-            total = sum(label_distribution.values())
-            if total == 0:
-                return label_distribution
-            label_distribution = {k: v/total for k, v in label_distribution.items()}
-        return label_distribution
+            total = sum(distribution.values())
+            if total > 0:
+                distribution = {k: v / total for k, v in distribution.items()}
 
-    def _check_integrity(self):
+        return distribution
+
+    def _check_integrity(self) -> None:
+        """Check if all image files exist."""
+        missing_files = []
         for imginfo in self.images_metainfo:
-            if not os.path.isfile(os.path.join(self.dataset_dir, imginfo['file'])):
-                raise DatamintDatasetException(f"Image file {imginfo['file']} not found.")
+            filepath = os.path.join(self.dataset_dir, imginfo['file'])
+            if not os.path.isfile(filepath):
+                missing_files.append(imginfo['file'])
+
+        if missing_files:
+            raise DatamintDatasetException(f"Image files not found: {missing_files}")
 
     def _get_datasetinfo(self) -> dict:
+        """Get dataset information from API."""
+        if self._server_dataset_info is not None:
+            return self._server_dataset_info
         all_datasets = self.api_handler.get_datasets()
 
-        value_to_search = self.dataset_id
-        field_to_search = 'id'
-
-        for d in all_datasets:
-            if d[field_to_search] == value_to_search:
-                return d
+        for dataset in all_datasets:
+            if dataset['id'] == self.dataset_id:
+                self._server_dataset_info = dataset
+                return dataset
 
         available_datasets = [(d['name'], d['id']) for d in all_datasets]
         raise DatamintDatasetException(
-            f"Dataset with {field_to_search} '{value_to_search}' not found." +
-            f" Available datasets: {available_datasets}"
+            f"Dataset with id '{self.dataset_id}' not found. "
+            f"Available datasets: {available_datasets}"
         )
 
     def get_info(self) -> dict:
+        """Get project information from API."""
+        if hasattr(self, 'project_info') and self.project_info is not None:
+            return self.project_info
         project = self.api_handler.get_project_by_name(self.project_name)
         if 'error' in project:
             available_projects = project['all_projects']
             raise DatamintDatasetException(
-                f"Project with name '{self.project_name}' not found. Available projects: {available_projects}"
+                f"Project with name '{self.project_name}' not found. "
+                f"Available projects: {available_projects}"
            )
+        self.project_info = project
+        self.dataset_id = project['dataset_id']
         return project
 
     def _run_request(self, session, request_args) -> requests.Response:
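
The label-to-code mappings in `_get_labels_set` are unchanged in substance: multilabel and multiclass codes start at 0, while segmentation codes start at 1, presumably keeping 0 free for the background class. A standalone sketch with invented label names:

```python
# Illustration of the code maps built in _get_labels_set; the label
# names here are made up, not taken from any real project.
multilabel_list = sorted({"fracture", "implant"})
segmentation_list = sorted({"bone", "lesion"})

codes_map = {
    'multilabel': {label: idx for idx, label in enumerate(multilabel_list)},
    # Segmentation codes are shifted by one, leaving 0 unassigned.
    'segmentation': {label: idx + 1 for idx, label in enumerate(segmentation_list)},
}
print(codes_map['multilabel'])    # {'fracture': 0, 'implant': 1}
print(codes_map['segmentation'])  # {'bone': 1, 'lesion': 2}
```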
@@ -457,216 +564,191 @@ class DatamintBaseDataset:
         response.raise_for_status()
         return response
 
-    def _get_jwttoken(self, dataset_id, session) -> str:
-        if dataset_id is None:
-            raise ValueError("Dataset ID is required to download the dataset.")
-        request_params = {
-            'method': 'GET',
-            'url': f'{self.server_url}/datasets/{dataset_id}/download/png',
-            'headers': {'apikey': self.api_key},
-            'stream': True
-        }
-        _LOGGER.debug(f"Getting jwt token for dataset {dataset_id}...")
-        response = self._run_request(session, request_params)
-        progress_bar = None
-        number_processed_images = 0
-
-        # check if the response is a stream of data and everything is ok
-        if response.status_code != 200:
-            msg = f"Getting jwt token failed with status code={response.status_code}: {response.text}"
-            raise DatamintDatasetException(msg)
-
-        try:
-            response_iterator = response.iter_lines(decode_unicode=True)
-            for line in response_iterator:
-                line = line.strip()
-                if 'event: error' in line:
-                    error_msg = line+'\n'
-                    error_msg += '\n'.join(response_iterator)
-                    raise DatamintDatasetException(f"Getting jwt token failed:\n{error_msg}")
-                if not line.startswith('data:'):
-                    continue
-                dataline = yaml.safe_load(line)['data']
-                if 'zip' in dataline:
-                    _LOGGER.debug(f"Got jwt token for dataset {dataset_id}")
-                    return dataline['zip']  # Function normally ends here
-                elif 'processedImages' in dataline:
-                    if progress_bar is None:
-                        total_size = int(dataline['totalImages'])
-                        progress_bar = tqdm(total=total_size, unit='iB', unit_scale=True)
-                    processed_images = int(dataline['processedImages'])
-                    if number_processed_images < processed_images:
-                        progress_bar.update(processed_images - number_processed_images)
-                        number_processed_images = processed_images
-                else:
-                    _LOGGER.warning(f"Unknown data line: {dataline}")
-        except Exception as e:
-            raise e
-        finally:
-            if progress_bar is not None:
-                progress_bar.close()
-
-        raise DatamintDatasetException("Getting jwt token failed! No dataline with 'zip' entry found.")
-
     def __repr__(self) -> str:
-        """
-        Example:
-        .. code-block:: python
-
-            print(dataset)
-
-        Output:
-
-        .. code-block:: text
-
-            Dataset DatamintDataset
-                Number of datapoints: 3
-                Root location: /home/user/.datamint/datasets
-
-        """
+        """String representation of the dataset."""
         head = f"Dataset {self.project_name}"
         body = [f"Number of datapoints: {self.__len__()}"]
+
         if self.root is not None:
             body.append(f"Location: {self.dataset_dir}")
 
-        # Add filter information to representation
-        if self.include_annotators is not None:
-            body += [f"Including only annotators: {self.include_annotators}"]
-        if self.exclude_annotators is not None:
-            body += [f"Excluding annotators: {self.exclude_annotators}"]
-        if self.include_segmentation_names is not None:
-            body += [f"Including only segmentations: {self.include_segmentation_names}"]
-        if self.exclude_segmentation_names is not None:
-            body += [f"Excluding segmentations: {self.exclude_segmentation_names}"]
-        if self.include_image_label_names is not None:
-            body += [f"Including only image labels: {self.include_image_label_names}"]
-        if self.exclude_image_label_names is not None:
-            body += [f"Excluding image labels: {self.exclude_image_label_names}"]
-        if self.include_frame_label_names is not None:
-            body += [f"Including only frame labels: {self.include_frame_label_names}"]
-        if self.exclude_frame_label_names is not None:
-            body += [f"Excluding frame labels: {self.exclude_frame_label_names}"]
+        # Add filter information
+        filter_info = [
+            (self.include_annotators, "Including only annotators"),
+            (self.exclude_annotators, "Excluding annotators"),
+            (self.include_segmentation_names, "Including only segmentations"),
+            (self.exclude_segmentation_names, "Excluding segmentations"),
+            (self.include_image_label_names, "Including only image labels"),
+            (self.exclude_image_label_names, "Excluding image labels"),
+            (self.include_frame_label_names, "Including only frame labels"),
+            (self.exclude_frame_label_names, "Excluding frame labels"),
+        ]
+
+        for filter_value, description in filter_info:
+            if filter_value is not None:
+                body.append(f"{description}: {filter_value}")
 
         lines = [head] + [" " * 4 + line for line in body]
         return "\n".join(lines)
 
-    def download_project(self):
-        from torchvision.datasets.utils import extract_archive
+    def download_project(self) -> None:
+        """Download project data from API."""
 
         dataset_info = self._get_datasetinfo()
         self.dataset_id = dataset_info['id']
         self.last_updaded_at = dataset_info['updated_at']
 
-        self.api_handler.download_project(self.project_info['id'],
-                                          self.dataset_zippath,
-                                          all_annotations=self.all_annotations,
-                                          include_unannotated=self.include_unannotated)
-        _LOGGER.debug(f"Downloaded dataset")
-        downloaded_size = os.path.getsize(self.dataset_zippath)
-        if downloaded_size == 0:
+        self.api_handler.download_project(
+            self.project_info['id'],
+            self.dataset_zippath,
+            all_annotations=self.all_annotations,
+            include_unannotated=self.include_unannotated
+        )
+
+        _LOGGER.debug("Downloaded dataset")
+
+        if os.path.getsize(self.dataset_zippath) == 0:
             raise DatamintDatasetException("Download failed.")
 
+        self._extract_and_update_metadata()
+
+    def _get_dataset_id(self) -> str:
+        if self.dataset_id is None:
+            dataset_info = self._get_datasetinfo()
+            self.dataset_id = dataset_info['id']
+        return self.dataset_id
+
+    def _extract_and_update_metadata(self) -> None:
+        """Extract downloaded archive and update metadata."""
+        from torchvision.datasets.utils import extract_archive
+
         if os.path.exists(self.dataset_dir):
             _LOGGER.info(f"Deleting existing dataset directory: {self.dataset_dir}")
             shutil.rmtree(self.dataset_dir)
-        extract_archive(self.dataset_zippath,
-                        self.dataset_dir,
-                        remove_finished=True
-                        )
-        datasetjson = os.path.join(self.dataset_dir, 'dataset.json')
-        with open(datasetjson, 'r') as file:
+
+        extract_archive(self.dataset_zippath, self.dataset_dir, remove_finished=True)
+
+        # Load and update metadata
+        datasetjson_path = os.path.join(self.dataset_dir, 'dataset.json')
+        with open(datasetjson_path, 'r') as file:
             self.metainfo = json.load(file)
+
+        self._update_metadata_timestamps()
+
+        # Save updated metadata
+        with open(datasetjson_path, 'w') as file:
+            json.dump(self.metainfo, file, default=lambda o: o.to_dict() if hasattr(o, 'to_dict') else o)
+
+        self.images_metainfo = self.metainfo['resources']
+        # self._convert_metainfo_to_clsobj()
+
+    def _update_metadata_timestamps(self) -> None:
+        """Update metadata with correct timestamps."""
         if 'updated_at' not in self.metainfo:
             self.metainfo['updated_at'] = self.last_updaded_at
         else:
-            # if self.last_updated_at is newer than the one in the dataset, update it
             try:
-                if datetime.fromisoformat(self.metainfo['updated_at']) < datetime.fromisoformat(self.last_updaded_at):
-                    _LOGGER.warning(f"Inconsistent updated_at dates detected ({self.metainfo['updated_at']} < {self.last_updaded_at})." +
-                                    f"Fixing it to {self.last_updaded_at}")
+                local_time = datetime.fromisoformat(self.metainfo['updated_at'])
+                server_time = datetime.fromisoformat(self.last_updaded_at)
+
+                if local_time < server_time:
+                    _LOGGER.warning(
+                        f"Inconsistent updated_at dates detected "
+                        f"({self.metainfo['updated_at']} < {self.last_updaded_at}). "
+                        f"Fixing it to {self.last_updaded_at}"
+                    )
                     self.metainfo['updated_at'] = self.last_updaded_at
             except Exception as e:
                 _LOGGER.warning(f"Failed to parse updated_at date: {e}")
 
-        # Add all_annotations to the metadata
         self.metainfo['all_annotations'] = self.all_annotations
 
-        # save the updated_at date
-        with open(datasetjson, 'w') as file:
-            json.dump(self.metainfo, file)
-
-    def _load_image(self, filepath: str,
-                    index: int | None = None) -> tuple[Tensor, FileDataset | None]:
+    def _load_image(self, filepath: str, index: int | None = None) -> tuple[Tensor, FileDataset | None]:
+        """Load image from file with optional frame index."""
         if os.path.isdir(filepath):
-            raise NotImplementedError("Loading a image from a directory is not supported yet.")
+            raise NotImplementedError("Loading an image from a directory is not supported yet.")
 
         if self.return_frame_by_frame:
             img, ds = read_array_normalized(filepath, return_metainfo=True, index=index)
         else:
             img, ds = read_array_normalized(filepath, return_metainfo=True)
 
+        img = self._process_image_array(img)
+        return img, ds
+
+    def _process_image_array(self, img: np.ndarray) -> Tensor:
+        """Process numpy array to tensor with proper normalization."""
         if img.dtype == np.uint16:
             if not self.__logged_uint16_conversion:
                 _LOGGER.info("Original image is uint16, converting to uint8")
                 self.__logged_uint16_conversion = True
 
-            # min-max normalization
+            # Min-max normalization
             img = img.astype(np.float32)
-            mn = img.min()
-            img = (img - mn) / (img.max() - mn) * 255
+            min_val = img.min()
+            img = (img - min_val) / (img.max() - min_val) * 255
             img = img.astype(np.uint8)
 
-        img = torch.from_numpy(img).contiguous()
-        if isinstance(img, torch.ByteTensor):
-            img = img.to(dtype=torch.get_default_dtype()).div(255)
+        img_tensor = torch.from_numpy(img).contiguous()
 
-        return img, ds
+        if isinstance(img_tensor, torch.ByteTensor):
+            img_tensor = img_tensor.to(dtype=torch.get_default_dtype()).div(255)
+
+        return img_tensor
 
-    def _get_image_metainfo(self, index: int, bypass_subset_indices=False) -> dict[str, Any]:
+    def _get_image_metainfo(self, index: int, bypass_subset_indices: bool = False) -> dict[str, Any]:
+        """Get metadata for image at given index."""
         if not bypass_subset_indices:
             index = self.subset_indices[index]
+
         if self.return_frame_by_frame:
-            # Find the correct filepath and index
             resource_id, frame_index = self.__find_index(index)
-
-            img_metainfo = self.images_metainfo[resource_id]
-            img_metainfo = dict(img_metainfo)  # copy
-            # insert frame index
+            img_metainfo = dict(self.images_metainfo[resource_id])  # Copy
             img_metainfo['frame_index'] = frame_index
-            img_metainfo['annotations'] = [ann for ann in img_metainfo['annotations']
-                                           if ann['index'] is None or ann['index'] == frame_index]
+            img_metainfo['annotations'] = [
+                ann for ann in img_metainfo['annotations']
+                if ann.index is None or ann.index == frame_index
+            ]
         else:
             img_metainfo = self.images_metainfo[index]
+
         return img_metainfo
 
     def __find_index(self, index: int) -> tuple[int, int]:
-        """
-        Find the resource index and frame index for a given global frame index.
-
-        """
-        # Use binary search to find the resource containing this frame
+        """Find the resource index and frame index for a given global frame index."""
         resource_index = np.searchsorted(self._cumulative_frames[1:], index, side='right')
         frame_index = index - self._cumulative_frames[resource_index]
-
         return resource_index, frame_index
 
-    def __getitem_internal(self, index: int,
-                           only_load_metainfo=False) -> dict[str, Tensor | FileDataset | dict | list]:
+    def __getitem_internal(
+        self,
+        index: int,
+        only_load_metainfo: bool = False
+    ) -> dict[str, Tensor | FileDataset | dict | list]:
+        """Internal method to get item at index."""
         if self.return_frame_by_frame:
             resource_index, frame_idx = self.__find_index(index)
         else:
             resource_index = index
             frame_idx = None
+
         img_metainfo = self._get_image_metainfo(index, bypass_subset_indices=True)
 
         if only_load_metainfo:
             return {'metainfo': img_metainfo}
 
         filepath = os.path.join(self.dataset_dir, img_metainfo['file'])
-
-        # Can be multi-frame, Gray-scale and/or RGB. So the shape is really variable, but it's always a numpy array.
         img, ds = self._load_image(filepath, frame_idx)
 
+        return self._build_item_dict(img, ds, img_metainfo)
+
+    def _build_item_dict(
+        self,
+        img: Tensor,
+        ds: FileDataset | None,
+        img_metainfo: dict
+    ) -> dict[str, Any]:
+        """Build the return dictionary for __getitem__."""
         ret = {'image': img}
 
         if self.return_dicom:
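
The extracted `_process_image_array` keeps the old uint16 handling: min-max normalize to [0, 255], cast to uint8, then let the ByteTensor branch rescale to [0, 1]. A worked example of the normalization step with invented pixel values:

```python
# Standalone illustration of the uint16 -> uint8 min-max normalization;
# the pixel values are made up for the example.
import numpy as np

img = np.array([[0, 1000], [3000, 4000]], dtype=np.uint16)
img = img.astype(np.float32)
min_val = img.min()
img = (img - min_val) / (img.max() - min_val) * 255
img = img.astype(np.uint8)  # truncates toward zero
print(img)  # [[  0  63]
            #  [191 255]]
```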
@@ -678,52 +760,42 @@ class DatamintBaseDataset:
 
         return ret
 
-    def _filter_annotations(self, annotations: list[dict]) -> list[dict]:
-        """
-        Filter annotations based on the filtering settings.
-
-        Args:
-            annotations: list of annotations
-
-        Returns:
-            list[dict]: filtered list of annotations
-        """
+    def _filter_annotations(self, annotations: list[Annotation]) -> list[Annotation]:
+        """Filter annotations based on the filtering settings."""
         if annotations is None:
             return []
 
         filtered_annotations = []
         for ann in annotations:
-            # Filter by annotator
-            if not self._should_include_annotator(ann['added_by']):
+            if not self._should_include_annotation(ann):
                 continue
-
-            # Filter by annotation type and name
-            if ann['type'] == 'segmentation':
-                if not self._should_include_segmentation(ann['name']):
-                    continue
-            elif ann['type'] == 'label':
-                # Check if it's a frame or image label
-                if ann.get('index', None) is None:
-                    # Image label
-                    if not self._should_include_image_label(ann['name']):
-                        continue
-                else:
-                    # Frame label
-                    if not self._should_include_frame_label(ann['name']):
-                        continue
-
-            # If we reach here, the annotation passed all filters
             filtered_annotations.append(ann)
 
         return filtered_annotations
 
+    def _should_include_annotation(self, ann: Annotation) -> bool:
+        """Check if an annotation should be included based on all filters."""
+        if not self._should_include_annotator(ann.created_by):
+            return False
+
+        if ann.type == 'segmentation':
+            return self._should_include_segmentation(ann.name)
+        elif ann.type == 'label':
+            if ann.index is None:
+                return self._should_include_image_label(ann.name)
+            else:
+                return self._should_include_frame_label(ann.name)
+
+        return True
+
     def __getitem__(self, index: int) -> dict[str, Tensor | FileDataset | dict | list]:
-        """
+        """Get item at index.
+
         Args:
-            index (int): Index
+            index: Index
 
         Returns:
-            dict: A dictionary containing three keys: 'image', 'metainfo' and 'annotations'.
+            A dictionary containing 'image', 'metainfo' and 'annotations' keys.
         """
         if index >= len(self):
             raise IndexError(f"Index {index} out of bounds for dataset of length {len(self)}")
@@ -731,21 +803,28 @@ class DatamintBaseDataset:
         return self.__getitem_internal(self.subset_indices[index])
 
     def __iter__(self):
+        """Iterate over dataset items."""
         for index in self.subset_indices:
-            yield self.__getitem_internal(index)
+            yield self.__getitem__(index)
+            # do not use __getitem_internal__ here, so subclass only need to implement __getitem__
 
     def __len__(self) -> int:
+        """Return dataset length."""
         return len(self.subset_indices)
 
-    def _check_version(self):
-        metainfo_path = os.path.join(self.dataset_dir, 'dataset.json')
-        if not os.path.exists(metainfo_path):
-            self.download_project()
-            return
-        with open(metainfo_path, 'r') as file:
-            local_dataset_info = json.load(file)
-        local_updated_at = local_dataset_info.get('updated_at', None)
-        local_all_annotations = local_dataset_info.get('all_annotations', None)
+    def _check_version(self) -> None:
+        """Check if local dataset version is up to date."""
+        # metainfo_path = os.path.join(self.dataset_dir, 'dataset.json')
+        # if not os.path.exists(metainfo_path):
+        #     self.download_project()
+        #     return
+
+        if not hasattr(self, 'project_info'):
+            self.project_info = self.get_info()
+            self.dataset_id = self.project_info['dataset_id']
+
+        local_updated_at = self.metainfo.get('updated_at', None)
+        local_all_annotations = self.metainfo.get('all_annotations', None)
 
         try:
             external_metadata_info = self._get_datasetinfo()
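
`__iter__` now routes through `__getitem__` so that subclasses only need to override that one method. A hypothetical access sketch, assuming `dataset` is an already-constructed `DatamintBaseDataset` and relying only on the keys documented in `__getitem__`:

```python
# Hypothetical access sketch; `dataset` is assumed to exist and have
# at least one item, with return_metainfo and return_annotations True.
item = dataset[0]
image = item['image']              # torch.Tensor
metainfo = item['metainfo']        # dict of resource metadata
annotations = item['annotations']  # list of Annotation objects
print(tuple(image.shape), len(annotations))
```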
@@ -756,82 +835,279 @@ class DatamintBaseDataset:
756
835
 
757
836
  _LOGGER.debug(f"Local updated at: {local_updated_at}, Server updated at: {server_updated_at}")
758
837
 
759
- # Check if all_annotations changed or doesn't exist
760
838
  annotations_changed = local_all_annotations != self.all_annotations
839
+ version_outdated = local_updated_at is None or local_updated_at < server_updated_at
761
840
 
762
- if local_updated_at is None or local_updated_at < server_updated_at or annotations_changed:
763
- if annotations_changed:
764
- _LOGGER.info(
765
- f"The 'all_annotations' parameter has changed. Previous: {local_all_annotations}, Current: {self.all_annotations}."
766
- )
767
- else:
768
- _LOGGER.info(
769
- f"A newer version of the dataset is available. Your version: {local_updated_at}." +
770
- f" Last version: {server_updated_at}."
771
- )
772
- self.download_project()
841
+ if annotations_changed:
842
+ _LOGGER.info(
843
+ f"The 'all_annotations' parameter has changed. "
844
+ f"Previous: {local_all_annotations}, Current: {self.all_annotations}."
845
+ )
846
+ # self.download_project()
847
+ self._incremental_update()
848
+ elif version_outdated:
849
+ _LOGGER.info(
850
+ f"A newer version of the dataset is available. "
851
+ f"Your version: {local_updated_at}. Last version: {server_updated_at}."
852
+ )
853
+ self._incremental_update()
773
854
  else:
774
855
  _LOGGER.info('Local version is up to date with the latest version.')
775
856
 
857
+ def _fetch_new_resources(self,
858
+ all_uptodate_resources: list[dict]) -> list[dict]:
859
+ local_resources = self.images_metainfo
860
+ local_resources_ids = [res['id'] for res in local_resources]
861
+ new_resources = []
862
+ for resource in all_uptodate_resources:
863
+ if resource['id'] not in local_resources_ids:
864
+ resource['file'] = str(self._get_resource_file_path(resource))
865
+ resource['annotations'] = []
866
+ new_resources.append(resource)
867
+ return new_resources
868
+
869
+ def _fetch_deleted_resources(self, all_uptodate_resources: list[dict]) -> list[dict]:
870
+ local_resources = self.images_metainfo
871
+ all_uptodate_resources_ids = [res['id'] for res in all_uptodate_resources]
872
+ deleted_resources = []
873
+ for resource in local_resources:
874
+ try:
875
+ res_idx = all_uptodate_resources_ids.index(resource['id'])
876
+ if resource.get('deleted_at', None): # was deleted on server
877
+ if local_resources[res_idx].get('deleted_at_local', None) is None:
878
+ deleted_resources.append(resource)
879
+ except ValueError:
880
+ deleted_resources.append(resource)
881
+
882
+ return deleted_resources
883
+
+    def _incremental_update(self) -> None:
+        """Synchronize the local dataset with the server without a full re-download."""
+        ### RESOURCES ###
+        all_uptodate_resources = self.api_handler.get_project_resources(self.get_info()['id'])
+        new_resources = self._fetch_new_resources(all_uptodate_resources)
+        deleted_resources = self._fetch_deleted_resources(all_uptodate_resources)
+
+        if new_resources:
+            for r in new_resources:
+                self._new_resource_created(r)
+            new_resources_path = [Path(self.dataset_dir) / r['file'] for r in new_resources]
+            new_resources_ids = [r['id'] for r in new_resources]
+            _LOGGER.info(f"Downloading {len(new_resources)} new resources...")
+            self.api_handler.download_multiple_resources(new_resources_ids,
+                                                         save_path=new_resources_path)
+            _LOGGER.info(f"Downloaded {len(new_resources)} new resources.")
+
+        for r in deleted_resources:
+            self._resource_deleted(r)
+        ################
+
+        ### ANNOTATIONS ###
+        all_annotations = self.api_handler.get_annotations(worklist_id=self.project_info['worklist_id'],
+                                                           status=None if self.all_annotations else 'published')
+        # group annotations by resource ID, attaching the local filepath
+        annotations_by_resource = {}
+        for ann in all_annotations:
+            filepath = self._get_annotation_file_path(ann)
+            if filepath is not None:
+                ann['file'] = str(filepath)
+            annotations_by_resource.setdefault(ann['resource_id'], []).append(ann)
+
+        # Collect all segmentation annotations that need to be downloaded
+        segmentations_to_download = []
+        segmentation_paths = []
+
+        # update annotations in resources
+        for resource in self.images_metainfo:
+            resource_id = resource['id']
+            new_resource_annotations = annotations_by_resource.get(resource_id, [])
+            old_resource_annotations = resource.get('annotations', [])
+
+            # Determine which annotations were added or removed since the last sync
+            old_ann_ids = {ann.id for ann in old_resource_annotations if hasattr(ann, 'id')}
+            new_ann_ids = {ann['id'] for ann in new_resource_annotations}
+
+            annotations_to_add = [ann for ann in new_resource_annotations
+                                  if ann['id'] not in old_ann_ids]
+            annotations_to_remove = [ann for ann in old_resource_annotations
+                                     if getattr(ann, 'id', 'NA') not in new_ann_ids]
+
+            for ann in annotations_to_add:
+                filepath = self._get_annotation_file_path(ann)
+                if filepath is not None:  # None means it is not a segmentation
+                    # Collect for batch download
+                    filepath = Path(self.dataset_dir) / filepath
+                    filepath.parent.mkdir(parents=True, exist_ok=True)
+                    segmentations_to_download.append(ann)
+                    segmentation_paths.append(filepath)
+
+            # Delete local files of removed segmentation annotations
+            for ann in annotations_to_remove:
+                filepath = ann.file if isinstance(ann, Annotation) else ann.get('file')
+                if filepath is None:
+                    # Not a segmentation annotation
+                    continue
+                try:
+                    filepath = Path(self.dataset_dir) / filepath
+                    # delete the local annotation file if it exists
+                    if filepath.exists():
+                        os.remove(filepath)
+                except OSError as e:
+                    _LOGGER.error(f"Error deleting annotation file {filepath}: {e}")
+
+            # Update resource annotations list - convert to Annotation objects
+            resource['annotations'] = [Annotation.from_dict(ann) for ann in new_resource_annotations]
+
+        # Batch download all segmentation files
+        if segmentations_to_download:
+            _LOGGER.info(f"Downloading {len(segmentations_to_download)} segmentation files...")
+            self.api_handler.download_multiple_segmentations(segmentations_to_download, segmentation_paths)
+            _LOGGER.info(f"Downloaded {len(segmentations_to_download)} segmentation files.")
+        ###################
+
+        # update metadata and persist it
+        self.metainfo['updated_at'] = self._get_datasetinfo()['updated_at']
+        self.metainfo['all_annotations'] = self.all_annotations
+        datasetjson_path = os.path.join(self.dataset_dir, 'dataset.json')
+        with open(datasetjson_path, 'w') as file:
+            json.dump(self.metainfo, file, default=lambda o: o.to_dict() if hasattr(o, 'to_dict') else o)
+
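The `default=` hook in the final `json.dump` call is what lets the mixed metadata (plain dicts alongside `Annotation` objects) serialize in one pass: anything exposing a `to_dict()` method is converted, everything else passes through unchanged. A self-contained illustration with a hypothetical `Box` class:

    import json

    class Box:
        def __init__(self, w, h):
            self.w, self.h = w, h

        def to_dict(self):
            return {'w': self.w, 'h': self.h}

    meta = {'name': 'demo', 'roi': Box(3, 4)}
    print(json.dumps(meta, default=lambda o: o.to_dict() if hasattr(o, 'to_dict') else o))
    # {"name": "demo", "roi": {"w": 3, "h": 4}}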
+    def _get_resource_file_path(self, resource: dict) -> Path:
+        """Get the local file path for a resource."""
+        if 'file' in resource and resource['file'] is not None:
+            return Path(resource['file'])
+        else:
+            ext = guess_extension(resource['mimetype'], strict=False)
+            if ext is None:
+                _LOGGER.warning(f"Could not guess extension for resource {resource['id']}.")
+                ext = ''
+            return Path('images', f"{resource['id']}{ext}")
+
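`guess_extension` maps a MIME type back to a file suffix and can legitimately return None for types missing from the platform's MIME database, which is why the code falls back to an empty extension. For instance:

    from mimetypes import guess_extension

    print(guess_extension('image/png', strict=False))          # '.png'
    print(guess_extension('application/dicom', strict=False))  # may be None, depending on the platform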
+    def _get_annotation_file_path(self, annotation: dict | Annotation) -> Path | None:
+        """Get the local file path for an annotation, or None if it has no file."""
+        if isinstance(annotation, Annotation):
+            if annotation.file:
+                return Path(annotation.file)
+            elif annotation.type == 'segmentation':
+                return Path('masks',
+                            annotation.created_by,
+                            annotation.resource_id,
+                            annotation.id)
+        else:
+            # Handle dict format for backwards compatibility
+            if annotation.get('file'):
+                return Path(annotation['file'])
+            elif annotation.get('annotation_type', annotation.get('type')) == 'segmentation':
+                return Path('masks',
+                            annotation['created_by'],
+                            annotation['resource_id'],
+                            annotation['id'])
+        return None
+
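For segmentations with no recorded file, the path is derived deterministically from the annotation metadata, so a given mask always lands at masks/<created_by>/<resource_id>/<annotation_id>. With made-up values:

    from pathlib import Path

    print(Path('masks', 'annotator@example.com', 'res-123', 'ann-456'))
    # masks/annotator@example.com/res-123/ann-456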
+    def _new_resource_created(self, resource: dict) -> None:
+        """Handle a new resource created in the dataset."""
+        if hasattr(self, 'num_frames_per_resource'):
+            raise NotImplementedError('Cannot handle new resources after dataset initialization')
+
+        if 'annotations' not in resource:
+            resource['annotations'] = []  # Initialize as empty list for Annotation objects
+        self.images_metainfo.append(resource)
+
+    def _resource_deleted(self, resource: dict) -> None:
+        """Handle a resource deleted from the dataset."""
+        # remove from metadata
+        for i, imginfo in enumerate(self.images_metainfo):
+            if imginfo['id'] == resource['id']:
+                deleted_metainfo = self.images_metainfo.pop(i)
+                break
+        else:
+            _LOGGER.warning(f"Resource {resource['id']} not found in dataset metadata.")
+            return
+
+        # delete the resource file from disk
+        resource_path = os.path.join(self.dataset_dir, deleted_metainfo['file'])
+        if os.path.exists(resource_path):
+            os.remove(resource_path)
+
+        # delete associated annotation files
+        for ann in deleted_metainfo.get('annotations', []):
+            ann_file = ann.file if isinstance(ann, Annotation) else ann.get('file')
+            if ann_file is not None:
+                ann_path = os.path.join(self.dataset_dir, ann_file)
+                if os.path.exists(ann_path):
+                    os.remove(ann_path)
+
     def __add__(self, other):
+        """Concatenate datasets."""
         from torch.utils.data import ConcatDataset
         return ConcatDataset([self, other])
 
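Because `__add__` delegates to `torch.utils.data.ConcatDataset`, two datasets can be chained with the `+` operator. A minimal sketch, assuming two projects with these hypothetical names exist on the server:

    ds_a = DatamintBaseDataset(project_name='chest-xrays')
    ds_b = DatamintBaseDataset(project_name='knee-mris')
    combined = ds_a + ds_b  # a torch.utils.data.ConcatDataset
    assert len(combined) == len(ds_a) + len(ds_b)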
     def get_dataloader(self, *args, **kwargs) -> DataLoader:
-        """
-        Returns a DataLoader for the dataset.
-        This is a wrapper around the PyTorch DataLoader, with the convinience of using a nice collate_fn
-        that properly handles the different types of data in this dataset.
+        """Returns a DataLoader for the dataset with proper collate function.
 
         Args:
-            *args: Positional arguments for the DataLoader. See `torch.utils.data.DataLoader <https://pytorch.org/docs/stable/data.html#torch.utils.data.DataLoader>`_ for details.
-            **kwargs: Keyword arguments for the DataLoader. See `torch.utils.data.DataLoader <https://pytorch.org/docs/stable/data.html#torch.utils.data.DataLoader>`_ for details.
-
+            *args: Positional arguments for the DataLoader.
+            **kwargs: Keyword arguments for the DataLoader.
 
+        Returns:
+            DataLoader instance with custom collate function.
         """
-        return DataLoader(self,
-                          *args,
-                          collate_fn=self.get_collate_fn(),
-                          **kwargs)
+        return DataLoader(self, *args, collate_fn=self.get_collate_fn(), **kwargs)
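A minimal usage sketch (the project name is hypothetical; standard DataLoader keywords such as batch_size and shuffle pass straight through):

    dataset = DatamintBaseDataset(project_name='chest-xrays')
    loader = dataset.get_dataloader(batch_size=4, shuffle=True)
    batch = next(iter(loader))  # dict whose contents depend on the return_* flags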
 
     def get_collate_fn(self) -> Callable:
-        def collate_fn(batch: dict) -> dict:
+        """Get collate function for DataLoader."""
+        def collate_fn(batch: list[dict]) -> dict:
+            if not batch:
+                return {}
+
             keys = batch[0].keys()
             collated_batch = {}
+
             for key in keys:
-                collated_batch[key] = [item[key] for item in batch]
-                if isinstance(collated_batch[key][0], torch.Tensor):
-                    # check if every tensor has the same shape
-                    shapes = [tensor.shape for tensor in collated_batch[key]]
+                values = [item[key] for item in batch]
+
+                if isinstance(values[0], torch.Tensor):
+                    shapes = [tensor.shape for tensor in values]
                     if all(shape == shapes[0] for shape in shapes):
-                        collated_batch[key] = torch.stack(collated_batch[key])
+                        collated_batch[key] = torch.stack(values)
                     else:
-                        _LOGGER.warning(f"Collating {key} tensors with different shapes: {shapes}. ")
-                elif isinstance(collated_batch[key][0], np.ndarray):
-                    collated_batch[key] = np.stack(collated_batch[key])
+                        _LOGGER.warning(f"Collating {key} tensors with different shapes: {shapes}")
+                        collated_batch[key] = values
+                elif isinstance(values[0], np.ndarray):
+                    collated_batch[key] = np.stack(values)
+                else:
+                    collated_batch[key] = values
 
             return collated_batch
 
         return collate_fn
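The collate function's shape handling can be checked in isolation: equal-shaped tensors are stacked into one batch tensor, while ragged ones are left as a plain list (after a warning). Continuing with the `dataset` from the sketch above:

    import torch

    collate = dataset.get_collate_fn()
    same = [{'img': torch.zeros(3, 8, 8)}, {'img': torch.zeros(3, 8, 8)}]
    ragged = [{'img': torch.zeros(3, 8, 8)}, {'img': torch.zeros(3, 16, 16)}]
    print(collate(same)['img'].shape)    # torch.Size([2, 3, 8, 8])
    print(type(collate(ragged)['img']))  # <class 'list'>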
 
     def subset(self, indices: list[int]) -> 'DatamintBaseDataset':
-        if len(self.subset_indices) > self.dataset_length:
+        """Create a subset of the dataset.
+
+        Args:
+            indices: List of indices to include in the subset.
+
+        Returns:
+            Self with updated subset indices.
+        """
+        if max(indices, default=-1) >= self.dataset_length:
             raise ValueError(f"Subset indices must be less than the dataset length: {self.dataset_length}")
 
         self.subset_indices = indices
-
         return self
 
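`subset` filters in place and returns self, so calls can be chained; indices must stay below the current dataset length. A brief sketch, assuming `__len__` honors `subset_indices`:

    first_ten = dataset.subset(list(range(10)))
    assert first_ten is dataset  # same object, now restricted to ten items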
     def _should_include_annotator(self, annotator_id: str) -> bool:
-        """
-        Check if an annotator should be included based on the filtering settings.
-
-        Args:
-            annotator_id: The ID of the annotator to check
-
-        Returns:
-            bool: True if the annotator should be included, False otherwise
-        """
+        """Check if an annotator should be included based on filtering settings."""
         if self.include_annotators is not None:
             return annotator_id in self.include_annotators
         if self.exclude_annotators is not None:
@@ -839,15 +1115,7 @@ class DatamintBaseDataset:
         return True
 
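The `_should_include_*` predicates (this one and the three that follow) share one precedence rule: when an include list is set it is authoritative and the exclude list is never consulted; the exclude list applies only when no include list is given. Restated standalone (the exclude branch bodies are folded out of these hunks; the `not in` check is an assumption consistent with the constructor's parameter docs):

    def should_include(name, include=None, exclude=None):
        if include is not None:
            return name in include
        if exclude is not None:
            return name not in exclude
        return True

    print(should_include('a', include=['b']))                 # False
    print(should_include('a', exclude=['b']))                 # True
    print(should_include('a', include=['a'], exclude=['a']))  # True: include wins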
     def _should_include_segmentation(self, segmentation_name: str) -> bool:
-        """
-        Check if a segmentation should be included based on the filtering settings.
-
-        Args:
-            segmentation_name: The name of the segmentation to check
-
-        Returns:
-            bool: True if the segmentation should be included, False otherwise
-        """
+        """Check if a segmentation should be included based on filtering settings."""
         if self.include_segmentation_names is not None:
             return segmentation_name in self.include_segmentation_names
         if self.exclude_segmentation_names is not None:
@@ -855,15 +1123,7 @@ class DatamintBaseDataset:
         return True
 
     def _should_include_image_label(self, label_name: str) -> bool:
-        """
-        Check if an image label should be included based on the filtering settings.
-
-        Args:
-            label_name: The name of the image label to check
-
-        Returns:
-            bool: True if the image label should be included, False otherwise
-        """
+        """Check if an image label should be included based on filtering settings."""
         if self.include_image_label_names is not None:
             return label_name in self.include_image_label_names
         if self.exclude_image_label_names is not None:
@@ -871,15 +1131,7 @@ class DatamintBaseDataset:
         return True
 
     def _should_include_frame_label(self, label_name: str) -> bool:
-        """
-        Check if a frame label should be included based on the filtering settings.
-
-        Args:
-            label_name: The name of the frame label to check
-
-        Returns:
-            bool: True if the frame label should be included, False otherwise
-        """
+        """Check if a frame label should be included based on filtering settings."""
         if self.include_frame_label_names is not None:
             return label_name in self.include_frame_label_names
         if self.exclude_frame_label_names is not None: