PyPI - sleap-nn - Versions diffs - 0.0.5__py3-none-any.whl → 0.1.0__py3-none-any.whl - Mend

sleap-nn 0.0.5__py3-none-any.whl → 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (61)

sleap_nn/__init__.py +9 -2
sleap_nn/architectures/convnext.py +5 -0
sleap_nn/architectures/encoder_decoder.py +25 -6
sleap_nn/architectures/swint.py +8 -0
sleap_nn/cli.py +489 -46
sleap_nn/config/data_config.py +51 -8
sleap_nn/config/get_config.py +32 -24
sleap_nn/config/trainer_config.py +88 -0
sleap_nn/data/augmentation.py +61 -200
sleap_nn/data/custom_datasets.py +433 -61
sleap_nn/data/instance_cropping.py +71 -6
sleap_nn/data/normalization.py +45 -2
sleap_nn/data/providers.py +26 -0
sleap_nn/data/resizing.py +2 -2
sleap_nn/data/skia_augmentation.py +414 -0
sleap_nn/data/utils.py +135 -17
sleap_nn/evaluation.py +177 -42
sleap_nn/export/__init__.py +21 -0
sleap_nn/export/cli.py +1778 -0
sleap_nn/export/exporters/__init__.py +51 -0
sleap_nn/export/exporters/onnx_exporter.py +80 -0
sleap_nn/export/exporters/tensorrt_exporter.py +291 -0
sleap_nn/export/metadata.py +225 -0
sleap_nn/export/predictors/__init__.py +63 -0
sleap_nn/export/predictors/base.py +22 -0
sleap_nn/export/predictors/onnx.py +154 -0
sleap_nn/export/predictors/tensorrt.py +312 -0
sleap_nn/export/utils.py +307 -0
sleap_nn/export/wrappers/__init__.py +25 -0
sleap_nn/export/wrappers/base.py +96 -0
sleap_nn/export/wrappers/bottomup.py +243 -0
sleap_nn/export/wrappers/bottomup_multiclass.py +195 -0
sleap_nn/export/wrappers/centered_instance.py +56 -0
sleap_nn/export/wrappers/centroid.py +58 -0
sleap_nn/export/wrappers/single_instance.py +83 -0
sleap_nn/export/wrappers/topdown.py +180 -0
sleap_nn/export/wrappers/topdown_multiclass.py +304 -0
sleap_nn/inference/__init__.py +6 -0
sleap_nn/inference/bottomup.py +86 -20
sleap_nn/inference/peak_finding.py +93 -16
sleap_nn/inference/postprocessing.py +284 -0
sleap_nn/inference/predictors.py +339 -137
sleap_nn/inference/provenance.py +292 -0
sleap_nn/inference/topdown.py +55 -47
sleap_nn/legacy_models.py +65 -11
sleap_nn/predict.py +224 -19
sleap_nn/system_info.py +443 -0
sleap_nn/tracking/tracker.py +8 -1
sleap_nn/train.py +138 -44
sleap_nn/training/callbacks.py +1258 -5
sleap_nn/training/lightning_modules.py +902 -220
sleap_nn/training/model_trainer.py +424 -111
sleap_nn/training/schedulers.py +191 -0
sleap_nn/training/utils.py +367 -2
{sleap_nn-0.0.5.dist-info → sleap_nn-0.1.0.dist-info}/METADATA +35 -33
sleap_nn-0.1.0.dist-info/RECORD +88 -0
{sleap_nn-0.0.5.dist-info → sleap_nn-0.1.0.dist-info}/WHEEL +1 -1
sleap_nn-0.0.5.dist-info/RECORD +0 -63
{sleap_nn-0.0.5.dist-info → sleap_nn-0.1.0.dist-info}/entry_points.txt +0 -0
{sleap_nn-0.0.5.dist-info → sleap_nn-0.1.0.dist-info}/licenses/LICENSE +0 -0
{sleap_nn-0.0.5.dist-info → sleap_nn-0.1.0.dist-info}/top_level.txt +0 -0

sleap_nn/data/custom_datasets.py CHANGED

@@ -1,10 +1,11 @@
 """Custom `torch.utils.data.Dataset`s for different model types."""
-from kornia.geometry.transform import crop_and_resize
+from sleap_nn.data.skia_augmentation import crop_and_resize_skia as crop_and_resize
-# from concurrent.futures import ThreadPoolExecutor # TODO: implement parallel processing
-# import concurrent.futures
-# import os
+import os
+import threading
+from concurrent.futures import ThreadPoolExecutor, as_completed
+from copy import deepcopy
 from itertools import cycle
 from pathlib import Path
 import torch.distributed as dist
@@ -13,6 +14,14 @@ from omegaconf import DictConfig, OmegaConf
 import numpy as np
 from PIL import Image
 from loguru import logger
+from rich.progress import (
+    Progress,
+    SpinnerColumn,
+    TextColumn,
+    BarColumn,
+    TimeElapsedColumn,
+)
+from rich.console import Console
 import torch
 import torchvision.transforms as T
 from torch.utils.data import Dataset, DataLoader, DistributedSampler
@@ -22,7 +31,6 @@ from sleap_nn.data.identity import generate_class_maps, make_class_vectors
 from sleap_nn.data.instance_centroids import generate_centroids
 from sleap_nn.data.instance_cropping import generate_crops
 from sleap_nn.data.normalization import (
-    apply_normalization,
     convert_to_grayscale,
     convert_to_rgb,
 )
@@ -38,6 +46,182 @@ from sleap_nn.data.instance_cropping import make_centered_bboxes
 from sleap_nn.training.utils import is_distributed_initialized
 from sleap_nn.config.get_config import get_aug_config
+# Minimum number of samples to use parallel caching (overhead not worth it for smaller)
+MIN_SAMPLES_FOR_PARALLEL_CACHING = 20
+class ParallelCacheFiller:
+    """Parallel implementation of image caching using thread-local video copies.
+    This class uses ThreadPoolExecutor to parallelize I/O-bound operations when
+    caching images to disk or memory. Each worker thread gets its own copy of
+    video objects to ensure thread safety.
+    Attributes:
+        labels: List of sio.Labels objects containing the data.
+        lf_idx_list: List of dictionaries with labeled frame indices.
+        cache_type: Either "disk" or "memory".
+        cache_path: Path to save cached images (for disk caching).
+        num_workers: Number of worker threads.
+    """
+    def __init__(
+        self,
+        labels: List[sio.Labels],
+        lf_idx_list: List[Dict],
+        cache_type: str,
+        cache_path: Optional[Path] = None,
+        num_workers: int = 4,
+    ):
+        """Initialize the parallel cache filler.
+        Args:
+            labels: List of sio.Labels objects.
+            lf_idx_list: List of sample dictionaries with frame indices.
+            cache_type: Either "disk" or "memory".
+            cache_path: Path for disk caching.
+            num_workers: Number of worker threads.
+        """
+        self.labels = labels
+        self.lf_idx_list = lf_idx_list
+        self.cache_type = cache_type
+        self.cache_path = cache_path
+        self.num_workers = num_workers
+        self.cache: Dict = {}
+        self._cache_lock = threading.Lock()
+        self._local = threading.local()
+        self._video_info: Dict = {}
+        # Prepare video copies for thread-local access
+        self._prepare_video_copies()
+    def _prepare_video_copies(self):
+        """Close original videos and prepare for thread-local copies."""
+        for label in self.labels:
+            for video in label.videos:
+                vid_id = id(video)
+                if vid_id not in self._video_info:
+                    # Store original state
+                    original_open_backend = video.open_backend
+                    # Close the video backend
+                    video.close()
+                    video.open_backend = False
+                    self._video_info[vid_id] = {
+                        "video": video,
+                        "original_open_backend": original_open_backend,
+                    }
+    def _get_thread_local_video(self, video: sio.Video) -> sio.Video:
+        """Get or create a thread-local video copy.
+        Args:
+            video: The original video object.
+        Returns:
+            A thread-local copy of the video that is safe to use.
+        """
+        vid_id = id(video)
+        if not hasattr(self._local, "videos"):
+            self._local.videos = {}
+        if vid_id not in self._local.videos:
+            # Create a thread-local copy
+            video_copy = deepcopy(video)
+            video_copy.open_backend = True
+            self._local.videos[vid_id] = video_copy
+        return self._local.videos[vid_id]
+    def _process_sample(
+        self, sample: Dict
+    ) -> Tuple[int, int, Optional[np.ndarray], Optional[str]]:
+        """Process a single sample (read image, optionally save/cache).
+        Args:
+            sample: Dictionary with labels_idx, lf_idx, etc.
+        Returns:
+            Tuple of (labels_idx, lf_idx, image_or_none, error_or_none).
+        """
+        labels_idx = sample["labels_idx"]
+        lf_idx = sample["lf_idx"]
+        try:
+            # Get the labeled frame
+            lf = self.labels[labels_idx][lf_idx]
+            # Get thread-local video
+            video = self._get_thread_local_video(lf.video)
+            # Read the image
+            img = video[lf.frame_idx]
+            if img.shape[-1] == 1:
+                img = np.squeeze(img)
+            if self.cache_type == "disk":
+                f_name = self.cache_path / f"sample_{labels_idx}_{lf_idx}.jpg"
+                Image.fromarray(img).save(str(f_name), format="JPEG")
+                return labels_idx, lf_idx, None, None
+            elif self.cache_type == "memory":
+                return labels_idx, lf_idx, img, None
+        except Exception as e:
+            return labels_idx, lf_idx, None, f"{type(e).__name__}: {str(e)}"
+    def fill_cache(
+        self, progress_callback=None
+    ) -> Tuple[Dict, List[Tuple[int, int, str]]]:
+        """Fill the cache in parallel.
+        Args:
+            progress_callback: Optional callback(completed_count) for progress updates.
+        Returns:
+            Tuple of (cache_dict, list_of_errors).
+        """
+        errors = []
+        completed = 0
+        with ThreadPoolExecutor(max_workers=self.num_workers) as executor:
+            futures = {
+                executor.submit(self._process_sample, sample): sample
+                for sample in self.lf_idx_list
+            }
+            for future in as_completed(futures):
+                labels_idx, lf_idx, img, error = future.result()
+                if error:
+                    errors.append((labels_idx, lf_idx, error))
+                elif self.cache_type == "memory" and img is not None:
+                    with self._cache_lock:
+                        self.cache[(labels_idx, lf_idx)] = img
+                completed += 1
+                if progress_callback:
+                    progress_callback(completed)
+        # Restore original video states
+        self._restore_videos()
+        return self.cache, errors
+    def _restore_videos(self):
+        """Restore original video states after caching is complete."""
+        for vid_info in self._video_info.values():
+            video = vid_info["video"]
+            video.open_backend = vid_info["original_open_backend"]
+            if video.open_backend:
+                try:
+                    video.open()
+                except Exception:
+                    pass
 class BaseDataset(Dataset):
     """Base class for custom torch Datasets.
@@ -76,6 +260,8 @@ class BaseDataset(Dataset):
         use_existing_imgs: Use existing imgs/ chunks in the `cache_img_path`.
         rank: Indicates the rank of the process. Used during distributed training to ensure that image storage to
             disk occurs only once across all workers.
+        parallel_caching: If True, use parallel processing for caching (faster for large datasets). Default: True.
+        cache_workers: Number of worker threads for parallel caching. If 0, uses min(4, cpu_count). Default: 0.
         labels_list: List of `sio.Labels` objects. Used to store the labels in the cache. (only used if `cache_img` is `None`)
     """
@@ -95,6 +281,8 @@ class BaseDataset(Dataset):
         cache_img_path: Optional[str] = None,
         use_existing_imgs: bool = False,
         rank: Optional[int] = None,
+        parallel_caching: bool = True,
+        cache_workers: int = 0,
     ) -> None:
         """Initialize class attributes."""
         super().__init__()
@@ -135,6 +323,8 @@ class BaseDataset(Dataset):
         self.cache_img = cache_img
         self.cache_img_path = cache_img_path
         self.use_existing_imgs = use_existing_imgs
+        self.parallel_caching = parallel_caching
+        self.cache_workers = cache_workers
         if self.cache_img is not None and "disk" in self.cache_img:
             if self.cache_img_path is None:
                 self.cache_img_path = "."
@@ -160,10 +350,18 @@ class BaseDataset(Dataset):
         if self.cache_img is not None:
             if self.cache_img == "memory":
-                self._fill_cache(labels)
+                self._fill_cache(
+                    labels,
+                    parallel=self.parallel_caching,
+                    num_workers=self.cache_workers,
+                )
             elif self.cache_img == "disk" and not self.use_existing_imgs:
                 if self.rank is None or self.rank == -1 or self.rank == 0:
-                    self._fill_cache(labels)
+                    self._fill_cache(
+                        labels,
+                        parallel=self.parallel_caching,
+                        num_workers=self.cache_workers,
+                    )
                 # Synchronize all ranks after cache creation
                 if is_distributed_initialized():
                     dist.barrier()
@@ -177,6 +375,9 @@ class BaseDataset(Dataset):
                 if self.user_instances_only:
                     if lf.user_instances is not None and len(lf.user_instances) > 0:
                         lf.instances = lf.user_instances
+                    else:
+                        # Skip frames without user instances
+                        continue
                 is_empty = True
                 for _, inst in enumerate(lf.instances):
                     if not inst.is_empty:  # filter all NaN instances.
@@ -209,20 +410,160 @@ class BaseDataset(Dataset):
         """Returns an iterator."""
         return self
-    def _fill_cache(self, labels: List[sio.Labels]):
-        """Load all samples to cache."""
-        # TODO: Implement parallel processing (using threads might cause error with MediaVideo backend)
-        for sample in self.lf_idx_list:
-            labels_idx = sample["labels_idx"]
-            lf_idx = sample["lf_idx"]
-            img = labels[labels_idx][lf_idx].image
-            if img.shape[-1] == 1:
-                img = np.squeeze(img)
-            if self.cache_img == "disk":
-                f_name = f"{self.cache_img_path}/sample_{labels_idx}_{lf_idx}.jpg"
-                Image.fromarray(img).save(f_name, format="JPEG")
-            if self.cache_img == "memory":
-                self.cache[(labels_idx, lf_idx)] = img
+    def _fill_cache(
+        self,
+        labels: List[sio.Labels],
+        parallel: bool = True,
+        num_workers: int = 0,
+    ):
+        """Load all samples to cache.
+        Args:
+            labels: List of sio.Labels objects containing the data.
+            parallel: If True, use parallel processing for caching (faster for large
+                datasets). Default: True.
+            num_workers: Number of worker threads for parallel caching. If 0, uses
+                min(4, cpu_count). Default: 0.
+        """
+        total_samples = len(self.lf_idx_list)
+        cache_type = "disk" if self.cache_img == "disk" else "memory"
+        # Check for NO_COLOR env var to disable progress bar
+        no_color = (
+            os.environ.get("NO_COLOR") is not None
+            or os.environ.get("FORCE_COLOR") == "0"
+        )
+        use_progress = not no_color
+        # Use parallel caching for larger datasets
+        use_parallel = parallel and total_samples >= MIN_SAMPLES_FOR_PARALLEL_CACHING
+        logger.info(f"Caching {total_samples} images to {cache_type}...")
+        if use_parallel:
+            self._fill_cache_parallel(
+                labels, total_samples, cache_type, use_progress, num_workers
+            )
+        else:
+            self._fill_cache_sequential(labels, total_samples, cache_type, use_progress)
+        logger.info(f"Caching complete.")
+    def _fill_cache_sequential(
+        self,
+        labels: List[sio.Labels],
+        total_samples: int,
+        cache_type: str,
+        use_progress: bool,
+    ):
+        """Sequential implementation of cache filling.
+        Args:
+            labels: List of sio.Labels objects.
+            total_samples: Total number of samples to cache.
+            cache_type: Either "disk" or "memory".
+            use_progress: Whether to show a progress bar.
+        """
+        def process_samples(progress=None, task=None):
+            for sample in self.lf_idx_list:
+                labels_idx = sample["labels_idx"]
+                lf_idx = sample["lf_idx"]
+                img = labels[labels_idx][lf_idx].image
+                if img.shape[-1] == 1:
+                    img = np.squeeze(img)
+                if self.cache_img == "disk":
+                    f_name = f"{self.cache_img_path}/sample_{labels_idx}_{lf_idx}.jpg"
+                    Image.fromarray(img).save(f_name, format="JPEG")
+                if self.cache_img == "memory":
+                    self.cache[(labels_idx, lf_idx)] = img
+                if progress is not None:
+                    progress.update(task, advance=1)
+        if use_progress:
+            with Progress(
+                SpinnerColumn(),
+                TextColumn("[progress.description]{task.description}"),
+                BarColumn(),
+                TextColumn("{task.completed}/{task.total}"),
+                TimeElapsedColumn(),
+                console=Console(force_terminal=True),
+                transient=True,
+            ) as progress:
+                task = progress.add_task(
+                    f"Caching images to {cache_type}", total=total_samples
+                )
+                process_samples(progress, task)
+        else:
+            process_samples()
+    def _fill_cache_parallel(
+        self,
+        labels: List[sio.Labels],
+        total_samples: int,
+        cache_type: str,
+        use_progress: bool,
+        num_workers: int = 0,
+    ):
+        """Parallel implementation of cache filling using thread-local video copies.
+        Args:
+            labels: List of sio.Labels objects.
+            total_samples: Total number of samples to cache.
+            cache_type: Either "disk" or "memory".
+            use_progress: Whether to show a progress bar.
+            num_workers: Number of worker threads. If 0, uses min(4, cpu_count).
+        """
+        # Determine number of workers
+        if num_workers <= 0:
+            num_workers = min(4, os.cpu_count() or 1)
+        cache_path = Path(self.cache_img_path) if self.cache_img_path else None
+        filler = ParallelCacheFiller(
+            labels=labels,
+            lf_idx_list=self.lf_idx_list,
+            cache_type=cache_type,
+            cache_path=cache_path,
+            num_workers=num_workers,
+        )
+        if use_progress:
+            with Progress(
+                SpinnerColumn(),
+                TextColumn("[progress.description]{task.description}"),
+                BarColumn(),
+                TextColumn("{task.completed}/{task.total}"),
+                TimeElapsedColumn(),
+                console=Console(force_terminal=True),
+                transient=True,
+            ) as progress:
+                task = progress.add_task(
+                    f"Caching images to {cache_type} (parallel, {num_workers} workers)",
+                    total=total_samples,
+                )
+                def progress_callback(completed):
+                    progress.update(task, completed=completed)
+                cache, errors = filler.fill_cache(progress_callback)
+        else:
+            logger.info(
+                f"Caching {total_samples} images to {cache_type} "
+                f"(parallel, {num_workers} workers)..."
+            )
+            cache, errors = filler.fill_cache()
+        # Update instance cache
+        if cache_type == "memory":
+            self.cache.update(cache)
+        # Log any errors
+        if errors:
+            logger.warning(
+                f"Parallel caching completed with {len(errors)} errors. "
+                f"First error: {errors[0]}"
+            )
     def __len__(self) -> int:
         """Return the number of samples in the dataset."""
@@ -298,6 +639,8 @@ class BottomUpDataset(BaseDataset):
         cache_img_path: Optional[str] = None,
         use_existing_imgs: bool = False,
         rank: Optional[int] = None,
+        parallel_caching: bool = True,
+        cache_workers: int = 0,
     ) -> None:
         """Initialize class attributes."""
         super().__init__(
@@ -315,6 +658,8 @@ class BottomUpDataset(BaseDataset):
             cache_img_path=cache_img_path,
             use_existing_imgs=use_existing_imgs,
             rank=rank,
+            parallel_caching=parallel_caching,
+            cache_workers=cache_workers,
         )
         self.confmap_head_config = confmap_head_config
         self.pafs_head_config = pafs_head_config
@@ -357,9 +702,6 @@ class BottomUpDataset(BaseDataset):
             user_instances_only=self.user_instances_only,
         )
-        # apply normalization
-        sample["image"] = apply_normalization(sample["image"])
         if self.ensure_rgb:
             sample["image"] = convert_to_rgb(sample["image"])
         elif self.ensure_grayscale:
@@ -497,6 +839,8 @@ class BottomUpMultiClassDataset(BaseDataset):
         cache_img_path: Optional[str] = None,
         use_existing_imgs: bool = False,
         rank: Optional[int] = None,
+        parallel_caching: bool = True,
+        cache_workers: int = 0,
     ) -> None:
         """Initialize class attributes."""
         super().__init__(
@@ -514,6 +858,8 @@ class BottomUpMultiClassDataset(BaseDataset):
             cache_img_path=cache_img_path,
             use_existing_imgs=use_existing_imgs,
             rank=rank,
+            parallel_caching=parallel_caching,
+            cache_workers=cache_workers,
         )
         self.confmap_head_config = confmap_head_config
         self.class_maps_head_config = class_maps_head_config
@@ -570,9 +916,6 @@ class BottomUpMultiClassDataset(BaseDataset):
         sample["num_tracks"] = torch.tensor(len(self.class_names), dtype=torch.int32)
-        # apply normalization
-        sample["image"] = apply_normalization(sample["image"])
         if self.ensure_rgb:
             sample["image"] = convert_to_rgb(sample["image"])
         elif self.ensure_grayscale:
@@ -684,15 +1027,12 @@ class CenteredInstanceDataset(BaseDataset):
             the images aren't cached and loaded from the `.slp` file on each access.
         cache_img_path: Path to save the `.jpg` files. If `None`, current working dir is used.
         use_existing_imgs: Use existing imgs/ chunks in the `cache_img_path`.
-        crop_size: Crop size of each instance for centered-instance model.
+        crop_size: Crop size of each instance for centered-instance model. If `scale` is provided, then the cropped image will be resized according to `scale`.
         rank: Indicates the rank of the process. Used during distributed training to ensure that image storage to
             disk occurs only once across all workers.
         confmap_head_config: DictConfig object with all the keys in the `head_config` section.
             (required keys: `sigma`, `output_stride`, `part_names` and `anchor_part` depending on the model type ).
         labels_list: List of `sio.Labels` objects. Used to store the labels in the cache. (only used if `cache_img` is `None`)
-    Note: If scale is provided for centered-instance model, the images are cropped out
-    from the scaled image with the given crop size.
     """
     def __init__(
@@ -714,6 +1054,8 @@ class CenteredInstanceDataset(BaseDataset):
         cache_img_path: Optional[str] = None,
         use_existing_imgs: bool = False,
         rank: Optional[int] = None,
+        parallel_caching: bool = True,
+        cache_workers: int = 0,
     ) -> None:
         """Initialize class attributes."""
         super().__init__(
@@ -731,6 +1073,8 @@ class CenteredInstanceDataset(BaseDataset):
             cache_img_path=cache_img_path,
             use_existing_imgs=use_existing_imgs,
             rank=rank,
+            parallel_caching=parallel_caching,
+            cache_workers=cache_workers,
         )
         self.labels = None
         self.crop_size = crop_size
@@ -748,6 +1092,9 @@ class CenteredInstanceDataset(BaseDataset):
                 if self.user_instances_only:
                     if lf.user_instances is not None and len(lf.user_instances) > 0:
                         lf.instances = lf.user_instances
+                    else:
+                        # Skip frames without user instances
+                        continue
                 for inst_idx, inst in enumerate(lf.instances):
                     if not inst.is_empty:  # filter all NaN instances.
                         video_idx = labels[labels_idx].videos.index(lf.video)
@@ -818,9 +1165,6 @@ class CenteredInstanceDataset(BaseDataset):
         instances = instances[:, inst_idx]
-        # apply normalization
-        image = apply_normalization(image)
         if self.ensure_rgb:
             image = convert_to_rgb(image)
         elif self.ensure_grayscale:
@@ -834,13 +1178,6 @@ class CenteredInstanceDataset(BaseDataset):
         )
         instances = instances * eff_scale
-        # resize image
-        image, instances = apply_resizer(
-            image,
-            instances,
-            scale=self.scale,
-        )
         # get the centroids based on the anchor idx
         centroids = generate_centroids(instances, anchor_ind=self.anchor_ind)
@@ -901,6 +1238,13 @@ class CenteredInstanceDataset(BaseDataset):
         sample["instance"] = center_instance  # (n_samples=1, n_nodes, 2)
         sample["centroid"] = centered_centroid  # (n_samples=1, 2)
+        # resize the cropped image
+        sample["instance_image"], sample["instance"] = apply_resizer(
+            sample["instance_image"],
+            sample["instance"],
+            scale=self.scale,
+        )
         # Pad the image (if needed) according max stride
         sample["instance_image"] = apply_pad_to_stride(
             sample["instance_image"], max_stride=self.max_stride
@@ -959,7 +1303,7 @@ class TopDownCenteredInstanceMultiClassDataset(CenteredInstanceDataset):
             the images aren't cached and loaded from the `.slp` file on each access.
         cache_img_path: Path to save the `.jpg` files. If `None`, current working dir is used.
         use_existing_imgs: Use existing imgs/ chunks in the `cache_img_path`.
-        crop_size: Crop size of each instance for centered-instance model.
+        crop_size: Crop size of each instance for centered-instance model. If `scale` is provided, then the cropped image will be resized according to `scale`.
         rank: Indicates the rank of the process. Used during distributed training to ensure that image storage to
             disk occurs only once across all workers.
         confmap_head_config: DictConfig object with all the keys in the `head_config` section.
@@ -967,9 +1311,6 @@ class TopDownCenteredInstanceMultiClassDataset(CenteredInstanceDataset):
         class_vectors_head_config: DictConfig object with all the keys in the `head_config` section.
             (required keys: `classes`, `num_fc_layers`, `num_fc_units`, `output_stride`, `loss_weight`).
         labels_list: List of `sio.Labels` objects. Used to store the labels in the cache. (only used if `cache_img` is `None`)
-    Note: If scale is provided for centered-instance model, the images are cropped out
-    from the scaled image with the given crop size.
     """
     def __init__(
@@ -992,6 +1333,8 @@ class TopDownCenteredInstanceMultiClassDataset(CenteredInstanceDataset):
         cache_img_path: Optional[str] = None,
         use_existing_imgs: bool = False,
         rank: Optional[int] = None,
+        parallel_caching: bool = True,
+        cache_workers: int = 0,
     ) -> None:
         """Initialize class attributes."""
         super().__init__(
@@ -1012,6 +1355,8 @@ class TopDownCenteredInstanceMultiClassDataset(CenteredInstanceDataset):
             cache_img_path=cache_img_path,
             use_existing_imgs=use_existing_imgs,
             rank=rank,
+            parallel_caching=parallel_caching,
+            cache_workers=cache_workers,
         )
         self.class_vectors_head_config = class_vectors_head_config
         self.class_names = self.class_vectors_head_config.classes
@@ -1066,9 +1411,6 @@ class TopDownCenteredInstanceMultiClassDataset(CenteredInstanceDataset):
         instances = instances[:, inst_idx]
-        # apply normalization
-        image = apply_normalization(image)
         if self.ensure_rgb:
             image = convert_to_rgb(image)
         elif self.ensure_grayscale:
@@ -1082,13 +1424,6 @@ class TopDownCenteredInstanceMultiClassDataset(CenteredInstanceDataset):
         )
         instances = instances * eff_scale
-        # resize image
-        image, instances = apply_resizer(
-            image,
-            instances,
-            scale=self.scale,
-        )
         # get class vectors
         track_ids = torch.Tensor(
             [
@@ -1165,6 +1500,13 @@ class TopDownCenteredInstanceMultiClassDataset(CenteredInstanceDataset):
         sample["instance"] = center_instance  # (n_samples=1, n_nodes, 2)
         sample["centroid"] = centered_centroid  # (n_samples=1, 2)
+        # resize image
+        sample["instance_image"], sample["instance"] = apply_resizer(
+            sample["instance_image"],
+            sample["instance"],
+            scale=self.scale,
+        )
         # Pad the image (if needed) according max stride
         sample["instance_image"] = apply_pad_to_stride(
             sample["instance_image"], max_stride=self.max_stride
@@ -1250,6 +1592,8 @@ class CentroidDataset(BaseDataset):
         cache_img_path: Optional[str] = None,
         use_existing_imgs: bool = False,
         rank: Optional[int] = None,
+        parallel_caching: bool = True,
+        cache_workers: int = 0,
     ) -> None:
         """Initialize class attributes."""
         super().__init__(
@@ -1267,6 +1611,8 @@ class CentroidDataset(BaseDataset):
             cache_img_path=cache_img_path,
             use_existing_imgs=use_existing_imgs,
             rank=rank,
+            parallel_caching=parallel_caching,
+            cache_workers=cache_workers,
         )
         self.anchor_ind = anchor_ind
         self.confmap_head_config = confmap_head_config
@@ -1306,9 +1652,6 @@ class CentroidDataset(BaseDataset):
             user_instances_only=self.user_instances_only,
         )
-        # apply normalization
-        sample["image"] = apply_normalization(sample["image"])
         if self.ensure_rgb:
             sample["image"] = convert_to_rgb(sample["image"])
         elif self.ensure_grayscale:
@@ -1433,6 +1776,8 @@ class SingleInstanceDataset(BaseDataset):
         cache_img_path: Optional[str] = None,
         use_existing_imgs: bool = False,
         rank: Optional[int] = None,
+        parallel_caching: bool = True,
+        cache_workers: int = 0,
     ) -> None:
         """Initialize class attributes."""
         super().__init__(
@@ -1450,6 +1795,8 @@ class SingleInstanceDataset(BaseDataset):
             cache_img_path=cache_img_path,
             use_existing_imgs=use_existing_imgs,
             rank=rank,
+            parallel_caching=parallel_caching,
+            cache_workers=cache_workers,
         )
         self.confmap_head_config = confmap_head_config
@@ -1488,9 +1835,6 @@ class SingleInstanceDataset(BaseDataset):
             user_instances_only=self.user_instances_only,
         )
-        # apply normalization
-        sample["image"] = apply_normalization(sample["image"])
         if self.ensure_rgb:
             sample["image"] = convert_to_rgb(sample["image"])
         elif self.ensure_grayscale:
@@ -1671,6 +2015,10 @@ def get_train_val_datasets(
         val_cache_img_path = Path(base_cache_img_path) / "val_imgs"
     use_existing_imgs = config.data_config.use_existing_imgs
+    # Parallel caching configuration
+    parallel_caching = getattr(config.data_config, "parallel_caching", True)
+    cache_workers = getattr(config.data_config, "cache_workers", 0)
     model_type = get_model_type_from_cfg(config=config)
     backbone_type = get_backbone_type_from_cfg(config=config)
@@ -1724,6 +2072,8 @@ def get_train_val_datasets(
             cache_img_path=train_cache_img_path,
             use_existing_imgs=use_existing_imgs,
             rank=rank,
+            parallel_caching=parallel_caching,
+            cache_workers=cache_workers,
         )
         val_dataset = BottomUpDataset(
             labels=val_labels,
@@ -1747,6 +2097,8 @@ def get_train_val_datasets(
             cache_img_path=val_cache_img_path,
             use_existing_imgs=use_existing_imgs,
             rank=rank,
+            parallel_caching=parallel_caching,
+            cache_workers=cache_workers,
         )
     elif model_type == "multi_class_bottomup":
@@ -1780,6 +2132,8 @@ def get_train_val_datasets(
             cache_img_path=train_cache_img_path,
             use_existing_imgs=use_existing_imgs,
             rank=rank,
+            parallel_caching=parallel_caching,
+            cache_workers=cache_workers,
         )
         val_dataset = BottomUpMultiClassDataset(
             labels=val_labels,
@@ -1803,6 +2157,8 @@ def get_train_val_datasets(
             cache_img_path=val_cache_img_path,
             use_existing_imgs=use_existing_imgs,
             rank=rank,
+            parallel_caching=parallel_caching,
+            cache_workers=cache_workers,
         )
     elif model_type == "centered_instance":
@@ -1842,6 +2198,8 @@ def get_train_val_datasets(
             cache_img_path=train_cache_img_path,
             use_existing_imgs=use_existing_imgs,
             rank=rank,
+            parallel_caching=parallel_caching,
+            cache_workers=cache_workers,
         )
         val_dataset = CenteredInstanceDataset(
             labels=val_labels,
@@ -1866,6 +2224,8 @@ def get_train_val_datasets(
             cache_img_path=val_cache_img_path,
             use_existing_imgs=use_existing_imgs,
             rank=rank,
+            parallel_caching=parallel_caching,
+            cache_workers=cache_workers,
         )
     elif model_type == "multi_class_topdown":
@@ -1906,6 +2266,8 @@ def get_train_val_datasets(
             cache_img_path=train_cache_img_path,
             use_existing_imgs=use_existing_imgs,
             rank=rank,
+            parallel_caching=parallel_caching,
+            cache_workers=cache_workers,
         )
         val_dataset = TopDownCenteredInstanceMultiClassDataset(
             labels=val_labels,
@@ -1931,6 +2293,8 @@ def get_train_val_datasets(
             cache_img_path=val_cache_img_path,
             use_existing_imgs=use_existing_imgs,
             rank=rank,
+            parallel_caching=parallel_caching,
+            cache_workers=cache_workers,
         )
     elif model_type == "centroid":
@@ -1967,6 +2331,8 @@ def get_train_val_datasets(
             cache_img_path=train_cache_img_path,
             use_existing_imgs=use_existing_imgs,
             rank=rank,
+            parallel_caching=parallel_caching,
+            cache_workers=cache_workers,
         )
         val_dataset = CentroidDataset(
             labels=val_labels,
@@ -1990,6 +2356,8 @@ def get_train_val_datasets(
             cache_img_path=val_cache_img_path,
             use_existing_imgs=use_existing_imgs,
             rank=rank,
+            parallel_caching=parallel_caching,
+            cache_workers=cache_workers,
         )
     else:
@@ -2022,6 +2390,8 @@ def get_train_val_datasets(
             cache_img_path=train_cache_img_path,
             use_existing_imgs=use_existing_imgs,
             rank=rank,
+            parallel_caching=parallel_caching,
+            cache_workers=cache_workers,
         )
         val_dataset = SingleInstanceDataset(
             labels=val_labels,
@@ -2044,6 +2414,8 @@ def get_train_val_datasets(
             cache_img_path=val_cache_img_path,
             use_existing_imgs=use_existing_imgs,
             rank=rank,
+            parallel_caching=parallel_caching,
+            cache_workers=cache_workers,
         )
     # If using caching, close the videos to prevent `h5py objects can't be pickled error` when num_workers > 0.

sleap-nn 0.0.5__py3-none-any.whl → 0.1.0__py3-none-any.whl

sleap-nn 0.0.5__py3-none-any.whl → 0.1.0__py3-none-any.whl