PyPI - kaiko-eva - Versions diffs - 0.1.8__py3-none-any.whl → 0.2.1__py3-none-any.whl - Mend

kaiko-eva 0.1.8__py3-none-any.whl → 0.2.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (94) hide show

eva/core/data/datasets/base.py +7 -2
eva/core/data/datasets/classification/embeddings.py +2 -2
eva/core/data/datasets/classification/multi_embeddings.py +2 -2
eva/core/data/datasets/embeddings.py +4 -4
eva/core/data/samplers/classification/balanced.py +19 -18
eva/core/loggers/utils/wandb.py +33 -0
eva/core/models/modules/head.py +5 -3
eva/core/models/modules/typings.py +2 -2
eva/core/models/transforms/__init__.py +2 -1
eva/core/models/transforms/as_discrete.py +57 -0
eva/core/models/wrappers/_utils.py +121 -1
eva/core/trainers/functional.py +8 -5
eva/core/trainers/trainer.py +32 -17
eva/core/utils/suppress_logs.py +28 -0
eva/vision/data/__init__.py +2 -2
eva/vision/data/dataloaders/__init__.py +5 -0
eva/vision/data/dataloaders/collate_fn/__init__.py +5 -0
eva/vision/data/dataloaders/collate_fn/collection.py +22 -0
eva/vision/data/datasets/__init__.py +10 -2
eva/vision/data/datasets/classification/__init__.py +9 -0
eva/vision/data/datasets/classification/bach.py +3 -4
eva/vision/data/datasets/classification/bracs.py +111 -0
eva/vision/data/datasets/classification/breakhis.py +209 -0
eva/vision/data/datasets/classification/camelyon16.py +4 -5
eva/vision/data/datasets/classification/crc.py +3 -4
eva/vision/data/datasets/classification/gleason_arvaniti.py +171 -0
eva/vision/data/datasets/classification/mhist.py +3 -4
eva/vision/data/datasets/classification/panda.py +4 -5
eva/vision/data/datasets/classification/patch_camelyon.py +3 -4
eva/vision/data/datasets/classification/unitopatho.py +158 -0
eva/vision/data/datasets/classification/wsi.py +6 -5
eva/vision/data/datasets/segmentation/__init__.py +2 -2
eva/vision/data/datasets/segmentation/_utils.py +47 -0
eva/vision/data/datasets/segmentation/bcss.py +7 -8
eva/vision/data/datasets/segmentation/btcv.py +236 -0
eva/vision/data/datasets/segmentation/consep.py +6 -7
eva/vision/data/datasets/segmentation/embeddings.py +2 -2
eva/vision/data/datasets/segmentation/lits.py +9 -8
eva/vision/data/datasets/segmentation/lits_balanced.py +2 -1
eva/vision/data/datasets/segmentation/monusac.py +4 -5
eva/vision/data/datasets/segmentation/total_segmentator_2d.py +12 -10
eva/vision/data/datasets/vision.py +95 -4
eva/vision/data/datasets/wsi.py +5 -5
eva/vision/data/transforms/__init__.py +22 -3
eva/vision/data/transforms/common/__init__.py +1 -2
eva/vision/data/transforms/croppad/__init__.py +11 -0
eva/vision/data/transforms/croppad/crop_foreground.py +110 -0
eva/vision/data/transforms/croppad/rand_crop_by_pos_neg_label.py +109 -0
eva/vision/data/transforms/croppad/spatial_pad.py +67 -0
eva/vision/data/transforms/intensity/__init__.py +11 -0
eva/vision/data/transforms/intensity/rand_scale_intensity.py +59 -0
eva/vision/data/transforms/intensity/rand_shift_intensity.py +55 -0
eva/vision/data/transforms/intensity/scale_intensity_ranged.py +56 -0
eva/vision/data/transforms/spatial/__init__.py +7 -0
eva/vision/data/transforms/spatial/flip.py +72 -0
eva/vision/data/transforms/spatial/rotate.py +53 -0
eva/vision/data/transforms/spatial/spacing.py +69 -0
eva/vision/data/transforms/utility/__init__.py +5 -0
eva/vision/data/transforms/utility/ensure_channel_first.py +51 -0
eva/vision/data/tv_tensors/__init__.py +5 -0
eva/vision/data/tv_tensors/volume.py +61 -0
eva/vision/metrics/segmentation/monai_dice.py +9 -2
eva/vision/models/modules/semantic_segmentation.py +28 -20
eva/vision/models/networks/backbones/__init__.py +9 -2
eva/vision/models/networks/backbones/pathology/__init__.py +11 -2
eva/vision/models/networks/backbones/pathology/bioptimus.py +47 -1
eva/vision/models/networks/backbones/pathology/hkust.py +69 -0
eva/vision/models/networks/backbones/pathology/kaiko.py +18 -0
eva/vision/models/networks/backbones/pathology/mahmood.py +46 -19
eva/vision/models/networks/backbones/radiology/__init__.py +11 -0
eva/vision/models/networks/backbones/radiology/swin_unetr.py +231 -0
eva/vision/models/networks/backbones/radiology/voco.py +75 -0
eva/vision/models/networks/decoders/segmentation/__init__.py +6 -2
eva/vision/models/networks/decoders/segmentation/linear.py +5 -10
eva/vision/models/networks/decoders/segmentation/semantic/__init__.py +8 -1
eva/vision/models/networks/decoders/segmentation/semantic/swin_unetr.py +104 -0
eva/vision/utils/io/__init__.py +2 -0
eva/vision/utils/io/nifti.py +91 -11
{kaiko_eva-0.1.8.dist-info → kaiko_eva-0.2.1.dist-info}/METADATA +3 -1
{kaiko_eva-0.1.8.dist-info → kaiko_eva-0.2.1.dist-info}/RECORD +83 -62
{kaiko_eva-0.1.8.dist-info → kaiko_eva-0.2.1.dist-info}/WHEEL +1 -1
eva/vision/data/datasets/classification/base.py +0 -96
eva/vision/data/datasets/segmentation/base.py +0 -96
eva/vision/data/transforms/common/resize_and_clamp.py +0 -51
eva/vision/data/transforms/normalization/__init__.py +0 -6
eva/vision/data/transforms/normalization/clamp.py +0 -43
eva/vision/data/transforms/normalization/functional/__init__.py +0 -5
eva/vision/data/transforms/normalization/functional/rescale_intensity.py +0 -28
eva/vision/data/transforms/normalization/rescale_intensity.py +0 -53
eva/vision/metrics/segmentation/BUILD +0 -1
eva/vision/models/networks/backbones/torchhub/__init__.py +0 -5
eva/vision/models/networks/backbones/torchhub/backbones.py +0 -61
{kaiko_eva-0.1.8.dist-info → kaiko_eva-0.2.1.dist-info}/entry_points.txt +0 -0
{kaiko_eva-0.1.8.dist-info → kaiko_eva-0.2.1.dist-info}/licenses/LICENSE +0 -0

eva/vision/data/datasets/classification/unitopatho.py ADDED Viewed

@@ -0,0 +1,158 @@
+"""UniToPatho dataset class."""
+import functools
+import glob
+import os
+from typing import Callable, Dict, List, Literal
+import pandas as pd
+import torch
+from torchvision import tv_tensors
+from typing_extensions import override
+from eva.vision.data.datasets import _validators, vision
+from eva.vision.utils import io
+class UniToPatho(vision.VisionDataset[tv_tensors.Image, torch.Tensor]):
+    """UniToPatho image classification dataset.
+    PNG images are collected recursively from `<root>/800`, while the label and
+    the train / val assignment of each image are read from the `train.csv` and
+    `test.csv` manifests located in that same directory.
+    """
+    _expected_dataset_lengths: Dict[str | None, int] = {
+        "train": 6270,
+        "val": 2399,
+        None: 8669,
+    }
+    """Number of samples expected per split (`None` stands for the full dataset)."""
+    _license: str = "CC BY 4.0 (https://creativecommons.org/licenses/by/4.0/)"
+    """License under which the dataset is distributed."""
+    def __init__(
+        self,
+        root: str,
+        split: Literal["train", "val"] | None = None,
+        transforms: Callable | None = None,
+    ) -> None:
+        """Creates the dataset object; no files are read at this point.
+        The train / validation partition takes the patient IDs into account
+        to avoid any data leakage.
+        Args:
+            root: Path to the root directory of the dataset.
+            split: Split to expose. With `None`, train and val are combined.
+            transforms: Optional callable which receives the raw samples and
+                returns their transformed version.
+        """
+        super().__init__(transforms=transforms)
+        self._split = split
+        self._root = root
+        # Filled in by `configure`; empty until then.
+        self._indices: List[int] = []
+    @property
+    @override
+    def classes(self) -> List[str]:
+        return ["HP", "NORM", "TA.HG", "TA.LG", "TVA.HG", "TVA.LG"]
+    @property
+    @override
+    def class_to_idx(self) -> Dict[str, int]:
+        return {name: position for position, name in enumerate(self.classes)}
+    @property
+    def _dataset_path(self) -> str:
+        """Directory (`<root>/800`) holding the images and the manifests."""
+        return os.path.join(self._root, "800")
+    @functools.cached_property
+    def _image_files(self) -> List[str]:
+        """Sorted paths of all PNG files found below the dataset directory.
+        Returns:
+            The image file paths in ascending lexicographic order.
+        """
+        pattern = os.path.join(self._dataset_path, "**/*.png")
+        return sorted(glob.glob(pattern, recursive=True))
+    @functools.cached_property
+    def _manifest(self) -> pd.DataFrame:
+        """Merges `train.csv` and `test.csv` into one frame indexed by `image_id`.
+        A `split` column is added: rows of `train.csv` are tagged "train" and
+        rows of `test.csv` are tagged "val".
+        """
+        frames = []
+        for csv_name, split_name in (("train.csv", "train"), ("test.csv", "val")):
+            frame = pd.read_csv(os.path.join(self._dataset_path, csv_name))
+            frame["split"] = split_name
+            frames.append(frame)
+        return pd.concat(frames, axis=0).set_index("image_id")
+    @override
+    def filename(self, index: int) -> str:
+        absolute_path = self._image_files[self._indices[index]]
+        return os.path.relpath(absolute_path, self._dataset_path)
+    @override
+    def prepare_data(self) -> None:
+        _validators.check_dataset_exists(self._root, True)
+    @override
+    def configure(self) -> None:
+        self._indices = self._make_indices()
+    @override
+    def validate(self) -> None:
+        expected_length = self._expected_dataset_lengths[self._split]
+        _validators.check_dataset_integrity(
+            self,
+            length=expected_length,
+            n_classes=6,
+            first_and_last_labels=("HP", "TVA.LG"),
+        )
+    @override
+    def load_data(self, index: int) -> tv_tensors.Image:
+        return io.read_image_as_tensor(self._image_files[self._indices[index]])
+    @override
+    def load_target(self, index: int) -> torch.Tensor:
+        image_file = self._image_files[self._indices[index]]
+        return torch.tensor(self._extract_class(image_file), dtype=torch.long)
+    @override
+    def __len__(self) -> int:
+        return len(self._indices)
+    def _print_license(self) -> None:
+        """Writes the dataset license to standard output."""
+        print(f"Dataset license: {self._license}")
+    def _extract_image_id(self, image_file: str) -> str:
+        """Returns the manifest key of an image, i.e. its base file name."""
+        return os.path.basename(image_file)
+    def _extract_class(self, file: str) -> int:
+        """Looks up the integer `top_label` of an image in the manifest."""
+        label = self._manifest.at[self._extract_image_id(file), "top_label"]
+        return int(label)
+    def _make_indices(self) -> List[int]:
+        """Collects the positions in `_image_files` that belong to the split.
+        Raises:
+            ValueError: If the manifest assigns an image to an unknown split.
+        """
+        train_positions: List[int] = []
+        val_positions: List[int] = []
+        for position, path in enumerate(self._image_files):
+            assigned = self._manifest.at[self._extract_image_id(path), "split"]
+            if assigned == "train":
+                bucket = train_positions
+            elif assigned == "val":
+                bucket = val_positions
+            else:
+                raise ValueError(f"Invalid split value found: {assigned}")
+            bucket.append(position)
+        per_split = {
+            "train": train_positions,
+            "val": val_positions,
+            None: train_positions + val_positions,
+        }
+        return per_split[self._split]

eva/vision/data/datasets/classification/wsi.py CHANGED Viewed

@@ -9,12 +9,13 @@ import torch
 from torchvision import tv_tensors
 from typing_extensions import override
-from eva.vision.data.datasets import wsi
-from eva.vision.data.datasets.classification import base
+from eva.vision.data.datasets import vision, wsi
 from eva.vision.data.wsi.patching import samplers
-class WsiClassificationDataset(wsi.MultiWsiDataset, base.ImageClassification):
+class WsiClassificationDataset(
+    wsi.MultiWsiDataset, vision.VisionDataset[tv_tensors.Image, torch.Tensor]
+):
     """A general dataset class for whole-slide image classification using manifest files."""
     default_column_mapping: Dict[str, str] = {
@@ -78,10 +79,10 @@ class WsiClassificationDataset(wsi.MultiWsiDataset, base.ImageClassification):
     @override
     def __getitem__(self, index: int) -> Tuple[tv_tensors.Image, torch.Tensor, Dict[str, Any]]:
-        return base.ImageClassification.__getitem__(self, index)
+        return vision.VisionDataset.__getitem__(self, index)
     @override
-    def load_image(self, index: int) -> tv_tensors.Image:
+    def load_data(self, index: int) -> tv_tensors.Image:
         return wsi.MultiWsiDataset.__getitem__(self, index)
     @override

eva/vision/data/datasets/segmentation/__init__.py CHANGED Viewed

@@ -1,7 +1,7 @@
 """Segmentation datasets API."""
-from eva.vision.data.datasets.segmentation.base import ImageSegmentation
 from eva.vision.data.datasets.segmentation.bcss import BCSS
+from eva.vision.data.datasets.segmentation.btcv import BTCV
 from eva.vision.data.datasets.segmentation.consep import CoNSeP
 from eva.vision.data.datasets.segmentation.embeddings import EmbeddingsSegmentationDataset
 from eva.vision.data.datasets.segmentation.lits import LiTS
@@ -10,8 +10,8 @@ from eva.vision.data.datasets.segmentation.monusac import MoNuSAC
 from eva.vision.data.datasets.segmentation.total_segmentator_2d import TotalSegmentator2D
 __all__ = [
-    "ImageSegmentation",
     "BCSS",
+    "BTCV",
     "CoNSeP",
     "EmbeddingsSegmentationDataset",
     "LiTS",

eva/vision/data/datasets/segmentation/_utils.py CHANGED Viewed

@@ -1,8 +1,12 @@
 from typing import Any, Tuple
 import numpy.typing as npt
+import torch
+from torchvision import tv_tensors
+from eva.vision.data import tv_tensors as eva_tv_tensors
 from eva.vision.data.datasets import wsi
+from eva.vision.utils import io
 def get_coords_at_index(
@@ -36,3 +40,46 @@ def extract_mask_patch(
     """
     (x, y), width, height = get_coords_at_index(dataset, index)
     return mask[y : y + height, x : x + width]
+def load_volume_tensor(file: str, orientation: str = "PLS") -> eva_tv_tensors.Volume:
+    """Read a NIfTI file into a :class:`eva.vision.data.tv_tensors.Volume`.
+    Args:
+        file: Location of the NIfTI file.
+        orientation: Orientation code the NIfTI image is reoriented to.
+    Returns:
+        The volume as a float32 tensor of shape `[T, C, H, W]`, where `C` is a
+        singleton axis and `T` is the third axis of the loaded array.
+    Raises:
+        ValueError: If the loaded NIfTI image has no affine matrix.
+    """
+    nifti_image = io.read_nifti(file, orientation=orientation)
+    voxels = io.nifti_to_array(nifti_image)
+    # Prepend a singleton channel axis, then move the third data axis to the front.
+    voxels_tchw = voxels[None, :, :, :].transpose(3, 0, 1, 2)
+    if nifti_image.affine is None:
+        raise ValueError(f"Affine matrix is missing for {file}.")
+    # Reorder the affine columns to (2, 0, 1, 3): third column first, last column kept.
+    permuted_affine = nifti_image.affine[:, [2, 0, 1, 3]]
+    affine = torch.tensor(permuted_affine, dtype=torch.float32)
+    return eva_tv_tensors.Volume(
+        voxels_tchw, affine=affine, dtype=torch.float32
+    )  # type: ignore
+def load_mask_tensor(
+    file: str, volume_file: str | None = None, orientation: str = "PLS"
+) -> tv_tensors.Mask:
+    """Load a mask from NIfTI file as :class:`torchvision.tv_tensors.Mask`.
+    Args:
+        file: The path to the NIfTI file containing the mask.
+        volume_file: The path to the volume file used as orientation reference in case
+            the mask file is missing the pixdim array in the NIfTI header.
+        orientation: The orientation code to reorient the nifti image.
+    Returns:
+        Mask tensor of shape `[T, C, H, W]` and dtype `torch.long`.
+    """
+    # Forward the caller's orientation code instead of a hard-coded "PLS", so that
+    # a mask can be loaded with the same orientation as its volume.
+    nii = io.read_nifti(file, orientation=orientation, orientation_reference=volume_file)
+    array = io.nifti_to_array(nii)
+    # Prepend a singleton channel axis, then move the third data axis to the front.
+    array_reshaped_tchw = array[None, :, :, :].transpose(3, 0, 1, 2)
+    return tv_tensors.Mask(array_reshaped_tchw, dtype=torch.long)  # type: ignore

eva/vision/data/datasets/segmentation/bcss.py CHANGED Viewed

@@ -12,13 +12,13 @@ from torchvision import tv_tensors
 from torchvision.transforms.v2 import functional
 from typing_extensions import override
-from eva.vision.data.datasets import _validators, wsi
-from eva.vision.data.datasets.segmentation import _utils, base
+from eva.vision.data.datasets import _validators, vision, wsi
+from eva.vision.data.datasets.segmentation import _utils
 from eva.vision.data.wsi.patching import samplers
 from eva.vision.utils import io
-class BCSS(wsi.MultiWsiDataset, base.ImageSegmentation):
+class BCSS(wsi.MultiWsiDataset, vision.VisionDataset[tv_tensors.Image, tv_tensors.Mask]):
     """Dataset class for BCSS semantic segmentation task.
     Source: https://github.com/PathologyDataScience/BCSS
@@ -71,7 +71,6 @@ class BCSS(wsi.MultiWsiDataset, base.ImageSegmentation):
             width: Width of the patches to be extracted, in pixels.
             height: Height of the patches to be extracted, in pixels.
             target_mpp: Target microns per pixel (mpp) for the patches.
-            backend: The backend to use for reading the whole-slide images.
             transforms: Transforms to apply to the extracted image & mask patches.
         """
         self._split = split
@@ -90,7 +89,7 @@ class BCSS(wsi.MultiWsiDataset, base.ImageSegmentation):
             overwrite_mpp=0.25,
             backend="pil",
         )
-        base.ImageSegmentation.__init__(self, transforms=transforms)
+        vision.VisionDataset.__init__(self, transforms=transforms)
     @property
     @override
@@ -129,15 +128,15 @@ class BCSS(wsi.MultiWsiDataset, base.ImageSegmentation):
     @override
     def __getitem__(self, index: int) -> Tuple[tv_tensors.Image, tv_tensors.Mask, Dict[str, Any]]:
-        return base.ImageSegmentation.__getitem__(self, index)
+        return vision.VisionDataset.__getitem__(self, index)
     @override
-    def load_image(self, index: int) -> tv_tensors.Image:
+    def load_data(self, index: int) -> tv_tensors.Image:
         image_array = wsi.MultiWsiDataset.__getitem__(self, index)
         return functional.to_image(image_array)
     @override
-    def load_mask(self, index: int) -> tv_tensors.Mask:
+    def load_target(self, index: int) -> tv_tensors.Mask:
         path = self._get_mask_path(index)
         mask = io.read_image_as_array(path)
         mask_patch = _utils.extract_mask_patch(mask, self, index)

eva/vision/data/datasets/segmentation/btcv.py ADDED Viewed

@@ -0,0 +1,236 @@
+"""BTCV dataset."""
+import glob
+import os
+import re
+from typing import Any, Callable, Dict, List, Literal, Tuple
+import huggingface_hub
+from torchvision import tv_tensors
+from torchvision.datasets import utils as data_utils
+from typing_extensions import override
+from eva.vision.data import tv_tensors as eva_tv_tensors
+from eva.vision.data.datasets import _utils as _data_utils
+from eva.vision.data.datasets.segmentation import _utils
+from eva.vision.data.datasets.vision import VisionDataset
+class BTCV(VisionDataset[eva_tv_tensors.Volume, tv_tensors.Mask]):
+    """Beyond the Cranial Vault (BTCV) Abdomen dataset.
+    The BTCV dataset comprises abdominal CT acquired at the Vanderbilt
+    University Medical Center from metastatic liver cancer patients or
+    post-operative ventral hernia patients. The dataset contains one
+    background class and thirteen organ classes.
+    More info:
+      - Multi-organ Abdominal CT Reference Standard Segmentations
+        https://zenodo.org/records/1169361
+      - Dataset Split
+        https://github.com/Luffy03/Large-Scale-Medical/blob/main/Downstream/monai/BTCV/dataset/dataset_0.json
+    """
+    _split_index_ranges = {
+        "train": [(0, 24)],
+        "val": [(24, 30)],
+        None: [(0, 30)],
+    }
+    """Sample index ranges of the dataset splits."""
+    def __init__(
+        self,
+        root: str,
+        split: Literal["train", "val"] | None = None,
+        download: bool = False,
+        transforms: Callable | None = None,
+    ) -> None:
+        """Initializes the dataset.
+        Args:
+            root: Path to the dataset root directory.
+            split: Dataset split to use ('train' or 'val').
+                If None, it uses the full dataset.
+            download: Whether to download the dataset.
+            transforms: A callable object for applying data transformations.
+                If None, no transformations are applied.
+        """
+        super().__init__(transforms=transforms)
+        self._root = root
+        self._split = split
+        self._download = download
+        # Both attributes are only declared here; `configure` assigns them.
+        self._samples: List[Tuple[str, str]]
+        self._indices: List[int]
+    @property
+    @override
+    def classes(self) -> List[str]:
+        return [
+            "background",
+            "spleen",
+            "right_kidney",
+            "left_kidney",
+            "gallbladder",
+            "esophagus",
+            "liver",
+            "stomach",
+            "aorta",
+            "inferior_vena_cava",
+            "portal_and_splenic_vein",
+            "pancreas",
+            "right_adrenal_gland",
+            "left_adrenal_gland",
+        ]
+    @property
+    @override
+    def class_to_idx(self) -> Dict[str, int]:
+        return {label: index for index, label in enumerate(self.classes)}
+    @override
+    def filename(self, index: int) -> str:
+        return os.path.basename(self._samples[self._indices[index]][0])
+    @override
+    def prepare_data(self) -> None:
+        if self._download:
+            self._download_dataset()
+    @override
+    def configure(self) -> None:
+        self._samples = self._find_samples()
+        self._indices = self._make_indices()
+    @override
+    def validate(self) -> None:
+        """Checks that every sample of the configured split exists on disk.
+        Raises:
+            OSError: If the split refers to samples which were not found, or if a
+                volume or segmentation file of the split is not an existing file.
+        """
+        # The split indices address `self._samples` by position, so the highest
+        # index (not the number of indices) determines how many samples are needed.
+        required_samples = max(self._indices, default=-1) + 1
+        if len(self._samples) < required_samples:
+            raise OSError(f"Dataset is missing {required_samples - len(self._samples)} files.")
+        # Resolve the samples through the split indices so that the error below
+        # reports the files of this split and not the first samples of the dataset.
+        invalid_samples = [
+            (volume_file, segmentation_file)
+            for volume_file, segmentation_file in (
+                self._samples[sample_index] for sample_index in self._indices
+            )
+            if not (os.path.isfile(volume_file) and os.path.isfile(segmentation_file))
+        ]
+        if invalid_samples:
+            raise OSError(
+                f"Dataset '{self.__class__.__qualname__}' contains missing or "
+                f"corrupted samples  ({len(invalid_samples)} in total). "
+                f"Examples of missing folders: {str(invalid_samples[:10])[:-1]}, ...]. "
+            )
+    @override
+    def __getitem__(
+        self, index: int
+    ) -> tuple[eva_tv_tensors.Volume, tv_tensors.Mask, dict[str, Any]]:
+        volume = self.load_data(index)
+        mask = self.load_target(index)
+        metadata = self.load_metadata(index) or {}
+        volume_tensor, mask_tensor = self._apply_transforms(volume, mask)
+        return volume_tensor, mask_tensor, metadata
+    @override
+    def __len__(self) -> int:
+        return len(self._indices)
+    @override
+    def load_data(self, index: int) -> eva_tv_tensors.Volume:
+        """Loads the CT volume for a given sample.
+        Args:
+            index: The index of the desired sample.
+        Returns:
+            Tensor representing the CT volume of shape `[T, C, H, W]`.
+        """
+        ct_scan_file, _ = self._samples[self._indices[index]]
+        return _utils.load_volume_tensor(ct_scan_file)
+    @override
+    def load_target(self, index: int) -> tv_tensors.Mask:
+        """Loads the segmentation mask for a given sample.
+        Args:
+            index: The index of the desired sample.
+        Returns:
+            Tensor representing the segmentation mask of shape `[T, C, H, W]`.
+        """
+        ct_scan_file, mask_file = self._samples[self._indices[index]]
+        # The CT volume is passed along as the orientation reference of the mask.
+        return _utils.load_mask_tensor(mask_file, ct_scan_file)
+    def _apply_transforms(
+        self, ct_scan: eva_tv_tensors.Volume, mask: tv_tensors.Mask
+    ) -> tuple[eva_tv_tensors.Volume, tv_tensors.Mask]:
+        """Applies transformations to the provided data.
+        Args:
+            ct_scan: The CT volume tensor.
+            mask: The segmentation mask tensor.
+        Returns:
+            A tuple containing the transformed CT and mask tensors, or the
+            inputs unchanged when no transforms are set.
+        """
+        return self._transforms(ct_scan, mask) if self._transforms else (ct_scan, mask)
+    def _find_samples(self) -> list[tuple[str, str]]:
+        """Retrieves the file paths for the CT volumes and segmentations.
+        Files are searched in `imagesTr` and `labelsTr` below `<root>/BTCV` when
+        that directory exists, otherwise directly below `<root>`. A volume and a
+        segmentation are paired when their paths end in the same numeric id.
+        Returns:
+            A list of (volume path, segmentation path) pairs sorted by id. Ids
+            which are present in only one of the two folders are dropped.
+        Raises:
+            ValueError: If a file path contains no numeric id.
+        """
+        def filename_id(filename: str) -> int:
+            # The greedy prefix makes the group capture the last run of digits.
+            matches = re.match(r".*(?:\D|^)(\d+)", filename)
+            if matches is None:
+                raise ValueError(f"Filename '{filename}' is not valid.")
+            return int(matches.group(1))
+        subdir = os.path.join(self._root, "BTCV")
+        root = subdir if os.path.isdir(subdir) else self._root
+        volume_files_pattern = os.path.join(root, "imagesTr", "*.nii.gz")
+        volume_filenames = glob.glob(volume_files_pattern)
+        volume_ids = {filename_id(filename): filename for filename in volume_filenames}
+        segmentation_files_pattern = os.path.join(root, "labelsTr", "*.nii.gz")
+        segmentation_filenames = glob.glob(segmentation_files_pattern)
+        segmentation_ids = {filename_id(filename): filename for filename in segmentation_filenames}
+        return [
+            (volume_ids[file_id], segmentation_ids[file_id])
+            for file_id in sorted(volume_ids.keys() & segmentation_ids.keys())
+        ]
+    def _make_indices(self) -> list[int]:
+        """Builds the dataset indices for the specified split.
+        Raises:
+            ValueError: If the configured split has no entry in `_split_index_ranges`.
+        """
+        index_ranges = self._split_index_ranges.get(self._split)
+        if index_ranges is None:
+            raise ValueError("Invalid data split. Use 'train', 'val' or `None`.")
+        return _data_utils.ranges_to_indices(index_ranges)
+    def _download_dataset(self) -> None:
+        """Downloads `BTCV.zip` from the Hugging Face Hub and extracts it into the root.
+        The archive is removed after it has been extracted.
+        Raises:
+            ValueError: If the `HF_TOKEN` environment variable is not set.
+            FileNotFoundError: If the archive is not present after the download.
+        """
+        hf_token = os.getenv("HF_TOKEN")
+        if not hf_token:
+            raise ValueError("Huggingface token required, please set the HF_TOKEN env variable.")
+        huggingface_hub.snapshot_download(
+            "Luffy503/VoCo_Downstream",
+            repo_type="dataset",
+            token=hf_token,
+            local_dir=self._root,
+            ignore_patterns=[".git*"],
+            allow_patterns=["BTCV.zip"],
+        )
+        zip_path = os.path.join(self._root, "BTCV.zip")
+        if not os.path.exists(zip_path):
+            raise FileNotFoundError(
+                f"BTCV.zip not found in {self._root}, something with the download went wrong."
+            )
+        data_utils.extract_archive(zip_path, self._root, remove_finished=True)

eva/vision/data/datasets/segmentation/consep.py CHANGED Viewed

@@ -11,13 +11,13 @@ from torchvision import tv_tensors
 from torchvision.transforms.v2 import functional
 from typing_extensions import override
-from eva.vision.data.datasets import _validators, wsi
-from eva.vision.data.datasets.segmentation import _utils, base
+from eva.vision.data.datasets import _validators, vision, wsi
+from eva.vision.data.datasets.segmentation import _utils
 from eva.vision.data.wsi.patching import samplers
 from eva.vision.utils import io
-class CoNSeP(wsi.MultiWsiDataset, base.ImageSegmentation):
+class CoNSeP(wsi.MultiWsiDataset, vision.VisionDataset[tv_tensors.Image, tv_tensors.Mask]):
     """Dataset class for CoNSeP semantic segmentation task.
     As in [1], we combine classes 3 (healthy epithelial) & 4 (dysplastic/malignant epithelial)
@@ -55,7 +55,6 @@ class CoNSeP(wsi.MultiWsiDataset, base.ImageSegmentation):
             width: Width of the patches to be extracted, in pixels.
             height: Height of the patches to be extracted, in pixels.
             target_mpp: Target microns per pixel (mpp) for the patches.
-            backend: The backend to use for reading the whole-slide images.
             transforms: Transforms to apply to the extracted image & mask patches.
         """
         self._split = split
@@ -112,15 +111,15 @@ class CoNSeP(wsi.MultiWsiDataset, base.ImageSegmentation):
     @override
     def __getitem__(self, index: int) -> Tuple[tv_tensors.Image, tv_tensors.Mask, Dict[str, Any]]:
-        return base.ImageSegmentation.__getitem__(self, index)
+        return vision.VisionDataset.__getitem__(self, index)
     @override
-    def load_image(self, index: int) -> tv_tensors.Image:
+    def load_data(self, index: int) -> tv_tensors.Image:
         image_array = wsi.MultiWsiDataset.__getitem__(self, index)
         return functional.to_image(image_array)
     @override
-    def load_mask(self, index: int) -> tv_tensors.Mask:
+    def load_target(self, index: int) -> tv_tensors.Mask:
         path = self._get_mask_path(index)
         mask = np.array(io.read_mat(path)["type_map"])
         mask_patch = _utils.extract_mask_patch(mask, self, index)

eva/vision/data/datasets/segmentation/embeddings.py CHANGED Viewed

@@ -14,7 +14,7 @@ class EmbeddingsSegmentationDataset(embeddings_base.EmbeddingsDataset[tv_tensors
     """Embeddings segmentation dataset."""
     @override
-    def _load_embeddings(self, index: int) -> List[torch.Tensor]:
+    def load_embeddings(self, index: int) -> List[torch.Tensor]:
         filename = self.filename(index)
         embeddings_path = os.path.join(self._root, filename)
         embeddings = torch.load(embeddings_path, map_location="cpu")
@@ -23,7 +23,7 @@ class EmbeddingsSegmentationDataset(embeddings_base.EmbeddingsDataset[tv_tensors
         return [tensor.squeeze(0) for tensor in embeddings]
     @override
-    def _load_target(self, index: int) -> tv_tensors.Mask:
+    def load_target(self, index: int) -> tv_tensors.Mask:
         filename = self._data.at[index, self._column_mapping["target"]]
         mask_path = os.path.join(self._root, filename)
         semantic_labels = torch.load(mask_path, map_location="cpu")

eva/vision/data/datasets/segmentation/lits.py CHANGED Viewed

@@ -13,12 +13,11 @@ from typing_extensions import override
 from eva.core import utils
 from eva.core.data import splitting
-from eva.vision.data.datasets import _validators
-from eva.vision.data.datasets.segmentation import base
+from eva.vision.data.datasets import _validators, vision
 from eva.vision.utils import io
-class LiTS(base.ImageSegmentation):
+class LiTS(vision.VisionDataset[tv_tensors.Image, tv_tensors.Mask]):
     """LiTS - Liver Tumor Segmentation Challenge.
     Webpage: https://competitions.codalab.org/competitions/17094
@@ -110,21 +109,23 @@ class LiTS(base.ImageSegmentation):
         )
     @override
-    def load_image(self, index: int) -> tv_tensors.Image:
+    def load_data(self, index: int) -> tv_tensors.Image:
         sample_index, slice_index = self._indices[index]
         volume_path = self._volume_files[sample_index]
-        image_array = io.read_nifti(volume_path, slice_index)
+        image_nii = io.read_nifti(volume_path, slice_index)
+        image_array = io.nifti_to_array(image_nii)
         if self._fix_orientation:
             image_array = self._orientation(image_array, sample_index)
         return tv_tensors.Image(image_array.transpose(2, 0, 1))
     @override
-    def load_mask(self, index: int) -> tv_tensors.Mask:
+    def load_target(self, index: int) -> tv_tensors.Mask:
         sample_index, slice_index = self._indices[index]
         segmentation_path = self._segmentation_file(sample_index)
-        semantic_labels = io.read_nifti(segmentation_path, slice_index)
+        mask_nii = io.read_nifti(segmentation_path, slice_index)
+        # Bind the labels unconditionally, so that the return statement below also
+        # works when orientation fixing is disabled.
+        semantic_labels = io.nifti_to_array(mask_nii)
         if self._fix_orientation:
             semantic_labels = self._orientation(semantic_labels, sample_index)
         return tv_tensors.Mask(semantic_labels.squeeze(), dtype=torch.int64)  # type: ignore[reportCallIssue]
     def _orientation(self, array: npt.NDArray, sample_index: int) -> npt.NDArray:

eva/vision/data/datasets/segmentation/lits_balanced.py CHANGED Viewed

@@ -64,7 +64,8 @@ class LiTSBalanced(lits.LiTS):
             if sample_idx not in split_indices:
                 continue
-            segmentation = io.read_nifti(self._segmentation_file(sample_idx))
+            segmentation_nii = io.read_nifti(self._segmentation_file(sample_idx))
+            segmentation = io.nifti_to_array(segmentation_nii)
             tumor_filter = segmentation == 2
             tumor_slice_filter = tumor_filter.sum(axis=(0, 1)) > 0

kaiko-eva 0.1.8__py3-none-any.whl → 0.2.1__py3-none-any.whl

kaiko-eva 0.1.8__py3-none-any.whl → 0.2.1__py3-none-any.whl