maite-datasets 0.0.5-py3-none-any.whl → 0.0.6-py3-none-any.whl

This diff shows the changes between publicly released package versions as they appear in their respective public registries, and is provided for informational purposes only.
Files changed (32)
  1. maite_datasets/__init__.py +2 -6
  2. maite_datasets/_base.py +169 -51
  3. maite_datasets/_builder.py +46 -55
  4. maite_datasets/_collate.py +2 -3
  5. maite_datasets/{_reader/_base.py → _reader.py} +62 -36
  6. maite_datasets/_validate.py +4 -2
  7. maite_datasets/image_classification/_cifar10.py +12 -7
  8. maite_datasets/image_classification/_mnist.py +15 -10
  9. maite_datasets/image_classification/_ships.py +12 -8
  10. maite_datasets/object_detection/__init__.py +4 -7
  11. maite_datasets/object_detection/_antiuav.py +11 -8
  12. maite_datasets/{_reader → object_detection}/_coco.py +29 -27
  13. maite_datasets/object_detection/_milco.py +11 -9
  14. maite_datasets/object_detection/_seadrone.py +11 -9
  15. maite_datasets/object_detection/_voc.py +11 -13
  16. maite_datasets/{_reader → object_detection}/_yolo.py +26 -21
  17. maite_datasets/protocols.py +23 -0
  18. maite_datasets/wrappers/__init__.py +8 -0
  19. maite_datasets/wrappers/_torch.py +111 -0
  20. {maite_datasets-0.0.5.dist-info → maite_datasets-0.0.6.dist-info}/METADATA +56 -3
  21. maite_datasets-0.0.6.dist-info/RECORD +26 -0
  22. maite_datasets/_mixin/__init__.py +0 -0
  23. maite_datasets/_mixin/_numpy.py +0 -28
  24. maite_datasets/_mixin/_torch.py +0 -28
  25. maite_datasets/_protocols.py +0 -217
  26. maite_datasets/_reader/__init__.py +0 -6
  27. maite_datasets/_reader/_factory.py +0 -64
  28. maite_datasets/_types.py +0 -50
  29. maite_datasets/object_detection/_voc_torch.py +0 -65
  30. maite_datasets-0.0.5.dist-info/RECORD +0 -31
  31. {maite_datasets-0.0.5.dist-info → maite_datasets-0.0.6.dist-info}/WHEEL +0 -0
  32. {maite_datasets-0.0.5.dist-info → maite_datasets-0.0.6.dist-info}/licenses/LICENSE +0 -0
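
The moves above amount to an API reorganization: the dataset readers leave the private _reader package for object_detection, the _mixin and _protocols/_types modules fold into _base and a new public protocols.py, and optional Torch support moves into a new wrappers package. A minimal migration sketch for downstream imports, inferred from the file moves above (the old private paths are shown as comments; treat the exact 0.0.5 import sites as assumptions):

# Hypothetical 0.0.5 -> 0.0.6 import migration, based on the file list above.

# 0.0.5 (modules removed in 0.0.6):
# from maite_datasets._reader._coco import COCODatasetReader
# from maite_datasets._mixin._numpy import BaseDatasetNumpyMixin
# from maite_datasets._protocols import Transform

# 0.0.6 equivalents:
from maite_datasets.object_detection import COCODatasetReader, YOLODatasetReader
from maite_datasets._base import BaseDatasetNumpyMixin, NumpyArray
from maite_datasets.protocols import Array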

maite_datasets/image_classification/_cifar10.py
@@ -2,15 +2,20 @@ from __future__ import annotations
 
 __all__ = []
 
+from collections.abc import Sequence
 from pathlib import Path
-from typing import Any, Literal, Sequence, TypeVar
+from typing import Any, Literal, TypeVar
 
 import numpy as np
 from numpy.typing import NDArray
 
-from maite_datasets._base import BaseICDataset, DataLocation
-from maite_datasets._mixin._numpy import BaseDatasetNumpyMixin
-from maite_datasets._protocols import Transform
+from maite_datasets._base import (
+    BaseDatasetNumpyMixin,
+    BaseICDataset,
+    DataLocation,
+    NumpyArray,
+    NumpyImageClassificationTransform,
+)
 
 CIFARClassStringMap = Literal[
     "airplane",
@@ -27,7 +32,7 @@ CIFARClassStringMap = Literal[
 TCIFARClassMap = TypeVar("TCIFARClassMap", CIFARClassStringMap, int, list[CIFARClassStringMap], list[int])
 
 
-class CIFAR10(BaseICDataset[NDArray[np.number[Any]]], BaseDatasetNumpyMixin):
+class CIFAR10(BaseICDataset[NumpyArray], BaseDatasetNumpyMixin):
     """
     `CIFAR10 <https://www.cs.toronto.edu/~kriz/cifar.html>`_ Dataset as NumPy arrays.
 
@@ -89,7 +94,7 @@ class CIFAR10(BaseICDataset[NDArray[np.number[Any]]], BaseDatasetNumpyMixin):
         self,
         root: str | Path,
         image_set: Literal["train", "test", "base"] = "train",
-        transforms: Transform[NDArray[np.number[Any]]] | Sequence[Transform[NDArray[np.number[Any]]]] | None = None,
+        transforms: NumpyImageClassificationTransform | Sequence[NumpyImageClassificationTransform] | None = None,
         download: bool = False,
         verbose: bool = False,
     ) -> None:
@@ -214,7 +219,7 @@ class CIFAR10(BaseICDataset[NDArray[np.number[Any]]], BaseDatasetNumpyMixin):
             images[i, 2] = blue_channel  # Blue channel
         return images, labels
 
-    def _read_file(self, path: str) -> NDArray[np.number[Any]]:
+    def _read_file(self, path: str) -> NumpyArray:
         """
         Function to grab the correct image from the loaded data.
         Overwrite of the base `_read_file` because data is an all or nothing load.
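
The transforms parameter now takes NumpyImageClassificationTransform callables (or a sequence of them) instead of the generic Transform[NDArray[np.number[Any]]]. A minimal usage sketch, assuming a transform is any callable over a single CHW NumPy image (as the 0.0.5 Transform protocol was) and that CIFAR10 is re-exported from the image_classification subpackage the way the object-detection names are:

import numpy as np

from maite_datasets.image_classification import CIFAR10

def to_unit_interval(image: np.ndarray) -> np.ndarray:
    # Hypothetical transform: scale uint8 pixels into [0, 1].
    return image.astype(np.float32) / 255.0

dataset = CIFAR10(root="./data", image_set="train", transforms=to_unit_interval, download=True)
image, label, metadata = dataset[0]  # MAITE-style (input, target, metadata) triple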

maite_datasets/image_classification/_mnist.py
@@ -2,15 +2,20 @@ from __future__ import annotations
 
 __all__ = []
 
+from collections.abc import Sequence
 from pathlib import Path
-from typing import Any, Literal, Sequence, TypeVar
+from typing import Any, Literal, TypeVar
 
 import numpy as np
 from numpy.typing import NDArray
 
-from maite_datasets._base import BaseICDataset, DataLocation
-from maite_datasets._mixin._numpy import BaseDatasetNumpyMixin
-from maite_datasets._protocols import Transform
+from maite_datasets._base import (
+    BaseDatasetNumpyMixin,
+    BaseICDataset,
+    DataLocation,
+    NumpyArray,
+    NumpyImageClassificationTransform,
+)
 
 MNISTClassStringMap = Literal["zero", "one", "two", "three", "four", "five", "six", "seven", "eight", "nine"]
 TMNISTClassMap = TypeVar("TMNISTClassMap", MNISTClassStringMap, int, list[MNISTClassStringMap], list[int])
@@ -34,7 +39,7 @@ CorruptionStringMap = Literal[
 ]
 
 
-class MNIST(BaseICDataset[NDArray[np.number[Any]]], BaseDatasetNumpyMixin):
+class MNIST(BaseICDataset[NumpyArray], BaseDatasetNumpyMixin):
     """`MNIST <https://en.wikipedia.org/wiki/MNIST_database>`_ Dataset and `Corruptions <https://arxiv.org/abs/1906.02337>`_.
 
     There are 15 different styles of corruptions. This class downloads differently depending on if you
@@ -118,7 +123,7 @@ class MNIST(BaseICDataset[NDArray[np.number[Any]]], BaseDatasetNumpyMixin):
         root: str | Path,
         image_set: Literal["train", "test", "base"] = "train",
         corruption: CorruptionStringMap | None = None,
-        transforms: Transform[NDArray[np.number[Any]]] | Sequence[Transform[NDArray[np.number[Any]]]] | None = None,
+        transforms: NumpyImageClassificationTransform | Sequence[NumpyImageClassificationTransform] | None = None,
         download: bool = False,
         verbose: bool = False,
     ) -> None:
@@ -149,7 +154,7 @@ class MNIST(BaseICDataset[NDArray[np.number[Any]]], BaseDatasetNumpyMixin):
         index_strings = np.arange(self._loaded_data.shape[0]).astype(str).tolist()
         return index_strings, labels.tolist(), {}
 
-    def _load_corruption(self) -> tuple[NDArray[np.number[Any]], NDArray[np.uintp]]:
+    def _load_corruption(self) -> tuple[NumpyArray, NDArray[np.uintp]]:
         """Function to load in the file paths for the data and labels for the different corrupt data formats"""
         corruption = self.corruption if self.corruption is not None else "identity"
         base_path = self.path / "mnist_c" / corruption
@@ -176,7 +181,7 @@ class MNIST(BaseICDataset[NDArray[np.number[Any]]], BaseDatasetNumpyMixin):
 
         return data, labels
 
-    def _grab_data(self, path: Path) -> tuple[NDArray[np.number[Any]], NDArray[np.uintp]]:
+    def _grab_data(self, path: Path) -> tuple[NumpyArray, NDArray[np.uintp]]:
         """Function to load in the data numpy array"""
         with np.load(path, allow_pickle=True) as data_array:
             if self.image_set == "base":
@@ -190,11 +195,11 @@ class MNIST(BaseICDataset[NDArray[np.number[Any]]], BaseDatasetNumpyMixin):
             data = np.expand_dims(data, axis=1)
         return data, labels
 
-    def _grab_corruption_data(self, path: Path) -> NDArray[np.number[Any]]:
+    def _grab_corruption_data(self, path: Path) -> NumpyArray:
         """Function to load in the data numpy array for the previously chosen corrupt format"""
         return np.load(path, allow_pickle=False)
 
-    def _read_file(self, path: str) -> NDArray[np.number[Any]]:
+    def _read_file(self, path: str) -> NumpyArray:
         """
         Function to grab the correct image from the loaded data.
         Overwrite of the base `_read_file` because data is an all or nothing load.
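
MNIST gets the same transform rework plus the corruption selector visible in _load_corruption, which falls back to the "identity" (uncorrupted) variant when none is chosen. A short sketch under the same re-export assumption as the CIFAR10 example:

from maite_datasets.image_classification import MNIST

# "identity" is the baseline folder _load_corruption defaults to; the other
# CorruptionStringMap values are elided from this diff.
corrupted = MNIST(root="./data", image_set="test", corruption="identity", download=True)
print(len(corrupted))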

maite_datasets/image_classification/_ships.py
@@ -2,18 +2,22 @@ from __future__ import annotations
 
 __all__ = []
 
+from collections.abc import Sequence
 from pathlib import Path
-from typing import Any, Sequence
+from typing import Any
 
 import numpy as np
-from numpy.typing import NDArray
 
-from maite_datasets._base import BaseICDataset, DataLocation
-from maite_datasets._mixin._numpy import BaseDatasetNumpyMixin
-from maite_datasets._protocols import Transform
+from maite_datasets._base import (
+    BaseDatasetNumpyMixin,
+    BaseICDataset,
+    DataLocation,
+    NumpyArray,
+    NumpyImageClassificationTransform,
+)
 
 
-class Ships(BaseICDataset[NDArray[np.number[Any]]], BaseDatasetNumpyMixin):
+class Ships(BaseICDataset[NumpyArray], BaseDatasetNumpyMixin):
     """
     A dataset that focuses on identifying ships from satellite images.
 
@@ -76,7 +80,7 @@ class Ships(BaseICDataset[NDArray[np.number[Any]]], BaseDatasetNumpyMixin):
     def __init__(
         self,
         root: str | Path,
-        transforms: Transform[NDArray[np.number[Any]]] | Sequence[Transform[NDArray[np.number[Any]]]] | None = None,
+        transforms: NumpyImageClassificationTransform | Sequence[NumpyImageClassificationTransform] | None = None,
         download: bool = False,
         verbose: bool = False,
     ) -> None:
@@ -125,7 +129,7 @@ class Ships(BaseICDataset[NDArray[np.number[Any]]], BaseDatasetNumpyMixin):
         """Function to load in the file paths for the scene images"""
         return sorted(str(entry) for entry in (self.path / "scenes").glob("*.png"))
 
-    def get_scene(self, index: int) -> NDArray[np.number[Any]]:
+    def get_scene(self, index: int) -> NumpyArray:
         """
         Get the desired satellite image (scene) by passing in the index of the desired file.
 

maite_datasets/object_detection/__init__.py
@@ -1,20 +1,17 @@
 """Module for MAITE compliant Object Detection datasets."""
 
 from maite_datasets.object_detection._antiuav import AntiUAVDetection
+from maite_datasets.object_detection._coco import COCODatasetReader
 from maite_datasets.object_detection._milco import MILCO
 from maite_datasets.object_detection._seadrone import SeaDrone
 from maite_datasets.object_detection._voc import VOCDetection
+from maite_datasets.object_detection._yolo import YOLODatasetReader
 
 __all__ = [
     "AntiUAVDetection",
     "MILCO",
     "SeaDrone",
     "VOCDetection",
+    "COCODatasetReader",
+    "YOLODatasetReader",
 ]
-
-import importlib.util
-
-if importlib.util.find_spec("torch") is not None:
-    from maite_datasets.object_detection._voc_torch import VOCDetectionTorch
-
-    __all__ += ["VOCDetectionTorch"]
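
With the readers promoted out of _reader, the conditional Torch import (and VOCDetectionTorch, whose module is deleted in this release, file 29 above) no longer lives here; optional Torch support moves to the new wrappers package shown later. Everything in this namespace now imports unconditionally:

from maite_datasets.object_detection import (
    MILCO,
    AntiUAVDetection,
    COCODatasetReader,
    SeaDrone,
    VOCDetection,
    YOLODatasetReader,
)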

maite_datasets/object_detection/_antiuav.py
@@ -2,19 +2,22 @@ from __future__ import annotations
 
 __all__ = []
 
+from collections.abc import Sequence
 from pathlib import Path
-from typing import Any, Literal, Sequence
+from typing import Any, Literal
 
-import numpy as np
 from defusedxml.ElementTree import parse
-from numpy.typing import NDArray
 
-from maite_datasets._base import BaseODDataset, DataLocation
-from maite_datasets._mixin._numpy import BaseDatasetNumpyMixin
-from maite_datasets._protocols import Transform
+from maite_datasets._base import (
+    BaseDatasetNumpyMixin,
+    BaseODDataset,
+    DataLocation,
+    NumpyArray,
+    NumpyObjectDetectionTransform,
+)
 
 
-class AntiUAVDetection(BaseODDataset[NDArray[np.number[Any]], list[str], str], BaseDatasetNumpyMixin):
+class AntiUAVDetection(BaseODDataset[NumpyArray, list[str], str], BaseDatasetNumpyMixin):
     """
     A UAV detection dataset focused on detecting UAVs in natural images against large variation in backgrounds.
 
@@ -101,7 +104,7 @@ class AntiUAVDetection(BaseODDataset[NDArray[np.number[Any]], list[str], str], B
         self,
         root: str | Path,
         image_set: Literal["train", "val", "test", "base"] = "train",
-        transforms: Transform[NDArray[np.number[Any]]] | Sequence[Transform[NDArray[np.number[Any]]]] | None = None,
+        transforms: NumpyObjectDetectionTransform | Sequence[NumpyObjectDetectionTransform] | None = None,
         download: bool = False,
         verbose: bool = False,
     ) -> None:

maite_datasets/{_reader → object_detection}/_coco.py
@@ -3,20 +3,19 @@
 from __future__ import annotations
 
 import json
-import logging
 from pathlib import Path
 from typing import Any
 
+import maite.protocols.object_detection as od
 import numpy as np
+from maite.protocols import DatasetMetadata, DatumMetadata
 from PIL import Image
 
-from maite_datasets._protocols import DatasetMetadata, DatumMetadata, ObjectDetectionDataset, ObjectDetectionDatum
-from maite_datasets._reader._base import _ObjectDetectionTarget, BaseDatasetReader
+from maite_datasets._base import BaseDataset, ObjectDetectionTarget
+from maite_datasets._reader import BaseDatasetReader
 
-_logger = logging.getLogger(__name__)
 
-
-class COCODatasetReader(BaseDatasetReader):
+class COCODatasetReader(BaseDatasetReader[od.Dataset]):
     """
     COCO format dataset reader conforming to MAITE protocols.
 
@@ -132,9 +131,9 @@ class COCODatasetReader(BaseDatasetReader):
         """Mapping from class index to class name."""
         return self._index2label
 
-    def _create_dataset_implementation(self) -> ObjectDetectionDataset:
+    def create_dataset(self) -> od.Dataset:
         """Create COCO dataset implementation."""
-        return _COCODataset(self)
+        return COCODataset(self)
 
     def _validate_format_specific(self) -> tuple[list[str], dict[str, Any]]:
         """Validate COCO format specific files and structure."""
@@ -198,37 +197,40 @@
         else:
             class_names = [cat["name"] for cat in self._coco_data["categories"]]
 
-        self._index2label = {idx: name for idx, name in enumerate(class_names)}
+        self._index2label = dict(enumerate(class_names))
 
 
-class _COCODataset:
+class COCODataset(BaseDataset):
     """Internal COCO dataset implementation."""
 
     def __init__(self, reader: COCODatasetReader) -> None:
-        self.reader = reader
-        self.image_ids = list(reader._image_id_to_info.keys())
-
-    @property
-    def metadata(self) -> DatasetMetadata:
-        return DatasetMetadata(
-            id=self.reader.dataset_id,
-            index2label=self.reader.index2label,
+        self._reader = reader
+        self._image_ids = list(reader._image_id_to_info.keys())
+
+        self.root = reader.dataset_path
+        self.images_path = reader._images_path
+        self.annotation_path = reader._annotation_path
+        self.size = len(reader._image_id_to_info)
+        self.classes = reader.index2label
+        self.metadata = DatasetMetadata(
+            id=self._reader.dataset_id,
+            index2label=self._reader.index2label,
         )
 
     def __len__(self) -> int:
-        return len(self.image_ids)
+        return len(self._image_ids)
 
-    def __getitem__(self, index: int) -> ObjectDetectionDatum:
-        image_id = self.image_ids[index]
-        image_info = self.reader._image_id_to_info[image_id]
+    def __getitem__(self, index: int) -> tuple[od.InputType, od.ObjectDetectionTarget, DatumMetadata]:
+        image_id = self._image_ids[index]
+        image_info = self._reader._image_id_to_info[image_id]
 
         # Load image
-        image_path = self.reader._images_path / image_info["file_name"]
+        image_path = self._reader._images_path / image_info["file_name"]
         image = np.array(Image.open(image_path).convert("RGB"))
         image = np.transpose(image, (2, 0, 1))  # Convert to CHW format
 
         # Get annotations for this image
-        annotations = self.reader.image_id_to_annotations.get(image_id, [])
+        annotations = self._reader.image_id_to_annotations.get(image_id, [])
 
         if annotations:
             boxes = []
@@ -241,7 +243,7 @@ class _COCODataset:
                 boxes.append([x, y, x + w, y + h])
 
                 # Map category_id to class index
-                cat_idx = self.reader._category_id_to_idx[ann["category_id"]]
+                cat_idx = self._reader._category_id_to_idx[ann["category_id"]]
                 labels.append(cat_idx)
 
                 # Collect annotation metadata
@@ -267,12 +269,12 @@
             scores = np.empty(0, dtype=np.float32)
             annotation_metadata = []
 
-        target = _ObjectDetectionTarget(boxes, labels, scores)
+        target = ObjectDetectionTarget(boxes, labels, scores)
 
         # Create comprehensive datum metadata
         datum_metadata = DatumMetadata(
             **{
-                "id": f"{self.reader.dataset_id}_{image_id}",
+                "id": f"{self._reader.dataset_id}_{image_id}",
                 # Image-level metadata
                 "coco_image_id": image_id,
                 "file_name": image_info["file_name"],

maite_datasets/object_detection/_milco.py
@@ -2,18 +2,20 @@ from __future__ import annotations
 
 __all__ = []
 
+from collections.abc import Sequence
 from pathlib import Path
-from typing import Any, Literal, Sequence
+from typing import Any, Literal
 
-import numpy as np
-from numpy.typing import NDArray
+from maite_datasets._base import (
+    BaseDatasetNumpyMixin,
+    BaseODDataset,
+    DataLocation,
+    NumpyArray,
+    NumpyObjectDetectionTransform,
+)
 
-from maite_datasets._base import BaseODDataset, DataLocation
-from maite_datasets._mixin._numpy import BaseDatasetNumpyMixin
-from maite_datasets._protocols import Transform
 
-
-class MILCO(BaseODDataset[NDArray[np.number[Any]], list[str], str], BaseDatasetNumpyMixin):
+class MILCO(BaseODDataset[NumpyArray, list[str], str], BaseDatasetNumpyMixin):
     """
     A side-scan sonar dataset focused on mine-like object detection.
 
@@ -116,7 +118,7 @@ class MILCO(BaseODDataset[NDArray[np.number[Any]], list[str], str], BaseDatasetN
         self,
         root: str | Path,
         image_set: Literal["train", "operational", "base"] = "train",
-        transforms: Transform[NDArray[np.number[Any]]] | Sequence[Transform[NDArray[np.number[Any]]]] | None = None,
+        transforms: NumpyObjectDetectionTransform | Sequence[NumpyObjectDetectionTransform] | None = None,
         download: bool = False,
         verbose: bool = False,
     ) -> None:

maite_datasets/object_detection/_seadrone.py
@@ -3,21 +3,23 @@ from __future__ import annotations
 __all__ = []
 
 import json
+from collections.abc import Sequence
 from pathlib import Path
-from typing import Any, Literal, Sequence
+from typing import Any, Literal
 
-import numpy as np
-from numpy.typing import NDArray
-
-from maite_datasets._base import BaseODDataset, DataLocation
+from maite_datasets._base import (
+    BaseDatasetNumpyMixin,
+    BaseODDataset,
+    DataLocation,
+    NumpyArray,
+    NumpyObjectDetectionTransform,
+)
 from maite_datasets._fileio import _ensure_exists
-from maite_datasets._mixin._numpy import BaseDatasetNumpyMixin
-from maite_datasets._protocols import Transform
 
 
 class SeaDrone(
     BaseODDataset[
-        NDArray[np.number[Any]],
+        NumpyArray,
         list[tuple[list[int], list[list[float]]]],
         tuple[list[int], list[list[float]]],
     ],
@@ -313,7 +315,7 @@ class SeaDrone(
         self,
         root: str | Path,
         image_set: Literal["train", "val", "test", "base"] = "train",
-        transforms: Transform[NDArray[np.number[Any]]] | Sequence[Transform[NDArray[np.number[Any]]]] | None = None,
+        transforms: NumpyObjectDetectionTransform | Sequence[NumpyObjectDetectionTransform] | None = None,
         download: bool = False,
         verbose: bool = False,
     ) -> None:

maite_datasets/object_detection/_voc.py
@@ -4,24 +4,22 @@ __all__ = []
 
 import os
 import shutil
+from collections.abc import Sequence
 from pathlib import Path
-from typing import Any, Literal, Sequence, TypeVar
+from typing import Any, Literal, TypeVar
 
-import numpy as np
 from defusedxml.ElementTree import parse
-from numpy.typing import NDArray
 
 from maite_datasets._base import (
-    BaseDataset,
+    BaseDatasetNumpyMixin,
+    BaseDownloadedDataset,
     BaseODDataset,
     DataLocation,
+    NumpyArray,
+    NumpyObjectDetectionTransform,
+    ObjectDetectionTarget,
     _ensure_exists,
-    _TArray,
-    _TTarget,
 )
-from maite_datasets._mixin._numpy import BaseDatasetNumpyMixin
-from maite_datasets._protocols import Transform
-from maite_datasets._types import ObjectDetectionTarget
 
 VOCClassStringMap = Literal[
     "aeroplane",
@@ -48,7 +46,7 @@ VOCClassStringMap = Literal[
 TVOCClassMap = TypeVar("TVOCClassMap", VOCClassStringMap, int, list[VOCClassStringMap], list[int])
 
 
-class BaseVOCDataset(BaseDataset[_TArray, _TTarget, list[str], str]):
+class BaseVOCDataset(BaseDownloadedDataset[NumpyArray, ObjectDetectionTarget, list[str], str]):
     _resources = [
         DataLocation(
             url="https://data.brainchip.com/dataset-mirror/voc/VOCtrainval_11-May-2012.tar",
@@ -130,7 +128,7 @@ class BaseVOCDataset(BaseDataset[_TArray, _TTarget, list[str], str]):
         root: str | Path,
         image_set: Literal["train", "val", "test", "base"] = "train",
         year: Literal["2007", "2008", "2009", "2010", "2011", "2012"] = "2012",
-        transforms: Transform[_TArray] | Sequence[Transform[_TArray]] | None = None,
+        transforms: NumpyObjectDetectionTransform | Sequence[NumpyObjectDetectionTransform] | None = None,
         download: bool = False,
         verbose: bool = False,
     ) -> None:
@@ -432,8 +430,8 @@ class BaseVOCDataset(BaseDataset[_TArray, _TTarget, list[str], str]):
 
 
 class VOCDetection(
-    BaseVOCDataset[NDArray[np.number[Any]], ObjectDetectionTarget[NDArray[np.number[Any]]]],
-    BaseODDataset[NDArray[np.number[Any]], list[str], str],
+    BaseVOCDataset,
+    BaseODDataset[NumpyArray, list[str], str],
     BaseDatasetNumpyMixin,
 ):
     """

maite_datasets/{_reader → object_detection}/_yolo.py
@@ -7,14 +7,16 @@ __all__ = []
 from pathlib import Path
 from typing import Any
 
+import maite.protocols.object_detection as od
 import numpy as np
+from maite.protocols import DatasetMetadata, DatumMetadata
 from PIL import Image
 
-from maite_datasets._protocols import DatasetMetadata, DatumMetadata, ObjectDetectionDataset, ObjectDetectionDatum
-from maite_datasets._reader._base import _ObjectDetectionTarget, BaseDatasetReader
+from maite_datasets._base import BaseDataset, ObjectDetectionTarget
+from maite_datasets._reader import BaseDatasetReader
 
 
-class YOLODatasetReader(BaseDatasetReader):
+class YOLODatasetReader(BaseDatasetReader[od.Dataset]):
     """
     YOLO format dataset reader conforming to MAITE protocols.
 
@@ -120,9 +122,9 @@ class YOLODatasetReader(BaseDatasetReader):
         """Mapping from class index to class name."""
         return self._index2label
 
-    def _create_dataset_implementation(self) -> ObjectDetectionDataset:
+    def create_dataset(self) -> od.Dataset:
         """Create YOLO dataset implementation."""
-        return _YOLODataset(self)
+        return YOLODataset(self)
 
     def _validate_format_specific(self) -> tuple[list[str], dict[str, Any]]:
         """Validate YOLO format specific files and structure."""
@@ -200,7 +202,7 @@ class YOLODatasetReader(BaseDatasetReader):
         """Load class names from classes file."""
         with open(self._classes_path) as f:
             class_names = [line.strip() for line in f if line.strip()]
-        self._index2label = {idx: name for idx, name in enumerate(class_names)}
+        self._index2label = dict(enumerate(class_names))
 
     def _find_image_files(self) -> None:
         """Find all valid image files."""
@@ -213,32 +215,35 @@
             raise ValueError(f"No image files found in {self._images_path}")
 
 
-class _YOLODataset:
+class YOLODataset(BaseDataset):
     """Internal YOLO dataset implementation."""
 
     def __init__(self, reader: YOLODatasetReader) -> None:
-        self.reader = reader
-
-    @property
-    def metadata(self) -> DatasetMetadata:
-        return DatasetMetadata(
-            id=self.reader.dataset_id,
-            index2label=self.reader.index2label,
+        self._reader = reader
+
+        self.root = reader.dataset_path
+        self.images_path = reader._images_path
+        self.annotation_path = reader._labels_path
+        self.size = len(reader._image_files)
+        self.classes = reader.index2label
+        self.metadata = DatasetMetadata(
+            id=self._reader.dataset_id,
+            index2label=self._reader.index2label,
         )
 
     def __len__(self) -> int:
-        return len(self.reader._image_files)
+        return len(self._reader._image_files)
 
-    def __getitem__(self, index: int) -> ObjectDetectionDatum:
-        image_path = self.reader._image_files[index]
+    def __getitem__(self, index: int) -> tuple[od.InputType, od.ObjectDetectionTarget, DatumMetadata]:
+        image_path = self._reader._image_files[index]
 
         # Load image
-        image = np.array(Image.open(image_path).convert("RGB"))
+        image = np.asarray(Image.open(image_path).convert("RGB"), dtype=np.uint8)
         img_height, img_width = image.shape[:2]
         image = np.transpose(image, (2, 0, 1))  # Convert to CHW format
 
         # Load corresponding label file
-        label_path = self.reader._labels_path / f"{image_path.stem}.txt"
+        label_path = self._reader._labels_path / f"{image_path.stem}.txt"
 
         annotation_metadata = []
         if label_path.exists():
@@ -292,12 +297,12 @@
             labels = np.empty(0, dtype=np.int64)
             scores = np.empty(0, dtype=np.float32)
 
-        target = _ObjectDetectionTarget(boxes, labels, scores)
+        target = ObjectDetectionTarget(boxes, labels, scores)
 
         # Create comprehensive datum metadata
         datum_metadata = DatumMetadata(
             **{
-                "id": f"{self.reader.dataset_id}_{image_path.stem}",
+                "id": f"{self._reader.dataset_id}_{image_path.stem}",
                 # Image-level metadata
                 "file_name": image_path.name,
                 "file_path": str(image_path),

maite_datasets/protocols.py
@@ -0,0 +1,23 @@
+"""
+Common type protocols used for interoperability.
+"""
+
+from collections.abc import Iterator
+from typing import Any, Protocol, runtime_checkable
+
+
+@runtime_checkable
+class Array(Protocol):
+    """
+    Protocol for interoperable array objects.
+
+    Supports common array representations with popular libraries like
+    PyTorch, Tensorflow and JAX, as well as NumPy arrays.
+    """
+
+    @property
+    def shape(self) -> tuple[int, ...]: ...
+    def __array__(self) -> Any: ...
+    def __getitem__(self, key: Any, /) -> Any: ...
+    def __iter__(self) -> Iterator[Any]: ...
+    def __len__(self) -> int: ...
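
Because Array is runtime_checkable, isinstance checks test only for the presence of these five members, which is what lets NumPy arrays and Torch/TensorFlow/JAX tensors pass interchangeably. A quick demonstration with NumPy:

import numpy as np

from maite_datasets.protocols import Array

x = np.zeros((3, 32, 32))
# np.ndarray provides shape, __array__, __getitem__, __iter__, and __len__,
# so it satisfies the structural protocol at runtime.
assert isinstance(x, Array)
assert x.shape == (3, 32, 32)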

maite_datasets/wrappers/__init__.py
@@ -0,0 +1,8 @@
+import importlib.util
+
+__all__ = []
+
+if importlib.util.find_spec("torch") is not None and importlib.util.find_spec("torchvision") is not None:
+    from ._torch import TorchvisionWrapper
+
+    __all__ += ["TorchvisionWrapper"]
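
TorchvisionWrapper is only exported when both torch and torchvision resolve, so downstream code that treats Torch as optional can guard the import the same way. A defensive sketch; the wrapper's behavior lives in wrappers/_torch.py (+111 lines), which this diff does not show:

try:
    from maite_datasets.wrappers import TorchvisionWrapper
except ImportError:  # raised when torch/torchvision are absent and the name is not exported
    TorchvisionWrapper = None

if TorchvisionWrapper is not None:
    print("Torch-backed wrapping available")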