PyPI - careamics - Versions diffs - 0.0.19__py3-none-any.whl - Mend

careamics 0.0.19__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (279) hide show

careamics/__init__.py +24 -0
careamics/careamist.py +961 -0
careamics/cli/__init__.py +5 -0
careamics/cli/conf.py +394 -0
careamics/cli/main.py +234 -0
careamics/cli/utils.py +27 -0
careamics/config/__init__.py +66 -0
careamics/config/algorithms/__init__.py +21 -0
careamics/config/algorithms/care_algorithm_config.py +122 -0
careamics/config/algorithms/hdn_algorithm_config.py +103 -0
careamics/config/algorithms/microsplit_algorithm_config.py +103 -0
careamics/config/algorithms/n2n_algorithm_config.py +115 -0
careamics/config/algorithms/n2v_algorithm_config.py +296 -0
careamics/config/algorithms/pn2v_algorithm_config.py +301 -0
careamics/config/algorithms/unet_algorithm_config.py +91 -0
careamics/config/algorithms/vae_algorithm_config.py +178 -0
careamics/config/architectures/__init__.py +7 -0
careamics/config/architectures/architecture_config.py +37 -0
careamics/config/architectures/lvae_config.py +262 -0
careamics/config/architectures/unet_config.py +125 -0
careamics/config/configuration.py +367 -0
careamics/config/configuration_factories.py +2400 -0
careamics/config/data/__init__.py +27 -0
careamics/config/data/data_config.py +472 -0
careamics/config/data/inference_config.py +237 -0
careamics/config/data/ng_data_config.py +1038 -0
careamics/config/data/patch_filter/__init__.py +15 -0
careamics/config/data/patch_filter/filter_config.py +16 -0
careamics/config/data/patch_filter/mask_filter_config.py +17 -0
careamics/config/data/patch_filter/max_filter_config.py +15 -0
careamics/config/data/patch_filter/meanstd_filter_config.py +18 -0
careamics/config/data/patch_filter/shannon_filter_config.py +15 -0
careamics/config/data/patching_strategies/__init__.py +15 -0
careamics/config/data/patching_strategies/_overlapping_patched_config.py +102 -0
careamics/config/data/patching_strategies/_patched_config.py +56 -0
careamics/config/data/patching_strategies/random_patching_config.py +45 -0
careamics/config/data/patching_strategies/sequential_patching_config.py +25 -0
careamics/config/data/patching_strategies/tiled_patching_config.py +40 -0
careamics/config/data/patching_strategies/whole_patching_config.py +12 -0
careamics/config/data/tile_information.py +65 -0
careamics/config/lightning/__init__.py +15 -0
careamics/config/lightning/callbacks/__init__.py +8 -0
careamics/config/lightning/callbacks/callback_config.py +116 -0
careamics/config/lightning/optimizer_configs.py +186 -0
careamics/config/lightning/training_config.py +70 -0
careamics/config/losses/__init__.py +8 -0
careamics/config/losses/loss_config.py +60 -0
careamics/config/ng_configs/__init__.py +5 -0
careamics/config/ng_configs/n2v_configuration.py +64 -0
careamics/config/ng_configs/ng_configuration.py +256 -0
careamics/config/ng_factories/__init__.py +9 -0
careamics/config/ng_factories/algorithm_factory.py +120 -0
careamics/config/ng_factories/data_factory.py +154 -0
careamics/config/ng_factories/n2v_factory.py +256 -0
careamics/config/ng_factories/training_factory.py +69 -0
careamics/config/noise_model/__init__.py +12 -0
careamics/config/noise_model/likelihood_config.py +60 -0
careamics/config/noise_model/noise_model_config.py +149 -0
careamics/config/support/__init__.py +31 -0
careamics/config/support/supported_activations.py +27 -0
careamics/config/support/supported_algorithms.py +40 -0
careamics/config/support/supported_architectures.py +13 -0
careamics/config/support/supported_data.py +122 -0
careamics/config/support/supported_filters.py +17 -0
careamics/config/support/supported_loggers.py +10 -0
careamics/config/support/supported_losses.py +32 -0
careamics/config/support/supported_optimizers.py +57 -0
careamics/config/support/supported_patching_strategies.py +22 -0
careamics/config/support/supported_pixel_manipulations.py +15 -0
careamics/config/support/supported_struct_axis.py +21 -0
careamics/config/support/supported_transforms.py +12 -0
careamics/config/transformations/__init__.py +22 -0
careamics/config/transformations/n2v_manipulate_config.py +79 -0
careamics/config/transformations/normalize_config.py +59 -0
careamics/config/transformations/transform_config.py +45 -0
careamics/config/transformations/transform_unions.py +29 -0
careamics/config/transformations/xy_flip_config.py +43 -0
careamics/config/transformations/xy_random_rotate90_config.py +35 -0
careamics/config/utils/__init__.py +8 -0
careamics/config/utils/configuration_io.py +85 -0
careamics/config/validators/__init__.py +18 -0
careamics/config/validators/axes_validators.py +90 -0
careamics/config/validators/model_validators.py +84 -0
careamics/config/validators/patch_validators.py +55 -0
careamics/conftest.py +39 -0
careamics/dataset/__init__.py +17 -0
careamics/dataset/dataset_utils/__init__.py +19 -0
careamics/dataset/dataset_utils/dataset_utils.py +118 -0
careamics/dataset/dataset_utils/file_utils.py +141 -0
careamics/dataset/dataset_utils/iterate_over_files.py +84 -0
careamics/dataset/dataset_utils/running_stats.py +189 -0
careamics/dataset/in_memory_dataset.py +303 -0
careamics/dataset/in_memory_pred_dataset.py +88 -0
careamics/dataset/in_memory_tiled_pred_dataset.py +131 -0
careamics/dataset/iterable_dataset.py +294 -0
careamics/dataset/iterable_pred_dataset.py +121 -0
careamics/dataset/iterable_tiled_pred_dataset.py +141 -0
careamics/dataset/patching/__init__.py +1 -0
careamics/dataset/patching/patching.py +300 -0
careamics/dataset/patching/random_patching.py +110 -0
careamics/dataset/patching/sequential_patching.py +212 -0
careamics/dataset/patching/validate_patch_dimension.py +64 -0
careamics/dataset/tiling/__init__.py +10 -0
careamics/dataset/tiling/collate_tiles.py +33 -0
careamics/dataset/tiling/lvae_tiled_patching.py +375 -0
careamics/dataset/tiling/tiled_patching.py +166 -0
careamics/dataset_ng/README.md +212 -0
careamics/dataset_ng/__init__.py +0 -0
careamics/dataset_ng/dataset.py +365 -0
careamics/dataset_ng/demos/bsd68_demo.ipynb +361 -0
careamics/dataset_ng/demos/bsd68_zarr_demo.ipynb +453 -0
careamics/dataset_ng/demos/care_U2OS_demo.ipynb +330 -0
careamics/dataset_ng/demos/demo_custom_image_stack.ipynb +736 -0
careamics/dataset_ng/demos/demo_datamodule.ipynb +447 -0
careamics/dataset_ng/demos/demo_dataset.ipynb +278 -0
careamics/dataset_ng/demos/demo_patch_extractor.py +51 -0
careamics/dataset_ng/demos/mouse_nuclei_demo.ipynb +293 -0
careamics/dataset_ng/factory.py +180 -0
careamics/dataset_ng/grouped_index_sampler.py +73 -0
careamics/dataset_ng/image_stack/__init__.py +14 -0
careamics/dataset_ng/image_stack/czi_image_stack.py +396 -0
careamics/dataset_ng/image_stack/file_image_stack.py +140 -0
careamics/dataset_ng/image_stack/image_stack_protocol.py +93 -0
careamics/dataset_ng/image_stack/image_utils/__init__.py +6 -0
careamics/dataset_ng/image_stack/image_utils/image_stack_utils.py +125 -0
careamics/dataset_ng/image_stack/in_memory_image_stack.py +93 -0
careamics/dataset_ng/image_stack/zarr_image_stack.py +170 -0
careamics/dataset_ng/image_stack_loader/__init__.py +19 -0
careamics/dataset_ng/image_stack_loader/image_stack_loader_protocol.py +70 -0
careamics/dataset_ng/image_stack_loader/image_stack_loaders.py +273 -0
careamics/dataset_ng/image_stack_loader/zarr_utils.py +130 -0
careamics/dataset_ng/legacy_interoperability.py +175 -0
careamics/dataset_ng/microsplit_input_synth.py +377 -0
careamics/dataset_ng/patch_extractor/__init__.py +7 -0
careamics/dataset_ng/patch_extractor/limit_file_extractor.py +50 -0
careamics/dataset_ng/patch_extractor/patch_construction.py +151 -0
careamics/dataset_ng/patch_extractor/patch_extractor.py +117 -0
careamics/dataset_ng/patch_filter/__init__.py +20 -0
careamics/dataset_ng/patch_filter/coordinate_filter_protocol.py +27 -0
careamics/dataset_ng/patch_filter/filter_factory.py +95 -0
careamics/dataset_ng/patch_filter/mask_filter.py +96 -0
careamics/dataset_ng/patch_filter/max_filter.py +188 -0
careamics/dataset_ng/patch_filter/mean_std_filter.py +218 -0
careamics/dataset_ng/patch_filter/patch_filter_protocol.py +50 -0
careamics/dataset_ng/patch_filter/shannon_filter.py +188 -0
careamics/dataset_ng/patching_strategies/__init__.py +26 -0
careamics/dataset_ng/patching_strategies/patching_strategy_factory.py +50 -0
careamics/dataset_ng/patching_strategies/patching_strategy_protocol.py +161 -0
careamics/dataset_ng/patching_strategies/random_patching.py +393 -0
careamics/dataset_ng/patching_strategies/sequential_patching.py +99 -0
careamics/dataset_ng/patching_strategies/tiling_strategy.py +207 -0
careamics/dataset_ng/patching_strategies/whole_sample.py +61 -0
careamics/file_io/__init__.py +15 -0
careamics/file_io/read/__init__.py +11 -0
careamics/file_io/read/get_func.py +57 -0
careamics/file_io/read/tiff.py +58 -0
careamics/file_io/write/__init__.py +15 -0
careamics/file_io/write/get_func.py +63 -0
careamics/file_io/write/tiff.py +40 -0
careamics/lightning/__init__.py +32 -0
careamics/lightning/callbacks/__init__.py +13 -0
careamics/lightning/callbacks/data_stats_callback.py +33 -0
careamics/lightning/callbacks/hyperparameters_callback.py +49 -0
careamics/lightning/callbacks/prediction_writer_callback/__init__.py +20 -0
careamics/lightning/callbacks/prediction_writer_callback/file_path_utils.py +56 -0
careamics/lightning/callbacks/prediction_writer_callback/prediction_writer_callback.py +234 -0
careamics/lightning/callbacks/prediction_writer_callback/write_strategy.py +399 -0
careamics/lightning/callbacks/prediction_writer_callback/write_strategy_factory.py +215 -0
careamics/lightning/callbacks/progress_bar_callback.py +90 -0
careamics/lightning/dataset_ng/__init__.py +1 -0
careamics/lightning/dataset_ng/callbacks/__init__.py +1 -0
careamics/lightning/dataset_ng/callbacks/prediction_writer/__init__.py +29 -0
careamics/lightning/dataset_ng/callbacks/prediction_writer/cached_tiles_strategy.py +164 -0
careamics/lightning/dataset_ng/callbacks/prediction_writer/file_path_utils.py +33 -0
careamics/lightning/dataset_ng/callbacks/prediction_writer/prediction_writer_callback.py +219 -0
careamics/lightning/dataset_ng/callbacks/prediction_writer/write_image_strategy.py +91 -0
careamics/lightning/dataset_ng/callbacks/prediction_writer/write_strategy.py +27 -0
careamics/lightning/dataset_ng/callbacks/prediction_writer/write_strategy_factory.py +214 -0
careamics/lightning/dataset_ng/callbacks/prediction_writer/write_tiles_zarr_strategy.py +375 -0
careamics/lightning/dataset_ng/data_module.py +529 -0
careamics/lightning/dataset_ng/data_module_utils.py +395 -0
careamics/lightning/dataset_ng/lightning_modules/__init__.py +9 -0
careamics/lightning/dataset_ng/lightning_modules/care_module.py +97 -0
careamics/lightning/dataset_ng/lightning_modules/n2v_module.py +106 -0
careamics/lightning/dataset_ng/lightning_modules/unet_module.py +221 -0
careamics/lightning/dataset_ng/prediction/__init__.py +16 -0
careamics/lightning/dataset_ng/prediction/convert_prediction.py +198 -0
careamics/lightning/dataset_ng/prediction/stitch_prediction.py +171 -0
careamics/lightning/lightning_module.py +914 -0
careamics/lightning/microsplit_data_module.py +632 -0
careamics/lightning/predict_data_module.py +341 -0
careamics/lightning/train_data_module.py +666 -0
careamics/losses/__init__.py +21 -0
careamics/losses/fcn/__init__.py +1 -0
careamics/losses/fcn/losses.py +125 -0
careamics/losses/loss_factory.py +80 -0
careamics/losses/lvae/__init__.py +1 -0
careamics/losses/lvae/loss_utils.py +83 -0
careamics/losses/lvae/losses.py +589 -0
careamics/lvae_training/__init__.py +0 -0
careamics/lvae_training/calibration.py +191 -0
careamics/lvae_training/dataset/__init__.py +20 -0
careamics/lvae_training/dataset/config.py +135 -0
careamics/lvae_training/dataset/lc_dataset.py +274 -0
careamics/lvae_training/dataset/ms_dataset_ref.py +1067 -0
careamics/lvae_training/dataset/multich_dataset.py +1121 -0
careamics/lvae_training/dataset/multicrop_dset.py +196 -0
careamics/lvae_training/dataset/multifile_dataset.py +335 -0
careamics/lvae_training/dataset/types.py +32 -0
careamics/lvae_training/dataset/utils/__init__.py +0 -0
careamics/lvae_training/dataset/utils/data_utils.py +114 -0
careamics/lvae_training/dataset/utils/empty_patch_fetcher.py +65 -0
careamics/lvae_training/dataset/utils/index_manager.py +491 -0
careamics/lvae_training/dataset/utils/index_switcher.py +165 -0
careamics/lvae_training/eval_utils.py +987 -0
careamics/lvae_training/get_config.py +84 -0
careamics/lvae_training/lightning_module.py +701 -0
careamics/lvae_training/metrics.py +214 -0
careamics/lvae_training/train_lvae.py +342 -0
careamics/lvae_training/train_utils.py +121 -0
careamics/model_io/__init__.py +7 -0
careamics/model_io/bioimage/__init__.py +11 -0
careamics/model_io/bioimage/_readme_factory.py +113 -0
careamics/model_io/bioimage/bioimage_utils.py +56 -0
careamics/model_io/bioimage/cover_factory.py +171 -0
careamics/model_io/bioimage/model_description.py +341 -0
careamics/model_io/bmz_io.py +251 -0
careamics/model_io/model_io_utils.py +95 -0
careamics/models/__init__.py +5 -0
careamics/models/activation.py +40 -0
careamics/models/layers.py +495 -0
careamics/models/lvae/__init__.py +3 -0
careamics/models/lvae/layers.py +1371 -0
careamics/models/lvae/likelihoods.py +394 -0
careamics/models/lvae/lvae.py +848 -0
careamics/models/lvae/noise_models.py +738 -0
careamics/models/lvae/stochastic.py +394 -0
careamics/models/lvae/utils.py +404 -0
careamics/models/model_factory.py +54 -0
careamics/models/unet.py +449 -0
careamics/nm_training_placeholder.py +203 -0
careamics/prediction_utils/__init__.py +21 -0
careamics/prediction_utils/lvae_prediction.py +158 -0
careamics/prediction_utils/lvae_tiling_manager.py +362 -0
careamics/prediction_utils/prediction_outputs.py +238 -0
careamics/prediction_utils/stitch_prediction.py +193 -0
careamics/py.typed +5 -0
careamics/transforms/__init__.py +22 -0
careamics/transforms/compose.py +173 -0
careamics/transforms/n2v_manipulate.py +150 -0
careamics/transforms/n2v_manipulate_torch.py +149 -0
careamics/transforms/normalize.py +374 -0
careamics/transforms/pixel_manipulation.py +406 -0
careamics/transforms/pixel_manipulation_torch.py +388 -0
careamics/transforms/struct_mask_parameters.py +20 -0
careamics/transforms/transform.py +24 -0
careamics/transforms/tta.py +88 -0
careamics/transforms/xy_flip.py +131 -0
careamics/transforms/xy_random_rotate90.py +108 -0
careamics/utils/__init__.py +19 -0
careamics/utils/autocorrelation.py +40 -0
careamics/utils/base_enum.py +60 -0
careamics/utils/context.py +67 -0
careamics/utils/deprecation.py +63 -0
careamics/utils/lightning_utils.py +71 -0
careamics/utils/logging.py +323 -0
careamics/utils/metrics.py +394 -0
careamics/utils/path_utils.py +26 -0
careamics/utils/plotting.py +76 -0
careamics/utils/ram.py +15 -0
careamics/utils/receptive_field.py +108 -0
careamics/utils/serializers.py +62 -0
careamics/utils/torch_utils.py +150 -0
careamics/utils/version.py +38 -0
careamics-0.0.19.dist-info/METADATA +80 -0
careamics-0.0.19.dist-info/RECORD +279 -0
careamics-0.0.19.dist-info/WHEEL +4 -0
careamics-0.0.19.dist-info/entry_points.txt +2 -0
careamics-0.0.19.dist-info/licenses/LICENSE +28 -0

careamics/dataset_ng/patching_strategies/random_patching.py ADDED Viewed

@@ -0,0 +1,393 @@
+"""A module for random patching strategies."""
+from collections.abc import Sequence
+import numpy as np
+from .patching_strategy_protocol import PatchSpecs
+class RandomPatchingStrategy:
+    """
+    A patching strategy for sampling random patches; it implements the
+    `PatchingStrategy` `Protocol`.
+    The output of `get_patch_spec` will be random, i.e. if the same index is given
+    twice the two outputs can be different.
+    However, the strategy still ensures that there will be a known number of patches
+    for each sample in each image stack. This is achieved through defining a set of
+    bins that map to each sample in each image stack. Whichever bin an `index` passed
+    to `get_patch_spec` falls into determines the `"data_idx"` and `"sample_idx"` in
+    the returned `PatchSpecs`, but the `"coords"` will be random.
+    The number of patches in each sample is based on the number of patches that would
+    fit if they were sampled sequentially, non-overlapping, and covering the entire
+    array.
+    """
+    def __init__(
+        self,
+        data_shapes: Sequence[Sequence[int]],
+        patch_size: Sequence[int],
+        seed: int | None = None,
+    ):
+        """
+        A patching strategy for sampling random patches.
+        Parameters
+        ----------
+        data_shapes : sequence of (sequence of int)
+            The shapes of the underlying data. Each element is the dimension of the
+            axes SC(Z)YX; the first entry is used as the number of samples and the
+            entries from index 2 onwards as the spatial shape.
+        patch_size : sequence of int
+            The size of the patch. The sequence will have length 2 or 3, for 2D and 3D
+            data respectively.
+        seed : int, optional
+            An optional seed to ensure the reproducibility of the random patches.
+        """
+        # one generator is shared by every `get_patch_spec` call
+        self.rng = np.random.default_rng(seed=seed)
+        self.patch_size = patch_size
+        self.data_shapes = data_shapes
+        # these bins determine which image stack and sample a patch comes from:
+        # - image_stack_cumulative_patches maps a patch index to an image stack
+        # - sample_cumulative_patches maps a patch index to a sample
+        # - image_stack_cumulative_samples maps a sample index to an image stack
+        (
+            self.image_stack_cumulative_patches,
+            self.sample_cumulative_patches,
+            self.image_stack_cumulative_samples,
+        ) = self._calc_bins(self.data_shapes, self.patch_size)
+    @property
+    def n_patches(self) -> int:
+        """
+        The number of patches that this patching strategy will return.
+        Indices greater than or equal to this value are rejected by `get_patch_spec`.
+        """
+        # last bin boundary will be total patches
+        # NOTE(review): the bins are built with `np.cumsum`, so this value is a NumPy
+        #   integer scalar rather than a builtin `int`.
+        return self.image_stack_cumulative_patches[-1]
+    def get_patch_spec(self, index: int) -> PatchSpecs:
+        """Return the patch specs for a given index.
+        The `"data_idx"` and `"sample_idx"` are determined by `index`, the `"coords"`
+        are drawn at random on every call.
+        Parameters
+        ----------
+        index : int
+            A patch index.
+        Returns
+        -------
+        PatchSpecs
+            A dictionary that specifies a single patch in a series of `ImageStacks`.
+        Raises
+        ------
+        IndexError
+            If `index` is greater than or equal to `n_patches`.
+        """
+        # TODO: break into smaller testable functions?
+        # NOTE(review): only the upper bound is checked; a negative index is not
+        #   rejected and `np.digitize` will place it in the first bin.
+        if index >= self.n_patches:
+            raise IndexError(
+                f"Index {index} out of bounds for RandomPatchingStrategy with number "
+                f"of patches {self.n_patches}"
+            )
+        # digitize returns the bin that `index` belongs to; the bin boundaries are
+        #   cumulative counts, so an index equal to a boundary falls in the next bin
+        data_index = np.digitize(index, bins=self.image_stack_cumulative_patches).item()
+        # maps to a particular sample within the whole series of image stacks
+        #   (not just a single image stack)
+        total_samples_index = np.digitize(
+            index, bins=self.sample_cumulative_patches
+        ).item()
+        data_shape = self.data_shapes[data_index]
+        # drop the first two axes (S and C) to keep only the spatial axes
+        spatial_shape = data_shape[2:]
+        # calculate sample index relative to image stack:
+        #   subtract the total number of samples in the previous image stacks
+        if data_index == 0:
+            n_previous_samples = 0
+        else:
+            n_previous_samples = self.image_stack_cumulative_samples[data_index - 1]
+        sample_index = total_samples_index - n_previous_samples
+        coords = _generate_random_coords(spatial_shape, self.patch_size, self.rng)
+        return {
+            "data_idx": data_index,
+            "sample_idx": sample_index,
+            "coords": coords,
+            "patch_size": self.patch_size,
+        }
+    # Note: this is used by the FileIterSampler
+    def get_patch_indices(self, data_idx: int) -> Sequence[int]:
+        """
+        Get the patch indices that will return patches for a specific `image_stack`.
+        The `image_stack` corresponds to the given `data_idx`.
+        Parameters
+        ----------
+        data_idx : int
+            An index that corresponds to a given `image_stack`.
+        Returns
+        -------
+        sequence of int
+            A sequence of patch indices that, when used to index the
+            `CAREamicsDataset`, will return a patch that comes from the `image_stack`
+            corresponding to the given `data_idx`.
+        """
+        # return all the values in the corresponding bin: from the previous bin
+        #   boundary (or 0 for the first image stack) up to, but excluding, this one
+        if data_idx == 0:
+            start = 0
+        else:
+            start = self.image_stack_cumulative_patches[data_idx - 1]
+        return np.arange(start, self.image_stack_cumulative_patches[data_idx]).tolist()
+    @staticmethod
+    def _calc_bins(
+        data_shapes: Sequence[Sequence[int]], patch_size: Sequence[int]
+    ) -> tuple[tuple[int, ...], tuple[int, ...], tuple[int, ...]]:
+        """Calculate bins used to map an index to an image_stack and a sample.
+        The number of patches in each sample is based on the number of patches that
+        would fit if they were sampled sequentially.
+        Parameters
+        ----------
+        data_shapes : sequence of (sequence of int)
+            The shapes of the underlying data. Each element is the dimension of the
+            axes SC(Z)YX.
+        patch_size : sequence of int
+            The size of the patch. The sequence will have length 2 or 3, for 2D and 3D
+            data respectively.
+        Returns
+        -------
+        image_stack_cumulative_patches: tuple of int
+            The bins that map a patch index to an image stack. E.g. if a patch index
+            falls below the first bin boundary it belongs to the first image stack, if
+            a patch index falls between the first bin boundary and the second bin
+            boundary it belongs to the second image stack, and so on.
+        sample_cumulative_patches: tuple of int
+            The bins that map a patch index to a sample. E.g. if a patch index
+            falls below the first bin boundary it belongs to the first sample, if
+            a patch index falls between the first bin boundary and the second bin
+            boundary it belongs to the second sample, and so on.
+        image_stack_cumulative_samples: tuple of int
+            The bins that map a sample index to an image stack. E.g. if a sample index
+            falls below the first bin boundary it belongs to the first image stack, if
+            a sample index falls between the first bin boundary and the second bin
+            boundary it belongs to the second image stack, and so on.
+        """
+        patches_per_image_stack: list[int] = []
+        patches_per_sample: list[int] = []
+        samples_per_image_stack: list[int] = []
+        for data_shape in data_shapes:
+            spatial_shape = data_shape[2:]
+            # every sample in an image stack has the same spatial shape, so the
+            #   per-sample patch count is computed once per image stack
+            n_single_sample_patches = _calc_n_patches(spatial_shape, patch_size)
+            # multiply by number of samples in image_stack
+            patches_per_image_stack.append(n_single_sample_patches * data_shape[0])
+            # one entry per sample, each equal to `n_single_sample_patches`
+            patches_per_sample.extend([n_single_sample_patches] * data_shape[0])
+            # number of samples in each image stack
+            samples_per_image_stack.append(data_shape[0])
+        # cumulative sum creates the bins
+        image_stack_cumulative_patches = np.cumsum(patches_per_image_stack)
+        sample_cumulative_patches = np.cumsum(patches_per_sample)
+        image_stack_cumulative_samples = np.cumsum(samples_per_image_stack)
+        # NOTE(review): converting the arrays with `tuple` keeps NumPy integer
+        #   scalars as the elements, not builtin `int`s.
+        return (
+            tuple(image_stack_cumulative_patches),
+            tuple(sample_cumulative_patches),
+            tuple(image_stack_cumulative_samples),
+        )
+class FixedRandomPatchingStrategy:
+    """
+    A patching strategy for sampling random patches; it implements the
+    `PatchingStrategy` `Protocol`.
+    The output of `get_patch_spec` will be deterministic, i.e. if the same index is
+    given twice the two outputs will be the same. This is because all the random
+    patches are generated once, at initialisation, and stored.
+    The number of patches in each sample is based on the number of patches that would
+    fit if they were sampled sequentially, non-overlapping, and covering the entire
+    array.
+    """
+    def __init__(
+        self,
+        data_shapes: Sequence[Sequence[int]],
+        patch_size: Sequence[int],
+        seed: int | None = None,
+    ):
+        """A patching strategy for sampling random patches.
+        Parameters
+        ----------
+        data_shapes : sequence of (sequence of int)
+            The shapes of the underlying data. Each element is the dimension of the
+            axes SC(Z)YX.
+        patch_size : sequence of int
+            The size of the patch. The sequence will have length 2 or 3, for 2D and 3D
+            data respectively.
+        seed : int, optional
+            An optional seed to ensure the reproducibility of the random patches.
+        """
+        self.rng = np.random.default_rng(seed=seed)
+        self.patch_size = patch_size
+        self.data_shapes = data_shapes
+        # simply generate all the patches at initialisation, so they will be fixed
+        # the specs are appended image stack by image stack, then sample by sample,
+        #   so the list position is the patch index
+        self.fixed_patch_specs: list[PatchSpecs] = []
+        for data_idx, data_shape in enumerate(self.data_shapes):
+            # drop the first two axes (S and C) to keep only the spatial axes
+            spatial_shape = data_shape[2:]
+            n_patches = _calc_n_patches(spatial_shape, self.patch_size)
+            # the first axis is the number of samples in the image stack
+            for sample_idx in range(data_shape[0]):
+                for _ in range(n_patches):
+                    random_coords = _generate_random_coords(
+                        spatial_shape, self.patch_size, self.rng
+                    )
+                    patch_specs: PatchSpecs = {
+                        "data_idx": data_idx,
+                        "sample_idx": sample_idx,
+                        "coords": random_coords,
+                        "patch_size": self.patch_size,
+                    }
+                    self.fixed_patch_specs.append(patch_specs)
+    @property
+    def n_patches(self):
+        """
+        The number of patches that this patching strategy will return.
+        Indices greater than or equal to this value are rejected by `get_patch_spec`.
+        """
+        return len(self.fixed_patch_specs)
+    def get_patch_spec(self, index: int) -> PatchSpecs:
+        """Return the patch specs for a given index.
+        Parameters
+        ----------
+        index : int
+            A patch index.
+        Returns
+        -------
+        PatchSpecs
+            A dictionary that specifies a single patch in a series of `ImageStacks`.
+        Raises
+        ------
+        IndexError
+            If `index` is greater than or equal to `n_patches`.
+        """
+        # NOTE(review): only the upper bound is checked explicitly; a negative index
+        #   falls through to the list indexing below.
+        if index >= self.n_patches:
+            raise IndexError(
+                f"Index {index} out of bounds for FixedRandomPatchingStrategy with "
+                f"number of patches, {self.n_patches}"
+            )
+        # simply index the pre-generated patches to get the correct patch
+        return self.fixed_patch_specs[index]
+    # Note: this is used by the FileIterSampler
+    def get_patch_indices(self, data_idx: int) -> Sequence[int]:
+        """
+        Get the patch indices that will return patches for a specific `image_stack`.
+        The `image_stack` corresponds to the given `data_idx`.
+        Parameters
+        ----------
+        data_idx : int
+            An index that corresponds to a given `image_stack`.
+        Returns
+        -------
+        sequence of int
+            A sequence of patch indices that, when used to index the
+            `CAREamicsDataset`, will return a patch that comes from the `image_stack`
+            corresponding to the given `data_idx`.
+        """
+        # scan every stored patch spec and keep the positions that belong to the
+        #   requested image stack
+        return [
+            i
+            for i, patch_spec in enumerate(self.fixed_patch_specs)
+            if patch_spec["data_idx"] == data_idx
+        ]
+def _generate_random_coords(
+    spatial_shape: Sequence[int], patch_size: Sequence[int], rng: np.random.Generator
+) -> tuple[int, ...]:
+    """Generate random patch coordinates for a given `spatial_shape` and `patch_size`.
+    The coords are the top-left (and first z-slice for 3D data) of a patch. The
+    sequence will have length 2 or 3, for 2D and 3D data respectively.
+    Along each axis the coordinate is drawn between 0 and `spatial_shape - patch_size`
+    (inclusive); if the patch is larger than the axis, the coordinate is 0.
+    Parameters
+    ----------
+    spatial_shape : sequence of int
+        The dimension of the axes (Z)YX, a sequence of length 2 or 3, for 2D and 3D
+        data respectively.
+    patch_size : sequence of int
+        The size of the patch. The sequence will have length 2 or 3, for 2D and 3D
+        data respectively.
+    rng : numpy.random.Generator
+        A numpy generator to ensure the reproducibility of the random patches.
+    Returns
+    -------
+    coords: tuple of int
+        The top-left (and first z-slice for 3D data) coords of a patch. The tuple will
+        have length 2 or 3, for 2D and 3D data respectively.
+    Raises
+    ------
+    ValueError
+        Raises if the number of spatial dimensions do not match the number of patch
+        dimensions.
+    """
+    if len(patch_size) != len(spatial_shape):
+        raise ValueError(
+            f"Number of patch dimension {len(patch_size)}, do not match the number of "
+            f"spatial dimensions {len(spatial_shape)}, for `patch_size={patch_size}` "
+            f"and `spatial_shape={spatial_shape}`."
+        )
+    # lower bound: 0 on every axis
+    # upper bound: the last start position at which a patch still fits; clipped to 0
+    #   so the bound does not go negative when the patch is larger than the axis
+    # `endpoint=True` makes the upper bound inclusive
+    return tuple(
+        rng.integers(
+            np.zeros(len(patch_size), dtype=int),
+            np.clip(np.array(spatial_shape) - np.array(patch_size), 0, None),
+            endpoint=True,
+            dtype=int,
+        ).tolist()
+    )
+def _calc_n_patches(spatial_shape: Sequence[int], patch_size: Sequence[int]) -> int:
+    """
+    Calculate the number of patches for a given `spatial_shape` and `patch_size`.
+    This is based on the number of patches that would fit if they were sampled
+    sequentially. The count along each axis is rounded up, so a partially covered
+    patch at the end of an axis is counted as a whole patch.
+    Parameters
+    ----------
+    spatial_shape : sequence of int
+        The dimension of the axes (Z)YX, a sequence of length 2 or 3, for 2D and 3D
+        data respectively.
+    patch_size : sequence of int
+        The size of the patch. The sequence will have length 2 or 3, for 2D and 3D
+        data respectively.
+    Returns
+    -------
+    int
+        The number of patches.
+    Raises
+    ------
+    ValueError
+        Raises if the number of spatial dimensions do not match the number of patch
+        dimensions.
+    """
+    if len(patch_size) != len(spatial_shape):
+        raise ValueError(
+            f"Number of patch dimension {len(patch_size)}, do not match the number of "
+            f"spatial dimensions {len(spatial_shape)}, for `patch_size={patch_size}` "
+            f"and `spatial_shape={spatial_shape}`."
+        )
+    # the lengths were checked above, so `zip` pairs every axis with its patch size
+    # NOTE(review): the ceiling is computed in floating point (`s / p`, then
+    #   `np.ceil`), and a zero in `patch_size` is not validated here.
+    patches_per_dim = [
+        np.ceil(s / p) for s, p in zip(spatial_shape, patch_size, strict=False)
+    ]
+    # the total is the product of the per-axis counts
+    total_patches = int(np.prod(patches_per_dim))
+    return total_patches

careamics/dataset_ng/patching_strategies/sequential_patching.py ADDED Viewed

@@ -0,0 +1,99 @@
+import itertools
+from collections.abc import Sequence
+import numpy as np
+from typing_extensions import ParamSpec
+from .patching_strategy_protocol import PatchSpecs
+P = ParamSpec("P")
+# TODO: this is an unfinished prototype based on current tiling implementation
+#  not guaranteed to work!
class SequentialPatchingStrategy:
    """
    Patching strategy that places patches on a regular grid.

    Along every spatial axis patches start at multiples of `patch_size - overlap`.
    If the last grid patch does not reach the end of the axis, one extra patch
    that ends exactly at the end of the axis is added. The same grid is used for
    every sample of an image stack.

    This class is still a prototype.
    """

    def __init__(
        self,
        data_shapes: Sequence[Sequence[int]],
        patch_size: Sequence[int],
        overlaps: Sequence[int] | None = None,
    ):
        """
        Build the patch specifications for all the given data shapes.

        Parameters
        ----------
        data_shapes : sequence of (sequence of int)
            The shapes of the underlying data. The first entry of each shape is
            used as the number of samples and the last `len(patch_size)` entries
            as the spatial shape.
        patch_size : sequence of int
            The size of the patch in each spatial dimension.
        overlaps : sequence of int, optional
            How much adjacent patches overlap in each spatial dimension. If `None`,
            patches do not overlap.

        Raises
        ------
        ValueError
            If an overlap is not smaller than the corresponding patch size, or if
            a spatial axis is smaller than the patch size.
        """
        self.data_shapes = data_shapes
        self.patch_size = patch_size
        if overlaps is None:
            overlaps = [0] * len(patch_size)
        self.overlaps = np.asarray(overlaps)
        self.patch_specs: list[PatchSpecs] = self._initialize_patch_specs()

    @property
    def n_patches(self) -> int:
        """
        The number of patches that this patching strategy will return.

        It also determines the maximum index that can be given to `get_patch_spec`.
        """
        return len(self.patch_specs)

    def get_patch_spec(self, index: int) -> PatchSpecs:
        """
        Return the patch specs for a given index.

        Parameters
        ----------
        index : int
            A patch index.

        Returns
        -------
        PatchSpecs
            The specification of the patch stored at `index`.
        """
        return self.patch_specs[index]

    # Note: this is used by the FileIterSampler
    def get_patch_indices(self, data_idx: int) -> Sequence[int]:
        """
        Get the patch indices will return patches for a specific `image_stack`.

        The `image_stack` corresponds to the given `data_idx`.

        Parameters
        ----------
        data_idx : int
            An index that corresponds to a given `image_stack`.

        Returns
        -------
        sequence of int
            A sequence of patch indices, that when used to index the
            `CAREamicsDataset` will return a patch that comes from the
            `image_stack` corresponding to the given `data_idx`.
        """
        return [
            i
            for i, patch_spec in enumerate(self.patch_specs)
            if patch_spec["data_idx"] == data_idx
        ]

    def _compute_coords_1d(
        self, patch_size: int, spatial_shape: int, overlap: int
    ) -> list[tuple[int, int]]:
        """
        Compute the `(start, end)` coordinates of the patches along a single axis.

        Parameters
        ----------
        patch_size : int
            The size of the patch along the axis.
        spatial_shape : int
            The size of the axis.
        overlap : int
            The overlap between adjacent patches along the axis.

        Returns
        -------
        list of (int, int)
            The start (inclusive) and end (exclusive) coordinate of each patch.

        Raises
        ------
        ValueError
            If `overlap` is not smaller than `patch_size`, or if the axis is
            smaller than the patch.
        """
        # Overlaps are stored in a numpy array; cast so that the returned
        # coordinates are plain Python ints rather than a mix of int and np.int64.
        patch_size = int(patch_size)
        spatial_shape = int(spatial_shape)
        overlap = int(overlap)

        step = patch_size - overlap
        if step <= 0:
            # A non-positive step would never advance along the axis.
            raise ValueError(
                f"Overlap ({overlap}) must be smaller than the patch size "
                f"({patch_size})."
            )
        if spatial_shape < patch_size:
            raise ValueError(
                f"Patch size ({patch_size}) is larger than the size of the axis "
                f"({spatial_shape})."
            )

        last_start = spatial_shape - patch_size
        crop_coords = [
            (start, start + patch_size) for start in range(0, last_start + 1, step)
        ]
        # Add a final patch flush with the end of the axis if the grid falls short.
        if crop_coords[-1][1] < spatial_shape:
            crop_coords.append((last_start, spatial_shape))
        return crop_coords

    def _initialize_patch_specs(self) -> list[PatchSpecs]:
        """
        Create the patch specifications for every sample of every data shape.

        Returns
        -------
        list of PatchSpecs
            One entry per patch, ordered by data index, then sample index, then
            grid position.
        """
        n_spatial_dims = len(self.patch_size)
        patch_specs: list[PatchSpecs] = []
        for data_idx, data_shape in enumerate(self.data_shapes):
            data_spatial_shape = data_shape[-n_spatial_dims:]
            coords_per_axis = [
                self._compute_coords_1d(
                    self.patch_size[axis],
                    data_spatial_shape[axis],
                    self.overlaps[axis],
                )
                for axis in range(n_spatial_dims)
            ]
            # The grid is identical for every sample, so build it once; only the
            # start coordinate of each (start, end) pair is stored in the specs.
            grid = [
                tuple(start for start, _ in crop_coord)
                for crop_coord in itertools.product(*coords_per_axis)
            ]
            for sample_idx in range(data_shape[0]):
                for coords in grid:
                    patch_specs.append(
                        PatchSpecs(
                            data_idx=data_idx,
                            sample_idx=sample_idx,
                            coords=coords,
                            patch_size=self.patch_size,
                        )
                    )
        return patch_specs

careamics/dataset_ng/patching_strategies/tiling_strategy.py ADDED Viewed

@@ -0,0 +1,207 @@
+"""Module for the `TilingStrategy` class."""
+import itertools
+from collections.abc import Sequence
+from math import prod
+from .patching_strategy_protocol import TileSpecs
+class TilingStrategy:
+    """
+    The tiling strategy should be used for prediction. The `get_patch_specs`
+    method returns `TileSpec` dictionaries that contains information on how to
+    stitch the tiles back together to create the full image.
+    """
+    def __init__(
+        self,
+        data_shapes: Sequence[Sequence[int]],
+        patch_size: Sequence[int],
+        overlaps: Sequence[int],
+    ):
+        """
+        The tiling strategy should be used for prediction. The `get_patch_specs`
+        method returns `TileSpec` dictionaries that contains information on how to
+        stitch the tiles back together to create the full image.
+        Parameters
+        ----------
+        data_shapes : sequence of (sequence of int)
+            The shapes of the underlying data. Each element is the dimension of the
+            axes SC(Z)YX.
+        patch_size : sequence of int
+            The size of the tile. The sequence will have length 2 or 3, for 2D and 3D
+            data respectively.
+        overlaps : sequence of int
+            How much a tile will overlap with adjacent tiles in each spatial dimension.
+        """
+        self.data_shapes = data_shapes
+        self.patch_size = patch_size
+        self.overlaps = overlaps
+        # patch_size and overlap should have same length validated in pydantic configs
+        self.tile_specs: list[TileSpecs] = self._generate_specs()
+    @property
+    def n_patches(self) -> int:
+        """
+        The number of patches that this patching strategy will return.
+        It also determines the maximum index that can be given to `get_patch_spec`.
+        """
+        return len(self.tile_specs)
+    def get_patch_spec(self, index: int) -> TileSpecs:
+        """Return the tile specs for a given index.
+        Parameters
+        ----------
+        index : int
+            A patch index.
+        Returns
+        -------
+        TileSpecs
+            A dictionary that specifies a single patch in a series of `ImageStacks`.
+        """
+        return self.tile_specs[index]
+    # Note: this is used by the FileIterSampler
+    def get_patch_indices(self, data_idx: int) -> Sequence[int]:
+        """
+        Get the patch indices will return patches for a specific `image_stack`.
+        The `image_stack` corresponds to the given `data_idx`.
+        Parameters
+        ----------
+        data_idx : int
+            An index that corresponds to a given `image_stack`.
+        Returns
+        -------
+        sequence of int
+            A sequence of patch indices, that when used to index the `CAREamicsDataset
+            will return a patch that comes from the `image_stack` corresponding to the
+            given `data_idx`.
+        """
+        return [
+            i
+            for i, patch_spec in enumerate(self.tile_specs)
+            if patch_spec["data_idx"] == data_idx
+        ]
+    def _generate_specs(self) -> list[TileSpecs]:
+        tile_specs: list[TileSpecs] = []
+        for data_idx, data_shape in enumerate(self.data_shapes):
+            spatial_shape = data_shape[2:]
+            # spec info for each axis
+            axis_specs: list[tuple[list[int], list[int], list[int], list[int]]] = [
+                self._compute_1d_coords(
+                    axis_size, self.patch_size[axis_idx], self.overlaps[axis_idx]
+                )
+                for axis_idx, axis_size in enumerate(spatial_shape)
+            ]
+            # combine by using zip
+            all_coords, all_stitch_coords, all_crop_coords, all_crop_size = zip(
+                *axis_specs, strict=False
+            )
+            # number of tiles for this data_idx
+            n_tiles = prod(len(dim) for dim in all_coords) * data_shape[0]
+            # patches will be the same for each sample in a stack
+            for sample_idx in range(data_shape[0]):
+                # iterate through all combinations using itertools.product
+                for coords, stitch_coords, crop_coords, crop_size in zip(
+                    itertools.product(*all_coords),
+                    itertools.product(*all_stitch_coords),
+                    itertools.product(*all_crop_coords),
+                    itertools.product(*all_crop_size),
+                    strict=False,
+                ):
+                    tile_specs.append(
+                        {
+                            # PatchSpecs
+                            "data_idx": data_idx,
+                            "sample_idx": sample_idx,
+                            "coords": coords,
+                            "patch_size": self.patch_size,
+                            # TileSpecs additional fields
+                            "crop_coords": crop_coords,
+                            "crop_size": crop_size,
+                            "stitch_coords": stitch_coords,
+                            "total_tiles": n_tiles,
+                        }
+                    )
+        return tile_specs
+    @staticmethod
+    def _compute_1d_coords(
+        axis_size: int, patch_size: int, overlap: int
+    ) -> tuple[list[int], list[int], list[int], list[int]]:
+        """
+        Computes the TileSpec information for a single axis.
+        Parameters
+        ----------
+        axis_size : int
+            The size of the axis.
+        patch_size : int
+            The tile size.
+        overlap : int
+            The tile overlap.
+        Returns
+        -------
+        coords: list of int
+            The top-left (and first z-slice for 3D data) of a tile, in coords relative
+            to the image.
+        stitch_coords: list of int
+            Where the tile will be stitched back into an image, taking into account
+            that the tile will be cropped, in coords relative to the image.
+        crop_coords: list of int
+            The top-left side of where the tile will be cropped, in coordinates relative
+            to the tile.
+        crop_size: list of int
+            The size of the cropped tile.
+        """
+        coords: list[int] = []
+        stitch_coords: list[int] = []
+        crop_coords: list[int] = []
+        crop_size: list[int] = []
+        step = patch_size - overlap
+        for i in range(0, max(1, axis_size - overlap), step):
+            if i == 0:
+                coords.append(i)
+                crop_coords.append(0)
+                stitch_coords.append(0)
+                if axis_size <= patch_size:
+                    crop_size.append(axis_size)
+                else:
+                    crop_size.append(patch_size - overlap // 2)
+            elif (0 < i) and (i + patch_size < axis_size):
+                coords.append(i)
+                crop_coords.append(overlap // 2)
+                stitch_coords.append(coords[-1] + crop_coords[-1])
+                crop_size.append(patch_size - overlap)
+            else:
+                previous_crop_size = crop_size[-1] if crop_size else 1
+                previous_stitch_coord = stitch_coords[-1] if stitch_coords else 0
+                previous_tile_end = previous_stitch_coord + previous_crop_size
+                coords.append(max(0, axis_size - patch_size))
+                stitch_coords.append(previous_tile_end)
+                crop_coords.append(stitch_coords[-1] - coords[-1])
+                crop_size.append(axis_size - stitch_coords[-1])
+        return (
+            coords,
+            stitch_coords,
+            crop_coords,
+            crop_size,
+        )