careamics 0.1.0rc1__py3-none-any.whl → 0.1.0rc3__py3-none-any.whl

This diff shows the changes between two publicly released versions of the package, as they appear in their public registry. It is provided for informational purposes only.

Potentially problematic release.

Files changed (132)
  1. careamics/__init__.py +14 -4
  2. careamics/callbacks/__init__.py +6 -0
  3. careamics/callbacks/hyperparameters_callback.py +42 -0
  4. careamics/callbacks/progress_bar_callback.py +57 -0
  5. careamics/careamist.py +761 -0
  6. careamics/config/__init__.py +27 -3
  7. careamics/config/algorithm_model.py +167 -0
  8. careamics/config/architectures/__init__.py +17 -0
  9. careamics/config/architectures/architecture_model.py +29 -0
  10. careamics/config/architectures/custom_model.py +150 -0
  11. careamics/config/architectures/register_model.py +101 -0
  12. careamics/config/architectures/unet_model.py +96 -0
  13. careamics/config/architectures/vae_model.py +39 -0
  14. careamics/config/callback_model.py +92 -0
  15. careamics/config/configuration_factory.py +460 -0
  16. careamics/config/configuration_model.py +596 -0
  17. careamics/config/data_model.py +555 -0
  18. careamics/config/inference_model.py +283 -0
  19. careamics/config/noise_models.py +162 -0
  20. careamics/config/optimizer_models.py +181 -0
  21. careamics/config/references/__init__.py +45 -0
  22. careamics/config/references/algorithm_descriptions.py +131 -0
  23. careamics/config/references/references.py +38 -0
  24. careamics/config/support/__init__.py +33 -0
  25. careamics/config/support/supported_activations.py +24 -0
  26. careamics/config/support/supported_algorithms.py +18 -0
  27. careamics/config/support/supported_architectures.py +18 -0
  28. careamics/config/support/supported_data.py +82 -0
  29. careamics/{dataset/extraction_strategy.py → config/support/supported_extraction_strategies.py} +5 -2
  30. careamics/config/support/supported_loggers.py +8 -0
  31. careamics/config/support/supported_losses.py +25 -0
  32. careamics/config/support/supported_optimizers.py +55 -0
  33. careamics/config/support/supported_pixel_manipulations.py +15 -0
  34. careamics/config/support/supported_struct_axis.py +19 -0
  35. careamics/config/support/supported_transforms.py +23 -0
  36. careamics/config/tile_information.py +104 -0
  37. careamics/config/training_model.py +65 -0
  38. careamics/config/transformations/__init__.py +14 -0
  39. careamics/config/transformations/n2v_manipulate_model.py +63 -0
  40. careamics/config/transformations/nd_flip_model.py +32 -0
  41. careamics/config/transformations/normalize_model.py +31 -0
  42. careamics/config/transformations/transform_model.py +44 -0
  43. careamics/config/transformations/xy_random_rotate90_model.py +29 -0
  44. careamics/config/validators/__init__.py +5 -0
  45. careamics/config/validators/validator_utils.py +100 -0
  46. careamics/conftest.py +26 -0
  47. careamics/dataset/__init__.py +5 -0
  48. careamics/dataset/dataset_utils/__init__.py +19 -0
  49. careamics/dataset/dataset_utils/dataset_utils.py +100 -0
  50. careamics/dataset/dataset_utils/file_utils.py +140 -0
  51. careamics/dataset/dataset_utils/read_tiff.py +61 -0
  52. careamics/dataset/dataset_utils/read_utils.py +25 -0
  53. careamics/dataset/dataset_utils/read_zarr.py +56 -0
  54. careamics/dataset/in_memory_dataset.py +321 -131
  55. careamics/dataset/iterable_dataset.py +416 -0
  56. careamics/dataset/patching/__init__.py +8 -0
  57. careamics/dataset/patching/patch_transform.py +44 -0
  58. careamics/dataset/patching/patching.py +212 -0
  59. careamics/dataset/patching/random_patching.py +190 -0
  60. careamics/dataset/patching/sequential_patching.py +206 -0
  61. careamics/dataset/patching/tiled_patching.py +158 -0
  62. careamics/dataset/patching/validate_patch_dimension.py +60 -0
  63. careamics/dataset/zarr_dataset.py +149 -0
  64. careamics/lightning_datamodule.py +665 -0
  65. careamics/lightning_module.py +292 -0
  66. careamics/lightning_prediction_datamodule.py +390 -0
  67. careamics/lightning_prediction_loop.py +116 -0
  68. careamics/losses/__init__.py +4 -1
  69. careamics/losses/loss_factory.py +24 -13
  70. careamics/losses/losses.py +65 -5
  71. careamics/losses/noise_model_factory.py +40 -0
  72. careamics/losses/noise_models.py +524 -0
  73. careamics/model_io/__init__.py +8 -0
  74. careamics/model_io/bioimage/__init__.py +11 -0
  75. careamics/model_io/bioimage/_readme_factory.py +120 -0
  76. careamics/model_io/bioimage/bioimage_utils.py +48 -0
  77. careamics/model_io/bioimage/model_description.py +318 -0
  78. careamics/model_io/bmz_io.py +231 -0
  79. careamics/model_io/model_io_utils.py +80 -0
  80. careamics/models/__init__.py +4 -1
  81. careamics/models/activation.py +35 -0
  82. careamics/models/layers.py +244 -0
  83. careamics/models/model_factory.py +21 -202
  84. careamics/models/unet.py +46 -20
  85. careamics/prediction/__init__.py +1 -3
  86. careamics/prediction/stitch_prediction.py +73 -0
  87. careamics/transforms/__init__.py +41 -0
  88. careamics/transforms/n2v_manipulate.py +113 -0
  89. careamics/transforms/nd_flip.py +93 -0
  90. careamics/transforms/normalize.py +109 -0
  91. careamics/transforms/pixel_manipulation.py +383 -0
  92. careamics/transforms/struct_mask_parameters.py +18 -0
  93. careamics/transforms/tta.py +74 -0
  94. careamics/transforms/xy_random_rotate90.py +95 -0
  95. careamics/utils/__init__.py +10 -13
  96. careamics/utils/base_enum.py +32 -0
  97. careamics/utils/context.py +22 -2
  98. careamics/utils/metrics.py +0 -46
  99. careamics/utils/path_utils.py +24 -0
  100. careamics/utils/ram.py +13 -0
  101. careamics/utils/receptive_field.py +102 -0
  102. careamics/utils/running_stats.py +43 -0
  103. careamics/utils/torch_utils.py +89 -56
  104. careamics-0.1.0rc3.dist-info/METADATA +122 -0
  105. careamics-0.1.0rc3.dist-info/RECORD +109 -0
  106. {careamics-0.1.0rc1.dist-info → careamics-0.1.0rc3.dist-info}/WHEEL +1 -1
  107. careamics/bioimage/__init__.py +0 -15
  108. careamics/bioimage/docs/Noise2Void.md +0 -5
  109. careamics/bioimage/docs/__init__.py +0 -1
  110. careamics/bioimage/io.py +0 -271
  111. careamics/config/algorithm.py +0 -231
  112. careamics/config/config.py +0 -296
  113. careamics/config/config_filter.py +0 -44
  114. careamics/config/data.py +0 -194
  115. careamics/config/torch_optim.py +0 -118
  116. careamics/config/training.py +0 -534
  117. careamics/dataset/dataset_utils.py +0 -115
  118. careamics/dataset/patching.py +0 -493
  119. careamics/dataset/prepare_dataset.py +0 -174
  120. careamics/dataset/tiff_dataset.py +0 -211
  121. careamics/engine.py +0 -954
  122. careamics/manipulation/__init__.py +0 -4
  123. careamics/manipulation/pixel_manipulation.py +0 -158
  124. careamics/prediction/prediction_utils.py +0 -102
  125. careamics/utils/ascii_logo.txt +0 -9
  126. careamics/utils/augment.py +0 -65
  127. careamics/utils/normalization.py +0 -55
  128. careamics/utils/validators.py +0 -156
  129. careamics/utils/wandb.py +0 -121
  130. careamics-0.1.0rc1.dist-info/METADATA +0 -80
  131. careamics-0.1.0rc1.dist-info/RECORD +0 -46
  132. {careamics-0.1.0rc1.dist-info → careamics-0.1.0rc3.dist-info}/licenses/LICENSE +0 -0
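
The list above amounts to a rewrite of the training stack: the monolithic Engine in careamics/engine.py (deleted, shown below) and the old config modules give way to a PyTorch Lightning based design built around careamics/careamist.py, careamics/lightning_module.py and careamics/lightning_datamodule.py. For orientation, the new entry point is presumably used along the following lines; this is a hypothetical sketch inferred from the new file names only, and none of these signatures appear in this diff.

# Hypothetical sketch of the new CAREamist entry point (careamics/careamist.py).
# The parameter names source, train_source and val_source are assumptions.
from careamics import CAREamist

careamist = CAREamist(source="config.yaml")  # configuration file, or a Configuration object
careamist.train(train_source="train/", val_source="val/")
prediction = careamist.predict(source="image.tif")
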
careamics/engine.py DELETED
@@ -1,954 +0,0 @@
-"""
-Engine module.
-
-This module contains the main CAREamics class, the Engine. The Engine allows training
-a model and using it for prediction.
-"""
-from logging import FileHandler
-from pathlib import Path
-from typing import Any, Dict, List, Optional, Tuple, Union
-
-import numpy as np
-import torch
-from bioimageio.spec.model.raw_nodes import Model as BioimageModel
-from torch.utils.data import DataLoader, TensorDataset
-
-from .bioimage import (
-    build_zip_model,
-    get_default_model_specs,
-)
-from .config import Configuration, load_configuration
-from .dataset.prepare_dataset import (
-    get_prediction_dataset,
-    get_train_dataset,
-    get_validation_dataset,
-)
-from .losses import create_loss_function
-from .models import create_model
-from .prediction import (
-    stitch_prediction,
-    tta_backward,
-    tta_forward,
-)
-from .utils import (
-    MetricTracker,
-    check_array_validity,
-    denormalize,
-    get_device,
-    normalize,
-)
-from .utils.logging import ProgressBar, get_logger
-
-
-# TODO: refactor private methods and bioimage.io to other modules
-class Engine:
-    """
-    Class allowing training of a model and subsequent prediction.
-
-    There are three ways to instantiate an Engine:
-    1. With a CAREamics model (.pth), by passing a path.
-    2. With a configuration object.
-    3. With a configuration file, by passing a path.
-
-    In each case, the parameter name must be provided explicitly. For example:
-    >>> engine = Engine(config_path="path/to/config.yaml")
-
-    Note that only one of these options can be used at a time, in the order listed
-    above.
-
-    Parameters
-    ----------
-    config : Optional[Configuration], optional
-        Configuration object, by default None.
-    config_path : Optional[Union[str, Path]], optional
-        Path to configuration file, by default None.
-    model_path : Optional[Union[str, Path]], optional
-        Path to model file, by default None.
-    seed : int, optional
-        Seed for reproducibility, by default 42.
-
-    Attributes
-    ----------
-    cfg : Configuration
-        Configuration.
-    device : torch.device
-        Device (CPU or GPU).
-    model : torch.nn.Module
-        Model.
-    optimizer : torch.optim.Optimizer
-        Optimizer.
-    lr_scheduler : torch.optim.lr_scheduler._LRScheduler
-        Learning rate scheduler.
-    scaler : torch.cuda.amp.GradScaler
-        Gradient scaler.
-    loss_func : Callable
-        Loss function.
-    logger : logging.Logger
-        Logger.
-    use_wandb : bool
-        Whether to use wandb.
-    """
-
-    def __init__(
-        self,
-        *,
-        config: Optional[Configuration] = None,
-        config_path: Optional[Union[str, Path]] = None,
-        model_path: Optional[Union[str, Path]] = None,
-        seed: Optional[int] = 42,
-    ) -> None:
-        """
-        Constructor.
-
-        To disable the seed, set it to None.
-
-        Parameters
-        ----------
-        config : Optional[Configuration], optional
-            Configuration object, by default None.
-        config_path : Optional[Union[str, Path]], optional
-            Path to configuration file, by default None.
-        model_path : Optional[Union[str, Path]], optional
-            Path to model file, by default None.
-        seed : int, optional
-            Seed for reproducibility, by default 42.
-
-        Raises
-        ------
-        ValueError
-            If all three parameters are None.
-        FileNotFoundError
-            If the model or configuration path is provided but does not exist.
-        TypeError
-            If the configuration is not a Configuration object.
-        UsageError
-            If wandb is not correctly installed.
-        ModuleNotFoundError
-            If wandb is not installed.
-        ValueError
-            If the configuration failed to configure.
-        """
-        if model_path is not None:
-            if not Path(model_path).exists():
-                raise FileNotFoundError(
-                    f"Model path {model_path} is incorrect or"
-                    f" does not exist. Current working directory is: {Path.cwd()!s}"
-                )
-
-            # Ensure that config is None
-            self.cfg = None
-
-        elif config is not None:
-            # Check that config is a Configuration object
-            if not isinstance(config, Configuration):
-                raise TypeError(
-                    f"config must be a Configuration object, got {type(config)}"
-                )
-            self.cfg = config
-        elif config_path is not None:
-            self.cfg = load_configuration(config_path)
-        else:
-            raise ValueError(
-                "No configuration or path provided. One of configuration "
-                "object, configuration path or model path must be provided."
-            )
-
-        # get device, CPU or GPU
-        self.device = get_device()
-
-        # Create model, optimizer, lr scheduler and gradient scaler and load everything
-        # to the specified device
-        (
-            self.model,
-            self.optimizer,
-            self.lr_scheduler,
-            self.scaler,
-            self.cfg,
-        ) = create_model(config=self.cfg, model_path=model_path, device=self.device)
-
-        # create loss function
-        if self.cfg is not None:
-            self.loss_func = create_loss_function(self.cfg)
-
-            # Set logging
-            log_path = self.cfg.working_directory / "log.txt"
-            self.logger = get_logger(__name__, log_path=log_path)
-
-            # wandb
-            self.use_wandb = self.cfg.training.use_wandb
-
-            if self.use_wandb:
-                try:
-                    from wandb.errors import UsageError
-
-                    from careamics.utils.wandb import WandBLogging
-
-                    try:
-                        self.wandb = WandBLogging(
-                            experiment_name=self.cfg.experiment_name,
-                            log_path=self.cfg.working_directory,
-                            config=self.cfg,
-                            model_to_watch=self.model,
-                        )
-                    except UsageError as e:
-                        self.logger.warning(
-                            f"Wandb usage error, using default logger. Check whether "
-                            f"wandb correctly configured:\n"
-                            f"{e}"
-                        )
-                        self.use_wandb = False
-
-                except ModuleNotFoundError:
-                    self.logger.warning(
-                        "Wandb not installed, using default logger. Try pip install "
-                        "wandb"
-                    )
-                    self.use_wandb = False
-        else:
-            raise ValueError("Configuration is not defined.")
-
-    def train(
-        self,
-        train_path: str,
-        val_path: str,
-    ) -> Tuple[List[Any], List[Any]]:
-        """
-        Train the network.
-
-        The training and validation data given by the paths must be compatible with the
-        axes and data format provided in the configuration.
-
-        Parameters
-        ----------
-        train_path : Union[str, Path]
-            Path to the training data.
-        val_path : Union[str, Path]
-            Path to the validation data.
-
-        Returns
-        -------
-        Tuple[List[Any], List[Any]]
-            Tuple of training and validation statistics.
-
-        Raises
-        ------
-        ValueError
-            Raise a ValueError if the configuration is missing.
-        """
-        if self.cfg is None:
-            raise ValueError("Configuration is not defined, cannot train.")
-
-        # General func
-        train_loader = self._get_train_dataloader(train_path)
-
-        # Set mean and std from train dataset of none
-        if self.cfg.data.mean is None or self.cfg.data.std is None:
-            self.cfg.data.set_mean_and_std(
-                train_loader.dataset.mean, train_loader.dataset.std
-            )
-
-        eval_loader = self._get_val_dataloader(val_path)
-        self.logger.info(f"Starting training for {self.cfg.training.num_epochs} epochs")
-
-        val_losses = []
-
-        try:
-            train_stats = []
-            eval_stats = []
-
-            # loop over the dataset multiple times
-            for epoch in range(self.cfg.training.num_epochs):
-                if hasattr(train_loader.dataset, "__len__"):
-                    epoch_size = train_loader.__len__()
-                else:
-                    epoch_size = None
-
-                progress_bar = ProgressBar(
-                    max_value=epoch_size,
-                    epoch=epoch,
-                    num_epochs=self.cfg.training.num_epochs,
-                    mode="train",
-                )
-                # train_epoch = train_op(self._train_single_epoch,)
-                # Perform training step
-                train_outputs, epoch_size = self._train_single_epoch(
-                    train_loader,
-                    progress_bar,
-                    self.cfg.training.amp.use,
-                )
-                # Perform validation step
-                eval_outputs = self._evaluate(eval_loader)
-                val_losses.append(eval_outputs["loss"])
-                learning_rate = self.optimizer.param_groups[0]["lr"]
-
-                progress_bar.add(
-                    1,
-                    values=[
-                        ("train_loss", train_outputs["loss"]),
-                        ("val loss", eval_outputs["loss"]),
-                        ("lr", learning_rate),
-                    ],
-                )
-                # Add update scheduler rule based on type
-                self.lr_scheduler.step(eval_outputs["loss"])
-
-                if self.use_wandb:
-                    metrics = {
-                        "train": train_outputs,
-                        "eval": eval_outputs,
-                        "lr": learning_rate,
-                    }
-                    self.wandb.log_metrics(metrics)
-
-                train_stats.append(train_outputs)
-                eval_stats.append(eval_outputs)
-
-                checkpoint_path = self._save_checkpoint(epoch, val_losses, "state_dict")
-                self.logger.info(f"Saved checkpoint to {checkpoint_path}")
-
-        except KeyboardInterrupt:
-            self.logger.info("Training interrupted")
-
-        return train_stats, eval_stats
-
-    def _train_single_epoch(
-        self,
-        loader: torch.utils.data.DataLoader,
-        progress_bar: ProgressBar,
-        amp: bool,
-    ) -> Tuple[Dict[str, float], int]:
-        """
-        Train for a single epoch.
-
-        Parameters
-        ----------
-        loader : torch.utils.data.DataLoader
-            Training dataloader.
-        progress_bar : ProgressBar
-            Progress bar.
-        amp : bool
-            Whether to use automatic mixed precision.
-
-        Returns
-        -------
-        Tuple[Dict[str, float], int]
-            Tuple of training metrics and epoch size.
-
-        Raises
-        ------
-        ValueError
-            If the configuration is missing.
-        """
-        if self.cfg is not None:
-            avg_loss = MetricTracker()
-            self.model.train()
-            epoch_size = 0
-
-            for i, (batch, *auxillary) in enumerate(loader):
-                self.optimizer.zero_grad(set_to_none=True)
-
-                with torch.cuda.amp.autocast(enabled=amp):
-                    outputs = self.model(batch.to(self.device))
-
-                loss = self.loss_func(
-                    outputs, *[a.to(self.device) for a in auxillary], self.device
-                )
-                self.scaler.scale(loss).backward()
-                avg_loss.update(loss.detach(), batch.shape[0])
-
-                progress_bar.update(
-                    current_step=i,
-                    batch_size=self.cfg.training.batch_size,
-                )
-
-                self.optimizer.step()
-                epoch_size += 1
-
-            return {"loss": avg_loss.avg.to(torch.float16).cpu().numpy()}, epoch_size
-        else:
-            raise ValueError("Configuration is not defined, cannot train.")
-
-    def _evaluate(self, val_loader: torch.utils.data.DataLoader) -> Dict[str, float]:
-        """
-        Perform validation step.
-
-        Parameters
-        ----------
-        val_loader : torch.utils.data.DataLoader
-            Validation dataloader.
-
-        Returns
-        -------
-        Dict[str, float]
-            Loss value on the validation set.
-        """
-        self.model.eval()
-        avg_loss = MetricTracker()
-
-        with torch.no_grad():
-            for patch, *auxillary in val_loader:
-                outputs = self.model(patch.to(self.device))
-                loss = self.loss_func(
-                    outputs, *[a.to(self.device) for a in auxillary], self.device
-                )
-                avg_loss.update(loss.detach(), patch.shape[0])
-        return {"loss": avg_loss.avg.to(torch.float16).cpu().numpy()}
-
-    def predict(
-        self,
-        input: Union[np.ndarray, str, Path],
-        *,
-        tile_shape: Optional[List[int]] = None,
-        overlaps: Optional[List[int]] = None,
-        axes: Optional[str] = None,
-        tta: bool = True,
-    ) -> Union[np.ndarray, List[np.ndarray]]:
-        """
-        Predict using the current model on an input array or a path to data.
-
-        The Engine must have previously been trained and mean/std be specified in
-        its configuration.
-
-        To use tiling, both `tile_shape` and `overlaps` must be specified, have same
-        length, be divisible by 2 and greater than 0. Finally, the overlaps must be
-        smaller than the tiles.
-
-        Parameters
-        ----------
-        input : Union[np.ndarra, str, Path]
-            Input data, either an array or a path to the data.
-        tile_shape : Optional[List[int]], optional
-            2D or 3D shape of the tiles to be predicted, by default None.
-        overlaps : Optional[List[int]], optional
-            2D or 3D overlaps between tiles, by default None.
-        axes : Optional[str], optional
-            Axes of the input array if different from the one in the configuration, by
-            default None.
-        tta : bool, optional
-            Whether to use test time augmentation, by default True.
-
-        Returns
-        -------
-        Union[np.ndarray, List[np.ndarray]]
-            Predicted image array of the same shape as the input, or list of arrays
-            if the arrays have inconsistent shapes.
-
-        Raises
-        ------
-        ValueError
-            If the configuration is missing.
-        ValueError
-            If the mean or std are not specified in the configuration (untrained model).
-        """
-        if self.cfg is None:
-            raise ValueError("Configuration is not defined, cannot predict.")
-
-        # Check that the mean and std are there (= has been trained)
-        if not self.cfg.data.mean or not self.cfg.data.std:
-            raise ValueError(
-                "Mean or std are not specified in the configuration, prediction cannot "
-                "be performed."
-            )
-
-        # set model to eval mode
-        self.model.to(self.device)
-        self.model.eval()
-
-        progress_bar = ProgressBar(num_epochs=1, mode="predict")
-
-        # Get dataloader
-        pred_loader, tiled = self._get_predict_dataloader(
-            input=input, tile_shape=tile_shape, overlaps=overlaps, axes=axes
-        )
-
-        # Start prediction
-        self.logger.info("Starting prediction")
-        if tiled:
-            self.logger.info("Starting tiled prediction")
-            prediction = self._predict_tiled(pred_loader, progress_bar, tta)
-        else:
-            self.logger.info("Starting prediction on whole sample")
-            prediction = self._predict_full(pred_loader, progress_bar, tta)
-
-        return prediction
-
-    def _predict_tiled(
-        self, pred_loader: DataLoader, progress_bar: ProgressBar, tta: bool = True
-    ) -> Union[np.ndarray, List[np.ndarray]]:
-        """
-        Predict using tiling.
-
-        Parameters
-        ----------
-        pred_loader : DataLoader
-            Prediction dataloader.
-        progress_bar : ProgressBar
-            Progress bar.
-        tta : bool, optional
-            Whether to use test time augmentation, by default True.
-
-        Returns
-        -------
-        Union[np.ndarray, List[np.ndarray]]
-            Predicted image, or list of predictions if the images have different sizes.
-
-        Warns
-        -----
-        UserWarning
-            If the samples have different shapes, the prediction then returns a list.
-        """
-        prediction = []
-        tiles = []
-        stitching_data = []
-
-        with torch.no_grad():
-            for i, (tile, *auxillary) in enumerate(pred_loader):
-                # Unpack auxillary data into last tile indicator and data, required to
-                # stitch tiles together
-                if auxillary:
-                    last_tile, *data = auxillary
-
-                if tta:
-                    augmented_tiles = tta_forward(tile)
-                    predicted_augments = []
-                    for augmented_tile in augmented_tiles:
-                        augmented_pred = self.model(augmented_tile.to(self.device))
-                        predicted_augments.append(
-                            augmented_pred.squeeze().cpu().numpy()
-                        )
-                    tiles.append(tta_backward(predicted_augments).squeeze())
-                else:
-                    tiles.append(
-                        self.model(tile.to(self.device)).squeeze().cpu().numpy()
-                    )
-
-                stitching_data.append(data)
-
-                if last_tile:
-                    # Stitch tiles together if sample is finished
-                    predicted_sample = stitch_prediction(tiles, stitching_data)
-                    predicted_sample = denormalize(
-                        predicted_sample,
-                        float(self.cfg.data.mean),  # type: ignore
-                        float(self.cfg.data.std),  # type: ignore
-                    )
-                    prediction.append(predicted_sample)
-                    tiles.clear()
-                    stitching_data.clear()
-
-                progress_bar.update(i, 1)
-        if tta:
-            i = int(i / 8)
-        self.logger.info(f"Predicted {len(prediction)} samples, {i} tiles in total")
-        try:
-            return np.stack(prediction)
-        except ValueError:
-            self.logger.warning("Samples have different shapes, returning list.")
-            return prediction
-
-    def _predict_full(
-        self, pred_loader: DataLoader, progress_bar: ProgressBar, tta: bool = True
-    ) -> np.ndarray:
-        """
-        Predict whole image without tiling.
-
-        Parameters
-        ----------
-        pred_loader : DataLoader
-            Prediction dataloader.
-        progress_bar : ProgressBar
-            Progress bar.
-        tta : bool, optional
-            Whether to use test time augmentation, by default True.
-
-        Returns
-        -------
-        np.ndarray
-            Predicted image.
-        """
-        prediction = []
-        with torch.no_grad():
-            for i, sample in enumerate(pred_loader):
-                if tta:
-                    augmented_preds = tta_forward(sample[0])
-                    predicted_augments = []
-                    for augmented_pred in augmented_preds:
-                        augmented_pred = self.model(augmented_pred.to(self.device))
-                        predicted_augments.append(
-                            augmented_pred.squeeze().cpu().numpy()
-                        )
-                    prediction.append(tta_backward(predicted_augments).squeeze())
-                else:
-                    prediction.append(
-                        self.model(sample[0].to(self.device)).squeeze().cpu().numpy()
-                    )
-                progress_bar.update(i, 1)
-        output = denormalize(
-            np.stack(prediction), float(self.cfg.data.mean), float(self.cfg.data.std)  # type: ignore
-        )
-        return output
-
-    def _get_train_dataloader(self, train_path: str) -> DataLoader:
-        """
-        Return a training dataloader.
-
-        Parameters
-        ----------
-        train_path : str
-            Path to the training data.
-
-        Returns
-        -------
-        DataLoader
-            Training data loader.
-
-        Raises
-        ------
-        ValueError
-            If the training configuration is None.
-        """
-        if self.cfg is None:
-            raise ValueError("Configuration is not defined.")
-
-        dataset = get_train_dataset(self.cfg, train_path)
-        dataloader = DataLoader(
-            dataset,
-            batch_size=self.cfg.training.batch_size,
-            num_workers=self.cfg.training.num_workers,
-            pin_memory=True,
-        )
-        return dataloader
-
-    def _get_val_dataloader(self, val_path: str) -> DataLoader:
-        """
-        Return a validation dataloader.
-
-        Parameters
-        ----------
-        val_path : str
-            Path to the validation data.
-
-        Returns
-        -------
-        DataLoader
-            Validation data loader.
-
-        Raises
-        ------
-        ValueError
-            If the configuration is None.
-        """
-        if self.cfg is None:
-            raise ValueError("Configuration is not defined.")
-
-        dataset = get_validation_dataset(self.cfg, val_path)
-        dataloader = DataLoader(
-            dataset,
-            batch_size=self.cfg.training.batch_size,
-            num_workers=self.cfg.training.num_workers,
-            pin_memory=True,
-        )
-        return dataloader
-
-    def _get_predict_dataloader(
-        self,
-        input: Union[np.ndarray, str, Path],
-        *,
-        tile_shape: Optional[List[int]] = None,
-        overlaps: Optional[List[int]] = None,
-        axes: Optional[str] = None,
-    ) -> Tuple[DataLoader, bool]:
-        """
-        Return a prediction dataloader.
-
-        Parameters
-        ----------
-        input : Union[np.ndarray, str, Path]
-            Input array or path to data.
-        tile_shape : Optional[List[int]], optional
-            2D or 3D shape of the tiles, by default None.
-        overlaps : Optional[List[int]], optional
-            2D or 3D overlaps between tiles, by default None.
-        axes : Optional[str], optional
-            Axes of the input array if different from the one in the configuration.
-
-        Returns
-        -------
-        Tuple[DataLoader, bool]
-            Tuple of prediction data loader, and whether the data is tiled.
-
-        Raises
-        ------
-        ValueError
-            If the configuration is None.
-        ValueError
-            If the mean or std are not specified in the configuration.
-        ValueError
-            If the input is None.
-        """
-        if self.cfg is None:
-            raise ValueError("Configuration is not defined.")
-
-        if self.cfg.data.mean is None or self.cfg.data.std is None:
-            raise ValueError(
-                "Mean or std are not specified in the configuration, prediction cannot "
-                "be performed. Was the model trained?"
-            )
-
-        if input is None:
-            raise ValueError("Ccannot predict on None input.")
-
-        # Create dataset
-        if isinstance(input, np.ndarray):  # np.ndarray
-            # Check that the axes fit the input
-            img_axes = self.cfg.data.axes if axes is None else axes
-            # TODO are self.cfg.data.axes and axes compatible (same spatial dim)?
-            check_array_validity(input, img_axes)
-
-            # Check if tiling requested
-            tiled = tile_shape is not None and overlaps is not None
-
-            # Validate tiles and overlaps
-            if tiled:
-                raise NotImplementedError(
-                    "Tiling with in memory array is currently not implemented."
-                )
-
-                # check_tiling_validity(tile_shape, overlaps)
-
-            # Normalize input and cast to float32
-            normalized_input = normalize(
-                img=input, mean=self.cfg.data.mean, std=self.cfg.data.std
-            )
-            normalized_input = normalized_input.astype(np.float32)
-
-            # Create dataset
-            dataset = TensorDataset(torch.from_numpy(normalized_input))
-
-        elif isinstance(input, str) or isinstance(input, Path):  # path
-            # Create dataset
-            dataset = get_prediction_dataset(
-                self.cfg,
-                pred_path=input,
-                tile_shape=tile_shape,
-                overlaps=overlaps,
-                axes=axes,
-            )
-
-            tiled = (
-                hasattr(dataset, "patch_extraction_method")
-                and dataset.patch_extraction_method is not None
-            )
-        return (
-            DataLoader(
-                dataset,
-                batch_size=1,
-                num_workers=0,
-                pin_memory=True,
-            ),
-            tiled,
-        )
-
-    def _save_checkpoint(
-        self, epoch: int, losses: List[float], save_method: str
-    ) -> Path:
-        """
-        Save checkpoint.
-
-        Currently only supports saving using `save_method="state_dict"`.
-
-        Parameters
-        ----------
-        epoch : int
-            Last epoch.
-        losses : List[float]
-            List of losses.
-        save_method : str
-            Method to save the model. Currently only supports `state_dict`.
-
-        Returns
-        -------
-        Path
-            Path to the saved checkpoint.
-
-        Raises
-        ------
-        ValueError
-            If the configuration is None.
-        NotImplementedError
-            If the requested save method is not supported.
-        """
-        if self.cfg is None:
-            raise ValueError("Configuration is not defined.")
-
-        if epoch == 0 or losses[-1] == min(losses):
-            name = f"{self.cfg.experiment_name}_best.pth"
-        else:
-            name = f"{self.cfg.experiment_name}_latest.pth"
-        workdir = self.cfg.working_directory
-        workdir.mkdir(parents=True, exist_ok=True)
-
-        if save_method == "state_dict":
-            checkpoint = {
-                "epoch": epoch,
-                "model_state_dict": self.model.state_dict(),
-                "optimizer_state_dict": self.optimizer.state_dict(),
-                "scheduler_state_dict": self.lr_scheduler.state_dict(),
-                "grad_scaler_state_dict": self.scaler.state_dict(),
-                "loss": losses[-1],
-                "config": self.cfg.model_dump(),
-            }
-            torch.save(checkpoint, workdir / name)
-        else:
-            raise NotImplementedError("Invalid save method.")
-
-        return self.cfg.working_directory.absolute() / name
-
-    def __del__(self) -> None:
-        """Exit logger."""
-        if hasattr(self, "logger"):
-            for handler in self.logger.handlers:
-                if isinstance(handler, FileHandler):
-                    self.logger.removeHandler(handler)
-                    handler.close()
-
-    def _generate_rdf(self, model_specs: Optional[dict] = None) -> dict:
-        """
-        Generate rdf data for bioimage.io format export.
-
-        Parameters
-        ----------
-        model_specs : Optional[dict], optional
-            Custom specs if different than the default ones, by default None.
-
-        Returns
-        -------
-        dict
-            RDF specs.
-
-        Raises
-        ------
-        ValueError
-            If the mean or std are not specified in the configuration.
-        ValueError
-            If the configuration is not defined.
-        """
-        if self.cfg is not None:
-            if self.cfg.data.mean is None or self.cfg.data.std is None:
-                raise ValueError(
-                    "Mean or std are not specified in the configuration, export to "
-                    "bioimage.io format is not possible."
-                )
-
-            # set in/out axes from config
-            axes = self.cfg.data.axes.lower().replace("s", "")
-            if "c" not in axes:
-                axes = "c" + axes
-            if "b" not in axes:
-                axes = "b" + axes
-
-            # get in/out samples' files
-            test_inputs, test_outputs = self._get_sample_io_files(axes)
-
-            specs = get_default_model_specs(
-                "Noise2Void",
-                self.cfg.data.mean,
-                self.cfg.data.std,
-                self.cfg.algorithm.is_3D,
-            )
-            if model_specs is not None:
-                specs.update(model_specs)
-
-            specs.update(
-                {
-                    "architecture": "careamics.models.unet",
-                    "test_inputs": test_inputs,
-                    "test_outputs": test_outputs,
-                    "input_axes": [axes],
-                    "output_axes": [axes],
-                }
-            )
-            return specs
-        else:
-            raise ValueError("Configuration is not defined.")
-
-    def save_as_bioimage(
-        self, output_zip: Union[Path, str], model_specs: Optional[dict] = None
-    ) -> BioimageModel:
-        """
-        Export the current model to BioImage.io model zoo format.
-
-        Parameters
-        ----------
-        output_zip : Union[Path, str]
-            Where to save the model zip file.
-        model_specs : Optional[dict]
-            A dictionary with keys being the bioimage-core build_model parameters. If
-            None then it will be populated by the model default specs.
-
-        Returns
-        -------
-        BioimageModel
-            Bioimage.io model object.
-
-        Raises
-        ------
-        ValueError
-            If the configuration is not defined.
-        """
-        if self.cfg is not None:
-            # Generate specs
-            specs = self._generate_rdf(model_specs)
-
-            # Build model
-            raw_model = build_zip_model(
-                path=output_zip,
-                config=self.cfg,
-                model_specs=specs,
-            )
-
-            return raw_model
-        else:
-            raise ValueError("Configuration is not defined.")
-
-    def _get_sample_io_files(self, axes: str) -> Tuple[List[str], List[str]]:
-        """
-        Create numpy format for use as inputs and outputs in the bioimage.io archive.
-
-        Parameters
-        ----------
-        axes : str
-            Input and output axes.
-
-        Returns
-        -------
-        Tuple[List[str], List[str]]
-            Tuple of input and output file paths.
-
-        Raises
-        ------
-        ValueError
-            If the configuration is not defined.
-        """
-        # input:
-        if self.cfg is not None:
-            sample_input = np.random.randn(*self.cfg.training.patch_size)
-            # if there are more input axes (like channel, ...),
-            # then expand the sample dimensions.
-            len_diff = len(axes) - len(self.cfg.training.patch_size)
-            if len_diff > 0:
-                sample_input = np.expand_dims(
-                    sample_input, axis=tuple(i for i in range(len_diff))
-                )
-            sample_output = np.random.randn(*sample_input.shape)
-
-            # save numpy files
-            workdir = self.cfg.working_directory
-            in_file = workdir.joinpath("test_inputs.npy")
-            np.save(in_file, sample_input)
-            out_file = workdir.joinpath("test_outputs.npy")
-            np.save(out_file, sample_output)
-
-            return [str(in_file.absolute())], [str(out_file.absolute())]
-        else:
-            raise ValueError("Configuration is not defined.")
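
For reference, the removed Engine documents its own workflow in the docstrings above. The sketch below is assembled solely from the deleted module's signatures and docstring example; the paths and tile sizes are placeholders, and this API no longer exists in 0.1.0rc3.

# Workflow of the removed Engine (0.1.0rc1), reconstructed from the deleted module above.
from careamics.engine import Engine

# One of config, config_path or model_path must be passed explicitly.
engine = Engine(config_path="path/to/config.yaml")

# train() returns a tuple of training and validation statistics.
train_stats, eval_stats = engine.train(train_path="train/", val_path="val/")

# Tiled prediction: tile_shape and overlaps must have the same length, be
# divisible by 2 and greater than 0, and overlaps must be smaller than the tiles.
prediction = engine.predict("image.tif", tile_shape=[64, 64], overlaps=[32, 32])

# Export the trained model to the BioImage.io model zoo format.
engine.save_as_bioimage("model.zip")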