careamics-0.0.1-py3-none-any.whl → careamics-0.0.3-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release: this version of careamics might be problematic.

Files changed (155)
  1. careamics/__init__.py +6 -1
  2. careamics/careamist.py +729 -0
  3. careamics/config/__init__.py +39 -0
  4. careamics/config/architectures/__init__.py +17 -0
  5. careamics/config/architectures/architecture_model.py +37 -0
  6. careamics/config/architectures/custom_model.py +162 -0
  7. careamics/config/architectures/lvae_model.py +174 -0
  8. careamics/config/architectures/register_model.py +103 -0
  9. careamics/config/architectures/unet_model.py +118 -0
  10. careamics/config/callback_model.py +123 -0
  11. careamics/config/configuration_factory.py +583 -0
  12. careamics/config/configuration_model.py +604 -0
  13. careamics/config/data_model.py +527 -0
  14. careamics/config/fcn_algorithm_model.py +147 -0
  15. careamics/config/inference_model.py +239 -0
  16. careamics/config/likelihood_model.py +43 -0
  17. careamics/config/nm_model.py +101 -0
  18. careamics/config/optimizer_models.py +187 -0
  19. careamics/config/references/__init__.py +45 -0
  20. careamics/config/references/algorithm_descriptions.py +132 -0
  21. careamics/config/references/references.py +39 -0
  22. careamics/config/support/__init__.py +31 -0
  23. careamics/config/support/supported_activations.py +27 -0
  24. careamics/config/support/supported_algorithms.py +33 -0
  25. careamics/config/support/supported_architectures.py +17 -0
  26. careamics/config/support/supported_data.py +109 -0
  27. careamics/config/support/supported_loggers.py +10 -0
  28. careamics/config/support/supported_losses.py +29 -0
  29. careamics/config/support/supported_optimizers.py +57 -0
  30. careamics/config/support/supported_pixel_manipulations.py +15 -0
  31. careamics/config/support/supported_struct_axis.py +21 -0
  32. careamics/config/support/supported_transforms.py +11 -0
  33. careamics/config/tile_information.py +65 -0
  34. careamics/config/training_model.py +72 -0
  35. careamics/config/transformations/__init__.py +15 -0
  36. careamics/config/transformations/n2v_manipulate_model.py +64 -0
  37. careamics/config/transformations/normalize_model.py +60 -0
  38. careamics/config/transformations/transform_model.py +45 -0
  39. careamics/config/transformations/xy_flip_model.py +43 -0
  40. careamics/config/transformations/xy_random_rotate90_model.py +35 -0
  41. careamics/config/vae_algorithm_model.py +171 -0
  42. careamics/config/validators/__init__.py +5 -0
  43. careamics/config/validators/validator_utils.py +101 -0
  44. careamics/conftest.py +39 -0
  45. careamics/dataset/__init__.py +17 -0
  46. careamics/dataset/dataset_utils/__init__.py +19 -0
  47. careamics/dataset/dataset_utils/dataset_utils.py +101 -0
  48. careamics/dataset/dataset_utils/file_utils.py +141 -0
  49. careamics/dataset/dataset_utils/iterate_over_files.py +83 -0
  50. careamics/dataset/dataset_utils/running_stats.py +186 -0
  51. careamics/dataset/in_memory_dataset.py +310 -0
  52. careamics/dataset/in_memory_pred_dataset.py +88 -0
  53. careamics/dataset/in_memory_tiled_pred_dataset.py +129 -0
  54. careamics/dataset/iterable_dataset.py +295 -0
  55. careamics/dataset/iterable_pred_dataset.py +122 -0
  56. careamics/dataset/iterable_tiled_pred_dataset.py +140 -0
  57. careamics/dataset/patching/__init__.py +1 -0
  58. careamics/dataset/patching/patching.py +299 -0
  59. careamics/dataset/patching/random_patching.py +201 -0
  60. careamics/dataset/patching/sequential_patching.py +212 -0
  61. careamics/dataset/patching/validate_patch_dimension.py +64 -0
  62. careamics/dataset/tiling/__init__.py +10 -0
  63. careamics/dataset/tiling/collate_tiles.py +33 -0
  64. careamics/dataset/tiling/lvae_tiled_patching.py +282 -0
  65. careamics/dataset/tiling/tiled_patching.py +164 -0
  66. careamics/dataset/zarr_dataset.py +151 -0
  67. careamics/file_io/__init__.py +15 -0
  68. careamics/file_io/read/__init__.py +12 -0
  69. careamics/file_io/read/get_func.py +56 -0
  70. careamics/file_io/read/tiff.py +58 -0
  71. careamics/file_io/read/zarr.py +60 -0
  72. careamics/file_io/write/__init__.py +15 -0
  73. careamics/file_io/write/get_func.py +63 -0
  74. careamics/file_io/write/tiff.py +40 -0
  75. careamics/lightning/__init__.py +18 -0
  76. careamics/lightning/callbacks/__init__.py +11 -0
  77. careamics/lightning/callbacks/hyperparameters_callback.py +49 -0
  78. careamics/lightning/callbacks/prediction_writer_callback/__init__.py +20 -0
  79. careamics/lightning/callbacks/prediction_writer_callback/file_path_utils.py +56 -0
  80. careamics/lightning/callbacks/prediction_writer_callback/prediction_writer_callback.py +233 -0
  81. careamics/lightning/callbacks/prediction_writer_callback/write_strategy.py +398 -0
  82. careamics/lightning/callbacks/prediction_writer_callback/write_strategy_factory.py +215 -0
  83. careamics/lightning/callbacks/progress_bar_callback.py +90 -0
  84. careamics/lightning/lightning_module.py +632 -0
  85. careamics/lightning/predict_data_module.py +333 -0
  86. careamics/lightning/train_data_module.py +680 -0
  87. careamics/losses/__init__.py +15 -0
  88. careamics/losses/fcn/__init__.py +1 -0
  89. careamics/losses/fcn/losses.py +98 -0
  90. careamics/losses/loss_factory.py +155 -0
  91. careamics/losses/lvae/__init__.py +1 -0
  92. careamics/losses/lvae/loss_utils.py +83 -0
  93. careamics/losses/lvae/losses.py +445 -0
  94. careamics/lvae_training/__init__.py +0 -0
  95. careamics/lvae_training/dataset/__init__.py +0 -0
  96. careamics/lvae_training/dataset/data_utils.py +701 -0
  97. careamics/lvae_training/dataset/lc_dataset.py +259 -0
  98. careamics/lvae_training/dataset/lc_dataset_config.py +13 -0
  99. careamics/lvae_training/dataset/vae_data_config.py +179 -0
  100. careamics/lvae_training/dataset/vae_dataset.py +1054 -0
  101. careamics/lvae_training/eval_utils.py +905 -0
  102. careamics/lvae_training/get_config.py +84 -0
  103. careamics/lvae_training/lightning_module.py +701 -0
  104. careamics/lvae_training/metrics.py +214 -0
  105. careamics/lvae_training/train_lvae.py +342 -0
  106. careamics/lvae_training/train_utils.py +121 -0
  107. careamics/model_io/__init__.py +7 -0
  108. careamics/model_io/bioimage/__init__.py +11 -0
  109. careamics/model_io/bioimage/_readme_factory.py +121 -0
  110. careamics/model_io/bioimage/bioimage_utils.py +52 -0
  111. careamics/model_io/bioimage/model_description.py +327 -0
  112. careamics/model_io/bmz_io.py +246 -0
  113. careamics/model_io/model_io_utils.py +95 -0
  114. careamics/models/__init__.py +5 -0
  115. careamics/models/activation.py +39 -0
  116. careamics/models/layers.py +493 -0
  117. careamics/models/lvae/__init__.py +3 -0
  118. careamics/models/lvae/layers.py +1998 -0
  119. careamics/models/lvae/likelihoods.py +364 -0
  120. careamics/models/lvae/lvae.py +901 -0
  121. careamics/models/lvae/noise_models.py +541 -0
  122. careamics/models/lvae/utils.py +395 -0
  123. careamics/models/model_factory.py +67 -0
  124. careamics/models/unet.py +443 -0
  125. careamics/prediction_utils/__init__.py +10 -0
  126. careamics/prediction_utils/lvae_prediction.py +158 -0
  127. careamics/prediction_utils/lvae_tiling_manager.py +362 -0
  128. careamics/prediction_utils/prediction_outputs.py +135 -0
  129. careamics/prediction_utils/stitch_prediction.py +112 -0
  130. careamics/transforms/__init__.py +20 -0
  131. careamics/transforms/compose.py +107 -0
  132. careamics/transforms/n2v_manipulate.py +146 -0
  133. careamics/transforms/normalize.py +243 -0
  134. careamics/transforms/pixel_manipulation.py +407 -0
  135. careamics/transforms/struct_mask_parameters.py +20 -0
  136. careamics/transforms/transform.py +24 -0
  137. careamics/transforms/tta.py +88 -0
  138. careamics/transforms/xy_flip.py +123 -0
  139. careamics/transforms/xy_random_rotate90.py +101 -0
  140. careamics/utils/__init__.py +19 -0
  141. careamics/utils/autocorrelation.py +40 -0
  142. careamics/utils/base_enum.py +60 -0
  143. careamics/utils/context.py +66 -0
  144. careamics/utils/logging.py +322 -0
  145. careamics/utils/metrics.py +188 -0
  146. careamics/utils/path_utils.py +26 -0
  147. careamics/utils/ram.py +15 -0
  148. careamics/utils/receptive_field.py +108 -0
  149. careamics/utils/torch_utils.py +127 -0
  150. careamics-0.0.3.dist-info/METADATA +78 -0
  151. careamics-0.0.3.dist-info/RECORD +154 -0
  152. {careamics-0.0.1.dist-info → careamics-0.0.3.dist-info}/WHEEL +1 -1
  153. {careamics-0.0.1.dist-info → careamics-0.0.3.dist-info}/licenses/LICENSE +1 -1
  154. careamics-0.0.1.dist-info/METADATA +0 -46
  155. careamics-0.0.1.dist-info/RECORD +0 -6
careamics/careamist.py ADDED
@@ -0,0 +1,729 @@
+ """A class to train, predict and export models in CAREamics."""
+
+ from pathlib import Path
+ from typing import Any, Callable, Literal, Optional, Union, overload
+
+ import numpy as np
+ from numpy.typing import NDArray
+ from pytorch_lightning import Trainer
+ from pytorch_lightning.callbacks import (
+     Callback,
+     EarlyStopping,
+     ModelCheckpoint,
+ )
+ from pytorch_lightning.loggers import TensorBoardLogger, WandbLogger
+
+ from careamics.config import Configuration, FCNAlgorithmConfig, load_configuration
+ from careamics.config.support import (
+     SupportedAlgorithm,
+     SupportedArchitecture,
+     SupportedData,
+     SupportedLogger,
+ )
+ from careamics.dataset.dataset_utils import reshape_array
+ from careamics.lightning import (
+     FCNModule,
+     HyperParametersCallback,
+     PredictDataModule,
+     ProgressBarCallback,
+     TrainDataModule,
+     create_predict_datamodule,
+ )
+ from careamics.model_io import export_to_bmz, load_pretrained
+ from careamics.prediction_utils import convert_outputs
+ from careamics.utils import check_path_exists, get_logger
+
+ logger = get_logger(__name__)
+
+ LOGGER_TYPES = Optional[Union[TensorBoardLogger, WandbLogger]]
+
+
+ class CAREamist:
+     """Main CAREamics class, allowing training and prediction using various algorithms.
+
+     Parameters
+     ----------
+     source : pathlib.Path or str or CAREamics Configuration
+         Path to a configuration file or a trained model.
+     work_dir : str, optional
+         Path to working directory in which to save checkpoints and logs,
+         by default None.
+     experiment_name : str, optional
+         Experiment name used for checkpoints, by default "CAREamics".
+     callbacks : list of Callback, optional
+         List of callbacks to use during training and prediction, by default None.
+
+     Attributes
+     ----------
+     model : CAREamicsModule
+         CAREamics model.
+     cfg : Configuration
+         CAREamics configuration.
+     trainer : Trainer
+         PyTorch Lightning trainer.
+     experiment_logger : TensorBoardLogger or WandbLogger
+         Experiment logger, "wandb" or "tensorboard".
+     work_dir : pathlib.Path
+         Working directory.
+     train_datamodule : TrainDataModule
+         Training datamodule.
+     pred_datamodule : PredictDataModule
+         Prediction datamodule.
+     """
+
+     @overload
+     def __init__(  # numpydoc ignore=GL08
+         self,
+         source: Union[Path, str],
+         work_dir: Optional[str] = None,
+         experiment_name: str = "CAREamics",
+         callbacks: Optional[list[Callback]] = None,
+     ) -> None: ...
+
+     @overload
+     def __init__(  # numpydoc ignore=GL08
+         self,
+         source: Configuration,
+         work_dir: Optional[str] = None,
+         experiment_name: str = "CAREamics",
+         callbacks: Optional[list[Callback]] = None,
+     ) -> None: ...
+
+     def __init__(
+         self,
+         source: Union[Path, str, Configuration],
+         work_dir: Optional[Union[Path, str]] = None,
+         experiment_name: str = "CAREamics",
+         callbacks: Optional[list[Callback]] = None,
+     ) -> None:
+         """
+         Initialize CAREamist with a configuration object or a path.
+
+         A configuration object can be created directly by calling `Configuration`,
+         using the configuration factory, or by loading a configuration from a yaml file.
+
+         A path can point either to a yaml file with parameters or to a saved checkpoint.
+
+         If no working directory is provided, the current working directory is used.
+
+         If `source` is a checkpoint, then `experiment_name` is used to name the
+         checkpoint, and is recorded in the configuration.
+
+         Parameters
+         ----------
+         source : pathlib.Path or str or CAREamics Configuration
+             Path to a configuration file or a trained model.
+         work_dir : str, optional
+             Path to working directory in which to save checkpoints and logs,
+             by default None.
+         experiment_name : str, optional
+             Experiment name used for checkpoints, by default "CAREamics".
+         callbacks : list of Callback, optional
+             List of callbacks to use during training and prediction, by default None.
+
+         Raises
+         ------
+         NotImplementedError
+             If the model is loaded from BioImage Model Zoo.
+         ValueError
+             If no hyperparameters are found in the checkpoint.
+         ValueError
+             If no data module hyperparameters are found in the checkpoint.
+         """
+         # select current working directory if work_dir is None
+         if work_dir is None:
+             self.work_dir = Path.cwd()
+             logger.warning(
+                 f"No working directory provided. Using current working directory: "
+                 f"{self.work_dir}."
+             )
+         else:
+             self.work_dir = Path(work_dir)
+
+         # configuration object
+         if isinstance(source, Configuration):
+             self.cfg = source
+
+             # instantiate model
+             if isinstance(self.cfg.algorithm_config, FCNAlgorithmConfig):
+                 self.model = FCNModule(
+                     algorithm_config=self.cfg.algorithm_config,
+                 )
+             else:
+                 raise NotImplementedError("Architecture not supported.")
+
+         # path to configuration file or model
+         else:
+             source = check_path_exists(source)
+
+             # configuration file
+             if source.is_file() and (
+                 source.suffix == ".yaml" or source.suffix == ".yml"
+             ):
+                 # load configuration
+                 self.cfg = load_configuration(source)
+
+                 # instantiate model
+                 if isinstance(self.cfg.algorithm_config, FCNAlgorithmConfig):
+                     self.model = FCNModule(
+                         algorithm_config=self.cfg.algorithm_config,
+                     )  # type: ignore
+                 else:
+                     raise NotImplementedError("Architecture not supported.")
+
+             # attempt loading a pre-trained model
+             else:
+                 self.model, self.cfg = load_pretrained(source)
+
+         # define the checkpoint saving callback
+         self._define_callbacks(callbacks)
+
+         # instantiate logger
+         if self.cfg.training_config.has_logger():
+             if self.cfg.training_config.logger == SupportedLogger.WANDB:
+                 self.experiment_logger: LOGGER_TYPES = WandbLogger(
+                     name=self.cfg.experiment_name,
+                     save_dir=self.work_dir / Path("logs"),
+                 )
+             elif self.cfg.training_config.logger == SupportedLogger.TENSORBOARD:
+                 self.experiment_logger = TensorBoardLogger(
+                     save_dir=self.work_dir / Path("logs"),
+                 )
+         else:
+             self.experiment_logger = None
+
+         # instantiate trainer
+         self.trainer = Trainer(
+             max_epochs=self.cfg.training_config.num_epochs,
+             callbacks=self.callbacks,
+             default_root_dir=self.work_dir,
+             logger=self.experiment_logger,
+         )
+
+         # placeholder for the datamodules
+         self.train_datamodule: Optional[TrainDataModule] = None
+         self.pred_datamodule: Optional[PredictDataModule] = None
+
+     def _define_callbacks(self, callbacks: Optional[list[Callback]] = None) -> None:
+         """Define the callbacks for the training loop.
+
+         Parameters
+         ----------
+         callbacks : list of Callback, optional
+             List of callbacks to use during training and prediction, by default None.
+         """
+         self.callbacks = [] if callbacks is None else callbacks
+
+         # check that user callbacks are not any of the CAREamics callbacks
+         for c in self.callbacks:
+             if isinstance(c, ModelCheckpoint) or isinstance(c, EarlyStopping):
+                 raise ValueError(
+                     "ModelCheckpoint and EarlyStopping callbacks are already defined "
+                     "in CAREamics and should only be modified through the "
+                     "training configuration (see TrainingConfig)."
+                 )
+
+             if isinstance(c, HyperParametersCallback) or isinstance(
+                 c, ProgressBarCallback
+             ):
+                 raise ValueError(
+                     "HyperParameter and ProgressBar callbacks are defined internally "
+                     "and should not be passed as callbacks."
+                 )
+
+         # checkpoint callback saves checkpoints during training
+         self.callbacks.extend(
+             [
+                 HyperParametersCallback(self.cfg),
+                 ModelCheckpoint(
+                     dirpath=self.work_dir / Path("checkpoints"),
+                     filename=self.cfg.experiment_name,
+                     **self.cfg.training_config.checkpoint_callback.model_dump(),
+                 ),
+                 ProgressBarCallback(),
+             ]
+         )
+
+         # early stopping callback
+         if self.cfg.training_config.early_stopping_callback is not None:
+             self.callbacks.append(
+                 EarlyStopping(self.cfg.training_config.early_stopping_callback)
+             )
+
+     # TODO: is there a more elegant way than calling train again after _train_on_path?
+     def train(
+         self,
+         *,
+         datamodule: Optional[TrainDataModule] = None,
+         train_source: Optional[Union[Path, str, NDArray]] = None,
+         val_source: Optional[Union[Path, str, NDArray]] = None,
+         train_target: Optional[Union[Path, str, NDArray]] = None,
+         val_target: Optional[Union[Path, str, NDArray]] = None,
+         use_in_memory: bool = True,
+         val_percentage: float = 0.1,
+         val_minimum_split: int = 1,
+     ) -> None:
+         """
+         Train the model on the provided data.
+
+         If a datamodule is provided, then training will be performed using it.
+         Alternatively, the training data can be provided as arrays or paths.
+
+         If `use_in_memory` is set to True, the source provided as Path or str will be
+         loaded in memory if it fits. Otherwise, training will be performed by loading
+         patches from the files one by one. Training on arrays is always performed
+         in memory.
+
+         If no validation source is provided, then the validation is extracted from
+         the training data using `val_percentage` and `val_minimum_split`. In the case
+         of data provided as Path or str, the percentage and minimum number are applied
+         to the number of files. For arrays, it is the number of patches.
+
+         Parameters
+         ----------
+         datamodule : TrainDataModule, optional
+             Datamodule to train on, by default None.
+         train_source : pathlib.Path or str or NDArray, optional
+             Train source, if no datamodule is provided, by default None.
+         val_source : pathlib.Path or str or NDArray, optional
+             Validation source, if no datamodule is provided, by default None.
+         train_target : pathlib.Path or str or NDArray, optional
+             Train target source, if no datamodule is provided, by default None.
+         val_target : pathlib.Path or str or NDArray, optional
+             Validation target source, if no datamodule is provided, by default None.
+         use_in_memory : bool, optional
+             Use in memory dataset if possible, by default True.
+         val_percentage : float, optional
+             Percentage of validation extracted from training data, by default 0.1.
+         val_minimum_split : int, optional
+             Minimum number of validation (patch or file) extracted from training data,
+             by default 1.
+
+         Raises
+         ------
+         ValueError
+             If both `datamodule` and `train_source` are provided.
+         ValueError
+             If sources are not of the same type (e.g. train is an array and val is
+             a Path).
+         ValueError
+             If the training target is provided to N2V.
+         ValueError
+             If neither a datamodule nor a source is provided.
+         """
+         if datamodule is not None and train_source is not None:
+             raise ValueError(
+                 "Only one of `datamodule` and `train_source` can be provided."
+             )
+
+         # check that inputs are the same type
+         source_types = {
+             type(s)
+             for s in (train_source, val_source, train_target, val_target)
+             if s is not None
+         }
+         if len(source_types) > 1:
+             raise ValueError("All sources should be of the same type.")
+
+         # train
+         if datamodule is not None:
+             self._train_on_datamodule(datamodule=datamodule)
+
+         else:
+             # raise error if target is provided to N2V
+             if self.cfg.algorithm_config.algorithm == SupportedAlgorithm.N2V.value:
+                 if train_target is not None:
+                     raise ValueError(
+                         "Training target not compatible with N2V training."
+                     )
+
+             # dispatch the training
+             if isinstance(train_source, np.ndarray):
+                 # mypy checks
+                 assert isinstance(val_source, np.ndarray) or val_source is None
+                 assert isinstance(train_target, np.ndarray) or train_target is None
+                 assert isinstance(val_target, np.ndarray) or val_target is None
+
+                 self._train_on_array(
+                     train_source,
+                     val_source,
+                     train_target,
+                     val_target,
+                     val_percentage,
+                     val_minimum_split,
+                 )
+
+             elif isinstance(train_source, Path) or isinstance(train_source, str):
+                 # mypy checks
+                 assert (
+                     isinstance(val_source, Path)
+                     or isinstance(val_source, str)
+                     or val_source is None
+                 )
+                 assert (
+                     isinstance(train_target, Path)
+                     or isinstance(train_target, str)
+                     or train_target is None
+                 )
+                 assert (
+                     isinstance(val_target, Path)
+                     or isinstance(val_target, str)
+                     or val_target is None
+                 )
+
+                 self._train_on_path(
+                     train_source,
+                     val_source,
+                     train_target,
+                     val_target,
+                     use_in_memory,
+                     val_percentage,
+                     val_minimum_split,
+                 )
+
+             else:
+                 raise ValueError(
+                     f"Invalid input, expected a str, Path, array or TrainDataModule "
+                     f"instance (got {type(train_source)})."
+                 )
+
+     def _train_on_datamodule(self, datamodule: TrainDataModule) -> None:
+         """
+         Train the model on the provided datamodule.
+
+         Parameters
+         ----------
+         datamodule : TrainDataModule
+             Datamodule to train on.
+         """
+         # record datamodule
+         self.train_datamodule = datamodule
+
+         self.trainer.fit(self.model, datamodule=datamodule)
+
+     def _train_on_array(
+         self,
+         train_data: NDArray,
+         val_data: Optional[NDArray] = None,
+         train_target: Optional[NDArray] = None,
+         val_target: Optional[NDArray] = None,
+         val_percentage: float = 0.1,
+         val_minimum_split: int = 5,
+     ) -> None:
+         """
+         Train the model on the provided data arrays.
+
+         Parameters
+         ----------
+         train_data : NDArray
+             Training data.
+         val_data : NDArray, optional
+             Validation data, by default None.
+         train_target : NDArray, optional
+             Train target data, by default None.
+         val_target : NDArray, optional
+             Validation target data, by default None.
+         val_percentage : float, optional
+             Percentage of patches to use for validation, by default 0.1.
+         val_minimum_split : int, optional
+             Minimum number of patches to use for validation, by default 5.
+         """
+         # create datamodule
+         datamodule = TrainDataModule(
+             data_config=self.cfg.data_config,
+             train_data=train_data,
+             val_data=val_data,
+             train_data_target=train_target,
+             val_data_target=val_target,
+             val_percentage=val_percentage,
+             val_minimum_split=val_minimum_split,
+         )
+
+         # train
+         self.train(datamodule=datamodule)
+
+     def _train_on_path(
+         self,
+         path_to_train_data: Union[Path, str],
+         path_to_val_data: Optional[Union[Path, str]] = None,
+         path_to_train_target: Optional[Union[Path, str]] = None,
+         path_to_val_target: Optional[Union[Path, str]] = None,
+         use_in_memory: bool = True,
+         val_percentage: float = 0.1,
+         val_minimum_split: int = 1,
+     ) -> None:
+         """
+         Train the model on the provided data paths.
+
+         Parameters
+         ----------
+         path_to_train_data : pathlib.Path or str
+             Path to the training data.
+         path_to_val_data : pathlib.Path or str, optional
+             Path to validation data, by default None.
+         path_to_train_target : pathlib.Path or str, optional
+             Path to train target data, by default None.
+         path_to_val_target : pathlib.Path or str, optional
+             Path to validation target data, by default None.
+         use_in_memory : bool, optional
+             Use in memory dataset if possible, by default True.
+         val_percentage : float, optional
+             Percentage of files to use for validation, by default 0.1.
+         val_minimum_split : int, optional
+             Minimum number of files to use for validation, by default 1.
+         """
+         # sanity check on data (path exists)
+         path_to_train_data = check_path_exists(path_to_train_data)
+
+         if path_to_val_data is not None:
+             path_to_val_data = check_path_exists(path_to_val_data)
+
+         if path_to_train_target is not None:
+             path_to_train_target = check_path_exists(path_to_train_target)
+
+         if path_to_val_target is not None:
+             path_to_val_target = check_path_exists(path_to_val_target)
+
+         # create datamodule
+         datamodule = TrainDataModule(
+             data_config=self.cfg.data_config,
+             train_data=path_to_train_data,
+             val_data=path_to_val_data,
+             train_data_target=path_to_train_target,
+             val_data_target=path_to_val_target,
+             use_in_memory=use_in_memory,
+             val_percentage=val_percentage,
+             val_minimum_split=val_minimum_split,
+         )
+
+         # train
+         self.train(datamodule=datamodule)
+
+     @overload
+     def predict(  # numpydoc ignore=GL08
+         self, source: PredictDataModule
+     ) -> Union[list[NDArray], NDArray]: ...
+
+     @overload
+     def predict(  # numpydoc ignore=GL08
+         self,
+         source: Union[Path, str],
+         *,
+         batch_size: int = 1,
+         tile_size: Optional[tuple[int, ...]] = None,
+         tile_overlap: tuple[int, ...] = (48, 48),
+         axes: Optional[str] = None,
+         data_type: Optional[Literal["tiff", "custom"]] = None,
+         tta_transforms: bool = True,
+         dataloader_params: Optional[dict] = None,
+         read_source_func: Optional[Callable] = None,
+         extension_filter: str = "",
+     ) -> Union[list[NDArray], NDArray]: ...
+
+     @overload
+     def predict(  # numpydoc ignore=GL08
+         self,
+         source: NDArray,
+         *,
+         batch_size: int = 1,
+         tile_size: Optional[tuple[int, ...]] = None,
+         tile_overlap: tuple[int, ...] = (48, 48),
+         axes: Optional[str] = None,
+         data_type: Optional[Literal["array"]] = None,
+         tta_transforms: bool = True,
+         dataloader_params: Optional[dict] = None,
+     ) -> Union[list[NDArray], NDArray]: ...
+
+     def predict(
+         self,
+         source: Union[PredictDataModule, Path, str, NDArray],
+         *,
+         batch_size: Optional[int] = None,
+         tile_size: Optional[tuple[int, ...]] = None,
+         tile_overlap: Optional[tuple[int, ...]] = (48, 48),
+         axes: Optional[str] = None,
+         data_type: Optional[Literal["array", "tiff", "custom"]] = None,
+         tta_transforms: bool = True,
+         dataloader_params: Optional[dict] = None,
+         read_source_func: Optional[Callable] = None,
+         extension_filter: str = "",
+         **kwargs: Any,
+     ) -> Union[list[NDArray], NDArray]:
+         """
+         Make predictions on the provided data.
+
+         Input can be a PredictDataModule instance, a path to a data file, or a numpy
+         array.
+
+         If `data_type`, `axes` and `tile_size` are not provided, the training
+         configuration parameters will be used, with the `patch_size` instead of
+         `tile_size`.
+
+         Test-time augmentation (TTA) can be switched off using the `tta_transforms`
+         parameter. TTA applies all possible flips and 90 degree rotations to the
+         prediction input and averages the predictions. TTA should not be used if you
+         did not train with these augmentations.
+
+         Note that if you are using a UNet model and tiling, the tile size must be
+         divisible in every dimension by 2**d, where d is the depth of the model. This
+         avoids artefacts arising from the broken shift invariance induced by the
+         pooling layers of the UNet. If your image is smaller along one dimension (as
+         may happen along Z), consider padding your image.
+
+         Parameters
+         ----------
+         source : PredictDataModule, pathlib.Path, str or numpy.ndarray
+             Data to predict on.
+         batch_size : int, default=1
+             Batch size for prediction.
+         tile_size : tuple of int, optional
+             Size of the tiles to use for prediction.
+         tile_overlap : tuple of int, default=(48, 48)
+             Overlap between tiles, can be None.
+         axes : str, optional
+             Axes of the input data, by default None.
+         data_type : {"array", "tiff", "custom"}, optional
+             Type of the input data.
+         tta_transforms : bool, default=True
+             Whether to apply test-time augmentation.
+         dataloader_params : dict, optional
+             Parameters to pass to the dataloader.
+         read_source_func : Callable, optional
+             Function to read the source data.
+         extension_filter : str, default=""
+             Filter for the file extension.
+         **kwargs : Any
+             Unused.
+
+         Returns
+         -------
+         list of NDArray or NDArray
+             Predictions made by the model.
+
+         Raises
+         ------
+         ValueError
+             If mean and std are not provided in the configuration.
+         ValueError
+             If tile size is not divisible by 2**depth for UNet models.
+         ValueError
+             If tile overlap is not specified.
+         """
+         if (
+             self.cfg.data_config.image_means is None
+             or self.cfg.data_config.image_stds is None
+         ):
+             raise ValueError("Mean and std must be provided in the configuration.")
+
+         # tile size for UNets
+         if tile_size is not None:
+             model = self.cfg.algorithm_config.model
+
+             if model.architecture == SupportedArchitecture.UNET.value:
+                 # tile size must be equal to k*2^n, where n is the number of pooling
+                 # layers (equal to the depth) and k is an integer
+                 depth = model.depth
+                 tile_increment = 2**depth
+
+                 for i, t in enumerate(tile_size):
+                     if t % tile_increment != 0:
+                         raise ValueError(
+                             f"Tile size must be divisible by {tile_increment} along "
+                             f"all axes (got {t} for axis {i}). If your image size is "
+                             f"smaller along one axis (e.g. Z), consider padding the "
+                             f"image."
+                         )
+
+             # tile overlaps must be specified
+             if tile_overlap is None:
+                 raise ValueError("Tile overlap must be specified.")
+
+         # create the prediction datamodule
+         self.pred_datamodule = create_predict_datamodule(
+             pred_data=source,
+             data_type=data_type or self.cfg.data_config.data_type,
+             axes=axes or self.cfg.data_config.axes,
+             image_means=self.cfg.data_config.image_means,
+             image_stds=self.cfg.data_config.image_stds,
+             tile_size=tile_size,
+             tile_overlap=tile_overlap,
+             batch_size=batch_size or self.cfg.data_config.batch_size,
+             tta_transforms=tta_transforms,
+             read_source_func=read_source_func,
+             extension_filter=extension_filter,
+             dataloader_params=dataloader_params,
+         )
+
+         # predict
+         predictions = self.trainer.predict(
+             model=self.model, datamodule=self.pred_datamodule
+         )
+         return convert_outputs(predictions, self.pred_datamodule.tiled)
+
+     def export_to_bmz(
+         self,
+         path_to_archive: Union[Path, str],
+         friendly_model_name: str,
+         input_array: NDArray,
+         authors: list[dict],
+         general_description: str = "",
+         channel_names: Optional[list[str]] = None,
+         data_description: Optional[str] = None,
+     ) -> None:
+         """Export the model to the BioImage Model Zoo format.
+
+         This method packages the current weights into a zip file that can be uploaded
+         to the BioImage Model Zoo. The archive consists of the model weights, the model
+         specifications and various files (inputs, outputs, README, env.yaml etc.).
+
+         `path_to_archive` should point to a file with a ".zip" extension.
+
+         `friendly_model_name` is the name used for the model in the BMZ specs
+         and website; it should consist of letters, numbers, dashes, underscores and
+         parentheses only.
+
+         Input array must be of the same dimensions as the axes recorded in the
+         configuration of the `CAREamist`.
+
+         Parameters
+         ----------
+         path_to_archive : pathlib.Path or str
+             Path in which to save the model, including file name, which should end with
+             ".zip".
+         friendly_model_name : str
+             Name of the model as used in the BMZ specs; it should consist of letters,
+             numbers, dashes, underscores and parentheses only.
+         input_array : NDArray
+             Input array used to validate the model and as an example.
+         authors : list of dict
+             List of authors of the model.
+         general_description : str
+             General description of the model, used in the metadata of the BMZ archive.
+         channel_names : list of str, optional
+             Channel names, by default None.
+         data_description : str, optional
+             Description of the data, by default None.
+         """
+         # TODO: add in docs that it is expected that input_array dimensions match
+         # those in data_config
+
+         output_patch = self.predict(
+             input_array,
+             data_type=SupportedData.ARRAY.value,
+             tta_transforms=False,
+         )
+         output = np.concatenate(output_patch, axis=0)
+         input_array = reshape_array(input_array, self.cfg.data_config.axes)
+
+         export_to_bmz(
+             model=self.model,
+             config=self.cfg,
+             path_to_archive=path_to_archive,
+             model_name=friendly_model_name,
+             general_description=general_description,
+             authors=authors,
+             input_array=input_array,
+             output_array=output,
+             channel_names=channel_names,
+             data_description=data_description,
+         )
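
For orientation, below is a minimal usage sketch of the CAREamist class added in this release, pieced together from the signatures and docstrings in the diff above. It is illustrative only: the configuration file name, array shape, author entry and output file names are placeholders, and whether training actually runs depends on the contents of the configuration.

import numpy as np

from careamics.careamist import CAREamist

# instantiate from a yaml configuration file (a Configuration object or a
# checkpoint path would also work); checkpoints and logs go to `work_dir`
careamist = CAREamist(source="n2v_config.yml", work_dir="runs")

# train on an in-memory array; with no `val_source`, a validation split is
# taken from the training patches via `val_percentage` / `val_minimum_split`
train_array = np.random.rand(512, 512).astype(np.float32)
careamist.train(train_source=train_array, val_percentage=0.1)

# tiled prediction; for UNet models each tile dimension must be divisible
# by 2**depth (see the predict() docstring above)
prediction = careamist.predict(
    source=train_array,
    tile_size=(256, 256),
    tile_overlap=(48, 48),
    tta_transforms=True,
)

# package the trained weights for the BioImage Model Zoo
careamist.export_to_bmz(
    path_to_archive="model.zip",
    friendly_model_name="my_model",
    input_array=train_array,
    authors=[{"name": "Jane Doe"}],
    general_description="Example export",
)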