careamics 0.0.4.2__py3-none-any.whl → 0.0.6__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of careamics might be problematic.
- careamics/__init__.py +17 -2
- careamics/careamist.py +239 -28
- careamics/cli/conf.py +19 -31
- careamics/cli/main.py +112 -12
- careamics/cli/utils.py +29 -0
- careamics/config/__init__.py +48 -24
- careamics/config/algorithms/__init__.py +15 -0
- careamics/config/algorithms/care_algorithm_model.py +50 -0
- careamics/config/algorithms/n2n_algorithm_model.py +42 -0
- careamics/config/algorithms/n2v_algorithm_model.py +35 -0
- careamics/config/algorithms/unet_algorithm_model.py +88 -0
- careamics/config/{vae_algorithm_model.py → algorithms/vae_algorithm_model.py} +26 -23
- careamics/config/architectures/__init__.py +1 -11
- careamics/config/architectures/architecture_model.py +3 -3
- careamics/config/architectures/lvae_model.py +109 -21
- careamics/config/architectures/unet_model.py +1 -0
- careamics/config/care_configuration.py +100 -0
- careamics/config/configuration.py +354 -0
- careamics/config/{configuration_factory.py → configuration_factories.py} +152 -81
- careamics/config/configuration_io.py +85 -0
- careamics/config/data/__init__.py +10 -0
- careamics/config/{data_model.py → data/data_model.py} +58 -198
- careamics/config/data/n2v_data_model.py +193 -0
- careamics/config/likelihood_model.py +8 -8
- careamics/config/loss_model.py +56 -0
- careamics/config/n2n_configuration.py +101 -0
- careamics/config/n2v_configuration.py +266 -0
- careamics/config/nm_model.py +24 -25
- careamics/config/support/__init__.py +7 -7
- careamics/config/support/supported_algorithms.py +0 -3
- careamics/config/support/supported_architectures.py +0 -4
- careamics/config/transformations/__init__.py +10 -4
- careamics/config/transformations/transform_model.py +3 -3
- careamics/config/transformations/transform_unions.py +42 -0
- careamics/config/validators/validator_utils.py +3 -3
- careamics/dataset/__init__.py +2 -2
- careamics/dataset/dataset_utils/__init__.py +3 -3
- careamics/dataset/dataset_utils/dataset_utils.py +4 -6
- careamics/dataset/dataset_utils/file_utils.py +9 -9
- careamics/dataset/dataset_utils/iterate_over_files.py +4 -3
- careamics/dataset/dataset_utils/running_stats.py +22 -23
- careamics/dataset/in_memory_dataset.py +11 -12
- careamics/dataset/iterable_dataset.py +4 -4
- careamics/dataset/iterable_pred_dataset.py +2 -1
- careamics/dataset/iterable_tiled_pred_dataset.py +2 -1
- careamics/dataset/patching/random_patching.py +11 -10
- careamics/dataset/patching/sequential_patching.py +26 -26
- careamics/dataset/patching/validate_patch_dimension.py +3 -3
- careamics/dataset/tiling/__init__.py +2 -2
- careamics/dataset/tiling/collate_tiles.py +3 -3
- careamics/dataset/tiling/lvae_tiled_patching.py +2 -1
- careamics/dataset/tiling/tiled_patching.py +11 -10
- careamics/file_io/__init__.py +5 -5
- careamics/file_io/read/__init__.py +1 -1
- careamics/file_io/read/get_func.py +2 -2
- careamics/file_io/write/__init__.py +2 -2
- careamics/lightning/__init__.py +5 -5
- careamics/lightning/callbacks/__init__.py +1 -1
- careamics/lightning/callbacks/prediction_writer_callback/__init__.py +3 -3
- careamics/lightning/callbacks/prediction_writer_callback/prediction_writer_callback.py +2 -1
- careamics/lightning/callbacks/prediction_writer_callback/write_strategy.py +2 -1
- careamics/lightning/callbacks/progress_bar_callback.py +2 -2
- careamics/lightning/lightning_module.py +69 -34
- careamics/lightning/train_data_module.py +41 -27
- careamics/losses/__init__.py +3 -3
- careamics/losses/loss_factory.py +1 -85
- careamics/losses/lvae/losses.py +223 -164
- careamics/lvae_training/calibration.py +184 -0
- careamics/lvae_training/dataset/config.py +2 -2
- careamics/lvae_training/dataset/multich_dataset.py +11 -19
- careamics/lvae_training/dataset/multifile_dataset.py +3 -2
- careamics/lvae_training/dataset/types.py +15 -26
- careamics/lvae_training/dataset/utils/index_manager.py +4 -4
- careamics/lvae_training/eval_utils.py +125 -213
- careamics/model_io/__init__.py +1 -1
- careamics/model_io/bioimage/__init__.py +1 -1
- careamics/model_io/bioimage/_readme_factory.py +26 -34
- careamics/model_io/bioimage/cover_factory.py +171 -0
- careamics/model_io/bioimage/model_description.py +56 -34
- careamics/model_io/bmz_io.py +42 -42
- careamics/model_io/model_io_utils.py +9 -9
- careamics/models/layers.py +22 -20
- careamics/models/lvae/layers.py +348 -975
- careamics/models/lvae/likelihoods.py +10 -8
- careamics/models/lvae/lvae.py +214 -275
- careamics/models/lvae/noise_models.py +179 -112
- careamics/models/lvae/stochastic.py +393 -0
- careamics/models/lvae/utils.py +82 -73
- careamics/models/model_factory.py +2 -15
- careamics/models/unet.py +8 -8
- careamics/prediction_utils/__init__.py +1 -1
- careamics/prediction_utils/prediction_outputs.py +15 -15
- careamics/prediction_utils/stitch_prediction.py +6 -6
- careamics/transforms/__init__.py +5 -5
- careamics/transforms/compose.py +13 -13
- careamics/transforms/n2v_manipulate.py +3 -3
- careamics/transforms/pixel_manipulation.py +9 -9
- careamics/transforms/xy_random_rotate90.py +4 -4
- careamics/utils/__init__.py +5 -5
- careamics/utils/context.py +2 -1
- careamics/utils/lightning_utils.py +57 -0
- careamics/utils/logging.py +11 -10
- careamics/utils/serializers.py +2 -0
- careamics/utils/torch_utils.py +8 -8
- {careamics-0.0.4.2.dist-info → careamics-0.0.6.dist-info}/METADATA +16 -13
- careamics-0.0.6.dist-info/RECORD +176 -0
- {careamics-0.0.4.2.dist-info → careamics-0.0.6.dist-info}/WHEEL +1 -1
- careamics/config/architectures/custom_model.py +0 -162
- careamics/config/architectures/register_model.py +0 -103
- careamics/config/configuration_model.py +0 -603
- careamics/config/fcn_algorithm_model.py +0 -152
- careamics/config/references/__init__.py +0 -45
- careamics/config/references/algorithm_descriptions.py +0 -132
- careamics/config/references/references.py +0 -39
- careamics/config/transformations/transform_union.py +0 -20
- careamics-0.0.4.2.dist-info/RECORD +0 -165
- {careamics-0.0.4.2.dist-info → careamics-0.0.6.dist-info}/entry_points.txt +0 -0
- {careamics-0.0.4.2.dist-info → careamics-0.0.6.dist-info}/licenses/LICENSE +0 -0
careamics/losses/lvae/losses.py
CHANGED
@@ -2,7 +2,7 @@
 
 from __future__ import annotations
 
-from typing import TYPE_CHECKING, Any, Optional, Union
+from typing import TYPE_CHECKING, Any, Literal, Optional, Union
 
 import numpy as np
 import torch
@@ -13,20 +13,19 @@ from careamics.models.lvae.likelihoods import (
     LikelihoodModule,
     NoiseModelLikelihood,
 )
-from careamics.models.lvae.utils import compute_batch_mean
 
 if TYPE_CHECKING:
-    from careamics.
+    from careamics.config import LVAELossConfig
 
 Likelihood = Union[LikelihoodModule, GaussianLikelihood, NoiseModelLikelihood]
 
 
 def get_reconstruction_loss(
-    reconstruction: torch.Tensor,
+    reconstruction: torch.Tensor,
     target: torch.Tensor,
     likelihood_obj: Likelihood,
 ) -> dict[str, torch.Tensor]:
-    """Compute the reconstruction loss.
+    """Compute the reconstruction loss (negative log-likelihood).
 
     Parameters
     ----------
@@ -42,65 +41,15 @@ def get_reconstruction_loss(
 
     Returns
     -------
-
-
-        individual output channels `["ch{i}_loss"]`.
+    torch.Tensor
+        The recontruction loss (negative log-likelihood).
     """
-    loss_dict = _get_reconstruction_loss_vector(
-        reconstruction=reconstruction,
-        target=target,
-        likelihood_obj=likelihood_obj,
-    )
-
-    loss_dict["loss"] = loss_dict["loss"].sum() / len(reconstruction)
-    for i in range(1, 1 + target.shape[1]):
-        key = f"ch{i}_loss"
-        loss_dict[key] = loss_dict[key].sum() / len(reconstruction)
-
-    return loss_dict
-
-
-def _get_reconstruction_loss_vector(
-    reconstruction: torch.Tensor,  # TODO: naming -> predictions?
-    target: torch.Tensor,
-    likelihood_obj: LikelihoodModule,
-) -> dict[str, torch.Tensor]:
-    """Compute the reconstruction loss.
-
-    Parameters
-    ----------
-    return_predicted_img: bool
-        If set to `True`, the besides the loss, the reconstructed image is returned.
-        Default is `False`.
-
-    Returns
-    -------
-    dict[str, torch.Tensor]
-        A dictionary containing the overall loss `["loss"]` and the loss for
-        individual output channels `["ch{i}_loss"]`. Shape of individual
-        tensors is (B, ).
-    """
-    output = {"loss": None}
-    for i in range(1, 1 + target.shape[1]):
-        output[f"ch{i}_loss"] = None
-
     # Compute Log likelihood
     ll, _ = likelihood_obj(reconstruction, target)  # shape: (B, C, [Z], Y, X)
-
-    output = {"loss": compute_batch_mean(-1 * ll)}  # shape: (B, )
-    if ll.shape[1] > 1:  # target_ch > 1
-        for i in range(1, 1 + target.shape[1]):
-            output[f"ch{i}_loss"] = compute_batch_mean(-ll[:, i - 1])  # shape: (B, )
-    else:  # target_ch == 1
-        # TODO: hacky!!! Refactor this
-        assert ll.shape[1] == 1
-        output["ch1_loss"] = output["loss"]
-        output["ch2_loss"] = output["loss"]
-
-    return output
+    return -1 * ll.mean()
 
 
-def reconstruction_loss_musplit_denoisplit(
+def _reconstruction_loss_musplit_denoisplit(
     predictions: Union[torch.Tensor, tuple[torch.Tensor, torch.Tensor]],
     targets: torch.Tensor,
     nm_likelihood: NoiseModelLikelihood,
@@ -137,62 +86,120 @@ def reconstruction_loss_musplit_denoisplit(
     recons_loss : torch.Tensor
         The reconstruction loss. Shape is (1, ).
     """
-    # TODO: refactor this function to make it closer to `get_reconstruction_loss`
-    # (or viceversa)
     if predictions.shape[1] == 2 * targets.shape[1]:
         # predictions contain both mean and log-variance
-
+        pred_mean, _ = predictions.chunk(2, dim=1)
     else:
-
+        pred_mean = predictions
+
+    recons_loss_nm = get_reconstruction_loss(
+        reconstruction=pred_mean, target=targets, likelihood_obj=nm_likelihood
+    )
+
+    recons_loss_gm = get_reconstruction_loss(
+        reconstruction=predictions,
+        target=targets,
+        likelihood_obj=gaussian_likelihood,
+    )
 
-    recons_loss_nm = -1 * nm_likelihood(out_mean, targets)[0].mean()
-    recons_loss_gm = -1 * gaussian_likelihood(predictions, targets)[0].mean()
     recons_loss = nm_weight * recons_loss_nm + gaussian_weight * recons_loss_gm
     return recons_loss
 
 
-def
-
+def get_kl_divergence_loss(
+    kl_type: Literal["kl", "kl_restricted"],
+    topdown_data: dict[str, torch.Tensor],
+    rescaling: Literal["latent_dim", "image_dim"],
+    aggregation: Literal["mean", "sum"],
+    free_bits_coeff: float,
+    img_shape: Optional[tuple[int]] = None,
 ) -> torch.Tensor:
-    """Compute the KL divergence loss
+    """Compute the KL divergence loss.
+
+    NOTE: Description of `rescaling` methods:
+    - If "latent_dim", the KL-loss values are rescaled w.r.t. the latent space
+    dimensions (spatial + number of channels, i.e., (C, [Z], Y, X)). In this way they
+    have the same magnitude across layers.
+    - If "image_dim", the KL-loss values are rescaled w.r.t. the input image spatial
+    dimensions. In this way, the lower layers have a larger KL-loss value compared to
+    the higher layers, since the latent space and hence the KL tensor has more entries.
+    Specifically, at hierarchy `i`, the total KL loss is larger by a factor (128/i**2).
+
+    NOTE: the type of `aggregation` determines the magnitude of the KL-loss. Clearly,
+    "sum" aggregation results in a larger KL-loss value compared to "mean" by a factor
+    of `n_layers`.
+
+    NOTE: recall that sample-wise KL is obtained by summing over all dimensions,
+    including Z. Also recall that in current 3D implementation of LVAE, no downsampling
+    is done on Z. Therefore, to avoid emphasizing KL loss too much, we divide it
+    by the Z dimension of input image in every case.
 
     Parameters
     ----------
-
+    kl_type : Literal["kl", "kl_restricted"]
+        The type of KL divergence loss to compute.
+    topdown_data : dict[str, torch.Tensor]
         A dictionary containing information computed for each layer during the top-down
         pass. The dictionary must include the following keys:
         - "kl": The KL-loss values for each layer. Shape of each tensor is (B,).
        - "z": The sampled latents for each layer. Shape of each tensor is
        (B, layers, `z_dims[i]`, H, W).
-
-    The
-
-
+    rescaling : Literal["latent_dim", "image_dim"]
+        The rescaling method used for the KL-loss values. If "latent_dim", the KL-loss
+        values are rescaled w.r.t. the latent space dimensions (spatial + number of
+        channels, i.e., (C, [Z], Y, X)). If "image_dim", the KL-loss values are
+        rescaled w.r.t. the input image spatial dimensions.
+    aggregation : Literal["mean", "sum"]
+        The aggregation method used to combine the KL-loss values across layers. If
+        "mean", the KL-loss values are averaged across layers. If "sum", the KL-loss
+        values are summed across layers.
+    free_bits_coeff : float
+        The free bits coefficient used for the KL-loss computation.
+    img_shape : Optional[tuple[int]]
+        The shape of the input image to the LVAE model. Shape is ([Z], Y, X).
+
+    Returns
+    -------
+    kl_loss : torch.Tensor
+        The KL divergence loss. Shape is (1, ).
     """
     kl = torch.cat(
-        [kl_layer.unsqueeze(1) for kl_layer in topdown_data[
+        [kl_layer.unsqueeze(1) for kl_layer in topdown_data[kl_type]],
+        dim=1,
     )  # shape: (B, n_layers)
-    # NOTE: Values are sum() and so are of the order 30000
 
-
-
-    # NOTE: we want to normalize the KL-loss w.r.t. the latent space dimensions,
-    # i.e., the number of entries in the latent space tensors (C, [Z], Y, X).
-    # We assume z has shape (B, C, [Z], Y, X), where `C = z_dims[i]`.
-        norm_factor = np.prod(topdown_data["z"][i].shape[1:])
-        kl[:, i] = kl[:, i] / norm_factor
+    # Apply free bits (& batch average)
+    kl = free_bits_kl(kl, free_bits_coeff)  # shape: (n_layers,)
 
-
-    #
-
+    # In 3D case, rescale by Z dim
+    # TODO If we have downsampling in Z dimension, then this needs to change.
+    if len(img_shape) == 3:
+        kl = kl / img_shape[0]
 
+    # Rescaling
+    if rescaling == "latent_dim":
+        for i in range(len(kl)):
+            latent_dim = topdown_data["z"][i].shape[1:]
+            norm_factor = np.prod(latent_dim)
+            kl[i] = kl[i] / norm_factor
+    elif rescaling == "image_dim":
+        kl = kl / np.prod(img_shape[-2:])
 
-
+    # Aggregation
+    if aggregation == "mean":
+        kl = kl.mean()  # shape: (1,)
+    elif aggregation == "sum":
+        kl = kl.sum()  # shape: (1,)
+
+    return kl
+
+
+def _get_kl_divergence_loss_musplit(
     topdown_data: dict[str, torch.Tensor],
     img_shape: tuple[int],
-
+    kl_type: Literal["kl", "kl_restricted"],
 ) -> torch.Tensor:
-    """Compute the KL divergence loss for
+    """Compute the KL divergence loss for muSplit.
 
     Parameters
     ----------
@@ -204,32 +211,57 @@ def get_kl_divergence_loss_denoisplit(
        (B, layers, `z_dims[i]`, H, W).
    img_shape : tuple[int]
        The shape of the input image to the LVAE model. Shape is ([Z], Y, X).
-
-    The
-        To choose among ["kl", "kl_restricted", "kl_spatial", "kl_channelwise"]
-        Default is "kl"
+    kl_type : Literal["kl", "kl_restricted"]
+        The type of KL divergence loss to compute.
 
-
+    Returns
+    -------
+    kl_loss : torch.Tensor
+        The KL divergence loss for the muSplit case. Shape is (1, ).
     """
-
-
-
+    return get_kl_divergence_loss(
+        kl_type="kl",  # TODO: hardcoded, deal in future PR
+        topdown_data=topdown_data,
+        rescaling="latent_dim",
+        aggregation="mean",
+        free_bits_coeff=0.0,
+        img_shape=img_shape,
    )
 
-    kl_loss = free_bits_kl(kl, 1.0).sum()
-    # NOTE: as compared to uSplit kl divergence, this KL loss is larger by a factor of
-    # `n_layers` since we sum KL contributions from different layers instead of taking
-    # the mean.
 
-
-
-
-
-
+def _get_kl_divergence_loss_denoisplit(
+    topdown_data: dict[str, torch.Tensor],
+    img_shape: tuple[int],
+    kl_type: Literal["kl", "kl_restricted"],
+) -> torch.Tensor:
+    """Compute the KL divergence loss for denoiSplit.
 
-
-
-
+    Parameters
+    ----------
+    topdown_data : dict[str, torch.Tensor]
+        A dictionary containing information computed for each layer during the top-down
+        pass. The dictionary must include the following keys:
+        - "kl": The KL-loss values for each layer. Shape of each tensor is (B,).
+        - "z": The sampled latents for each layer. Shape of each tensor is
+        (B, layers, `z_dims[i]`, H, W).
+    img_shape : tuple[int]
+        The shape of the input image to the LVAE model. Shape is ([Z], Y, X).
+    kl_type : Literal["kl", "kl_restricted"]
+        The type of KL divergence loss to compute.
+
+    Returns
+    -------
+    kl_loss : torch.Tensor
+        The KL divergence loss for the denoiSplit case. Shape is (1, ).
+    """
+    return get_kl_divergence_loss(
+        kl_type=kl_type,
+        topdown_data=topdown_data,
+        rescaling="image_dim",
+        aggregation="sum",
+        free_bits_coeff=1.0,
+        img_shape=img_shape,
+    )
 
 
 # TODO: @melisande-c suggested to refactor this as a class (see PR #208)
@@ -240,7 +272,9 @@ def get_kl_divergence_loss_denoisplit(
 def musplit_loss(
     model_outputs: tuple[torch.Tensor, dict[str, Any]],
     targets: torch.Tensor,
-
+    config: LVAELossConfig,
+    gaussian_likelihood: Optional[GaussianLikelihood],
+    noise_model_likelihood: Optional[NoiseModelLikelihood] = None,  # TODO: ugly
 ) -> Optional[dict[str, torch.Tensor]]:
     """Loss function for muSplit.
 
@@ -252,9 +286,13 @@ def musplit_loss(
     targets : torch.Tensor
         The target image used to compute the reconstruction loss. Shape is
         (B, `target_ch`, [Z], Y, X).
-
-    The
+    config : LVAELossConfig
+        The config for loss function (e.g., KL hyperparameters, likelihood module,
        noise model, etc.).
+    gaussian_likelihood : GaussianLikelihood
+        The Gaussian likelihood object.
+    noise_model_likelihood : Optional[NoiseModelLikelihood]
+        The noise model likelihood object. Not used here.
 
     Returns
     -------
@@ -262,27 +300,35 @@ def musplit_loss(
        A dictionary containing the overall loss `["loss"]`, the reconstruction loss
        `["reconstruction_loss"]`, and the KL divergence loss `["kl_loss"]`.
     """
+    assert gaussian_likelihood is not None
+
     predictions, td_data = model_outputs
 
     # Reconstruction loss computation
-
+    recons_loss = config.reconstruction_weight * get_reconstruction_loss(
         reconstruction=predictions,
         target=targets,
-        likelihood_obj=
+        likelihood_obj=gaussian_likelihood,
     )
-    recons_loss = recons_loss_dict["loss"] * loss_parameters.reconstruction_weight
     if torch.isnan(recons_loss).any():
         recons_loss = 0.0
 
     # KL loss computation
     kl_weight = get_kl_weight(
-
-
-
-
-
+        config.kl_params.annealing,
+        config.kl_params.start,
+        config.kl_params.annealtime,
+        config.kl_weight,
+        config.kl_params.current_epoch,
+    )
+    kl_loss = (
+        _get_kl_divergence_loss_musplit(
+            topdown_data=td_data,
+            img_shape=targets.shape[2:],
+            kl_type=config.kl_params.loss_type,
+        )
+        * kl_weight
     )
-    kl_loss = kl_weight * get_kl_divergence_loss_usplit(td_data)
 
     net_loss = recons_loss + kl_loss
     output = {
@@ -304,7 +350,9 @@ def musplit_loss(
 def denoisplit_loss(
     model_outputs: tuple[torch.Tensor, dict[str, Any]],
     targets: torch.Tensor,
-
+    config: LVAELossConfig,
+    gaussian_likelihood: Optional[GaussianLikelihood] = None,
+    noise_model_likelihood: Optional[NoiseModelLikelihood] = None,
 ) -> Optional[dict[str, torch.Tensor]]:
     """Loss function for DenoiSplit.
 
@@ -316,9 +364,12 @@ def denoisplit_loss(
     targets : torch.Tensor
         The target image used to compute the reconstruction loss. Shape is
         (B, `target_ch`, [Z], Y, X).
-
-    The
-
+    config : LVAELossConfig
+        The config for loss function containing all loss hyperparameters.
+    gaussian_likelihood : GaussianLikelihood
+        The Gaussian likelihood object.
+    noise_model_likelihood : NoiseModelLikelihood
+        The noise model likelihood object.
 
     Returns
     -------
@@ -326,33 +377,35 @@ def denoisplit_loss(
        A dictionary containing the overall loss `["loss"]`, the reconstruction loss
        `["reconstruction_loss"]`, and the KL divergence loss `["kl_loss"]`.
     """
+    assert noise_model_likelihood is not None
+
     predictions, td_data = model_outputs
 
     # Reconstruction loss computation
-
+    recons_loss = config.reconstruction_weight * get_reconstruction_loss(
         reconstruction=predictions,
         target=targets,
-        likelihood_obj=
+        likelihood_obj=noise_model_likelihood,
     )
-    recons_loss = recons_loss_dict["loss"] * loss_parameters.reconstruction_weight
     if torch.isnan(recons_loss).any():
         recons_loss = 0.0
 
     # KL loss computation
-
-
-
-
-
-
-
-
-
-    )
-    kl_loss = kl_weight * get_kl_divergence_loss_denoisplit(
+    kl_weight = get_kl_weight(
+        config.kl_params.annealing,
+        config.kl_params.start,
+        config.kl_params.annealtime,
+        config.kl_weight,
+        config.kl_params.current_epoch,
+    )
+    kl_loss = (
+        _get_kl_divergence_loss_denoisplit(
            topdown_data=td_data,
-        img_shape=targets.shape[2:],
+            img_shape=targets.shape[2:],
+            kl_type=config.kl_params.loss_type,
        )
+        * kl_weight
+    )
 
     net_loss = recons_loss + kl_loss
     output = {
@@ -374,7 +427,9 @@ def denoisplit_loss(
 def denoisplit_musplit_loss(
     model_outputs: tuple[torch.Tensor, dict[str, Any]],
     targets: torch.Tensor,
-
+    config: LVAELossConfig,
+    gaussian_likelihood: GaussianLikelihood,
+    noise_model_likelihood: NoiseModelLikelihood,
 ) -> Optional[dict[str, torch.Tensor]]:
     """Loss function for DenoiSplit.
 
@@ -386,9 +441,12 @@ def denoisplit_musplit_loss(
     targets : torch.Tensor
         The target image used to compute the reconstruction loss. Shape is
         (B, `target_ch`, [Z], Y, X).
-
-    The
-
+    config : LVAELossConfig
+        The config for loss function containing all loss hyperparameters.
+    gaussian_likelihood : GaussianLikelihood
+        The Gaussian likelihood object.
+    noise_model_likelihood : NoiseModelLikelihood
+        The noise model likelihood object.
 
     Returns
     -------
@@ -399,34 +457,35 @@ def denoisplit_musplit_loss(
     predictions, td_data = model_outputs
 
     # Reconstruction loss computation
-    recons_loss =
+    recons_loss = _reconstruction_loss_musplit_denoisplit(
         predictions=predictions,
         targets=targets,
-        nm_likelihood=
-        gaussian_likelihood=
-        nm_weight=
-        gaussian_weight=
+        nm_likelihood=noise_model_likelihood,
+        gaussian_likelihood=gaussian_likelihood,
+        nm_weight=config.denoisplit_weight,
+        gaussian_weight=config.musplit_weight,
     )
     if torch.isnan(recons_loss).any():
         recons_loss = 0.0
 
     # KL loss computation
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
+    # NOTE: 'kl' key stands for the 'kl_samplewise' key in the TopDownLayer class.
+    # The different naming comes from `top_down_pass()` method in the LadderVAE.
+    denoisplit_kl = _get_kl_divergence_loss_denoisplit(
+        topdown_data=td_data,
+        img_shape=targets.shape[2:],
+        kl_type=config.kl_params.loss_type,
+    )
+    musplit_kl = _get_kl_divergence_loss_musplit(
+        topdown_data=td_data,
+        img_shape=targets.shape[2:],
+        kl_type=config.kl_params.loss_type,
+    )
+    kl_loss = (
+        config.denoisplit_weight * denoisplit_kl + config.musplit_weight * musplit_kl
+    )
+    # TODO `kl_weight` is hardcoded (???)
+    kl_loss = config.kl_weight * kl_loss
 
     net_loss = recons_loss + kl_loss
     output = {