reflectorch 1.2.1__py3-none-any.whl → 1.4.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (41)
  1. reflectorch/data_generation/__init__.py +4 -0
  2. reflectorch/data_generation/dataset.py +27 -7
  3. reflectorch/data_generation/noise.py +115 -9
  4. reflectorch/data_generation/priors/parametric_models.py +91 -16
  5. reflectorch/data_generation/priors/parametric_subpriors.py +28 -7
  6. reflectorch/data_generation/priors/sampler_strategies.py +67 -3
  7. reflectorch/data_generation/q_generator.py +97 -43
  8. reflectorch/data_generation/reflectivity/__init__.py +53 -11
  9. reflectorch/data_generation/reflectivity/kinematical.py +4 -5
  10. reflectorch/data_generation/reflectivity/smearing.py +25 -10
  11. reflectorch/data_generation/reflectivity/smearing_pointwise.py +110 -0
  12. reflectorch/data_generation/smearing.py +42 -11
  13. reflectorch/data_generation/utils.py +93 -18
  14. reflectorch/extensions/refnx/refnx_conversion.py +77 -0
  15. reflectorch/inference/inference_model.py +795 -159
  16. reflectorch/inference/loading_data.py +37 -0
  17. reflectorch/inference/plotting.py +517 -0
  18. reflectorch/inference/preprocess_exp/interpolation.py +5 -2
  19. reflectorch/inference/scipy_fitter.py +98 -7
  20. reflectorch/ml/__init__.py +2 -0
  21. reflectorch/ml/basic_trainer.py +18 -6
  22. reflectorch/ml/callbacks.py +5 -4
  23. reflectorch/ml/loggers.py +25 -0
  24. reflectorch/ml/schedulers.py +116 -0
  25. reflectorch/ml/trainers.py +131 -23
  26. reflectorch/models/__init__.py +2 -1
  27. reflectorch/models/encoders/__init__.py +2 -2
  28. reflectorch/models/encoders/conv_encoder.py +54 -40
  29. reflectorch/models/encoders/fno.py +23 -16
  30. reflectorch/models/encoders/integral_kernel_embedding.py +390 -0
  31. reflectorch/models/networks/__init__.py +2 -0
  32. reflectorch/models/networks/mlp_networks.py +331 -153
  33. reflectorch/models/networks/residual_net.py +31 -5
  34. reflectorch/runs/train.py +0 -1
  35. reflectorch/runs/utils.py +48 -11
  36. reflectorch/utils.py +30 -0
  37. {reflectorch-1.2.1.dist-info → reflectorch-1.4.0.dist-info}/METADATA +20 -17
  38. {reflectorch-1.2.1.dist-info → reflectorch-1.4.0.dist-info}/RECORD +41 -36
  39. {reflectorch-1.2.1.dist-info → reflectorch-1.4.0.dist-info}/WHEEL +1 -1
  40. {reflectorch-1.2.1.dist-info → reflectorch-1.4.0.dist-info/licenses}/LICENSE.txt +0 -0
  41. {reflectorch-1.2.1.dist-info → reflectorch-1.4.0.dist-info}/top_level.txt +0 -0

reflectorch/models/encoders/conv_encoder.py
@@ -11,7 +11,6 @@ __all__ = [
     "ConvEncoder",
     "ConvDecoder",
     "ConvAutoencoder",
-    "ConvVAE",
 ]
 
 logger = logging.getLogger(__name__)
@@ -23,7 +22,7 @@ class ConvEncoder(nn.Module):
     Args:
         in_channels (int, optional): the number of input channels. Defaults to 1.
         hidden_channels (tuple, optional): the number of intermediate channels of each convolutional layer. Defaults to (32, 64, 128, 256, 512).
-        dim_latent (int, optional): the dimension of the output latent embedding. Defaults to 64.
+        dim_embedding (int, optional): the dimension of the output latent embedding. Defaults to 64.
         dim_avpool (int, optional): the output size of the adaptive average pooling layer. Defaults to 1.
         use_batch_norm (bool, optional): whether to use batch normalization. Defaults to True.
         activation (str, optional): the type of activation function. Defaults to 'relu'.
@@ -31,9 +30,11 @@
     def __init__(self,
                  in_channels: int = 1,
                  hidden_channels: tuple = (32, 64, 128, 256, 512),
-                 dim_latent: int = 64,
+                 kernel_size: int = 3,
+                 dim_embedding: int = 64,
                  dim_avpool: int = 1,
                  use_batch_norm: bool = True,
+                 use_se: bool = False,
                  activation: str = 'relu',
                  ):
         super().__init__()
@@ -44,22 +45,24 @@
 
         for h in hidden_channels:
             layers = [
-                nn.Conv1d(in_channels, out_channels=h, kernel_size=3, stride=2, padding=1),
+                nn.Conv1d(in_channels, out_channels=h, kernel_size=kernel_size, stride=2, padding=kernel_size // 2),
                 activation(),
             ]
 
             if use_batch_norm:
                 layers.insert(1, nn.BatchNorm1d(h))
 
+            if use_se:
+                layers.insert(2, SEBlock(h))
+
             modules.append(nn.Sequential(*layers))
             in_channels = h
 
         self.core = nn.Sequential(*modules)
         self.avpool = nn.AdaptiveAvgPool1d(dim_avpool)
-        self.fc = nn.Linear(hidden_channels[-1] * dim_avpool, dim_latent)
+        self.fc = nn.Linear(hidden_channels[-1] * dim_avpool, dim_embedding)
 
     def forward(self, x):
-        """"""
         if len(x.shape) < 3:
             x = x.unsqueeze(1)
         x = self.core(x)
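
The new padding rule above generalises the previous hard-coded pair (kernel_size=3, padding=1): with padding = kernel_size // 2 and stride 2, the output length is floor((L + 2*(k // 2) - k) / 2) + 1, which for any odd k reduces to floor((L - 1) / 2) + 1, so each stage still halves the input. A quick sketch checking this (illustrative values only):

import torch
from torch import nn

x = torch.randn(4, 1, 128)
for k in (3, 5, 7):
    conv = nn.Conv1d(1, 8, kernel_size=k, stride=2, padding=k // 2)
    # every odd kernel size halves the length: torch.Size([4, 8, 64])
    print(k, conv(x).shape)
# an even kernel size would break the invariant (k=4 gives length 65)
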
@@ -100,6 +103,7 @@ class ConvDecoder(nn.Module):
                  hidden_channels: tuple = (512, 256, 128, 64, 32),
                  dim_latent: int = 64,
                  in_size: int = 8,
+                 kernel_size: int = 3,
                  use_batch_norm: bool = True,
                  activation: str = 'relu',
                  ):
@@ -119,9 +123,9 @@
                 nn.ConvTranspose1d(
                     hidden_channels[i],
                     hidden_channels[i + 1],
-                    kernel_size=3,
+                    kernel_size=kernel_size, #3
                     stride=2,
-                    padding=1,
+                    padding=kernel_size // 2, #1
                     output_padding=1,
                 ),
                 nn.BatchNorm1d(hidden_channels[i + 1]) if use_batch_norm else nn.Identity(),
@@ -134,9 +138,9 @@
         self.final_layer = nn.Sequential(
             nn.ConvTranspose1d(hidden_channels[-1],
                                hidden_channels[-1],
-                               kernel_size=3,
+                               kernel_size=kernel_size, #3
                                stride=2,
-                               padding=1,
+                               padding=kernel_size // 2, #1
                                output_padding=1),
             nn.BatchNorm1d(hidden_channels[-1]) if use_batch_norm else nn.Identity(),
             activation(),
@@ -160,46 +164,56 @@ class ConvAutoencoder(nn.Module):
                  decoder_hidden_channels: tuple = (512, 256, 128, 64, 32),
                  dim_latent: int = 64,
                  dim_avpool: int = 1,
+                 kernel_size: int = 3,
                  use_batch_norm: bool = True,
                  activation: str = 'relu',
                  decoder_in_size: int = 8,
                  **kwargs
                  ):
         super().__init__()
-        self.encoder = ConvEncoder(in_channels, encoder_hidden_channels, dim_latent, dim_avpool, use_batch_norm, activation, **kwargs)
-        self.decoder = ConvDecoder(decoder_hidden_channels, dim_latent, decoder_in_size, use_batch_norm, activation, **kwargs)
+        self.encoder = ConvEncoder(
+            in_channels=in_channels,
+            hidden_channels=encoder_hidden_channels,
+            kernel_size=kernel_size,
+            dim_embedding=dim_latent,
+            dim_avpool=dim_avpool,
+            use_batch_norm=use_batch_norm,
+            activation=activation,
+            **kwargs)
+
+        self.decoder = ConvDecoder(
+            hidden_channels=decoder_hidden_channels,
+            dim_latent=dim_latent,
+            in_size=decoder_in_size,
+            kernel_size=kernel_size,
+            use_batch_norm=use_batch_norm,
+            activation=activation,
+            **kwargs)
 
     def forward(self, x):
         return self.decoder(self.encoder(x))
 
-class ConvVAE(nn.Module):
-    """A 1D convolutional variational autoencoder"""
-    def __init__(self,
-                 in_channels: int = 1,
-                 encoder_hidden_channels: tuple = (32, 64, 128, 256, 512),
-                 decoder_hidden_channels: tuple = (512, 256, 128, 64, 32),
-                 dim_latent: int = 64,
-                 dim_avpool: int = 1,
-                 use_batch_norm: bool = True,
-                 activation: str = 'relu',
-                 decoder_in_size: int = 8,
-                 **kwargs
-                 ):
+class SEBlock(nn.Module):
+    """Squeeze-and-excitation block (https://arxiv.org/abs/1709.01507)"""
+    def __init__(self, in_channels, reduction=16):
         super().__init__()
-        self.encoder = ConvEncoder(in_channels, encoder_hidden_channels, 2*dim_latent, dim_avpool, use_batch_norm, activation, **kwargs)
-        self.decoder = ConvDecoder(decoder_hidden_channels, dim_latent, decoder_in_size, use_batch_norm, activation, **kwargs)
+        self.fc1 = nn.Linear(in_channels, in_channels // reduction, bias=False)
+        self.fc2 = nn.Linear(in_channels // reduction, in_channels, bias=False)
+        self.relu = nn.ReLU()
+        self.sigmoid = nn.Sigmoid()
+        self.global_avg_pool = nn.AdaptiveAvgPool1d(1)
 
     def forward(self, x):
-        z_mu, z_logvar = self.encoder(x).chunk(2, dim=-1)
-        z = self.reparameterize(z_mu, z_logvar)
-
-        x_r_mu, x_r_logvar = self.decoder(z).chunk(2, dim=-1)
-        x = self.reparameterize(x_r_mu, x_r_logvar)
-
-        return x, (z_mu, z_logvar, x_r_mu, x_r_logvar)
-
-    @staticmethod
-    def reparameterize(mu, logvar):
-        std = torch.exp(0.5 * logvar)
-        eps = torch.randn_like(std).to(std)
-        return mu + eps * std
+        batch_size, channels, _ = x.size()
+
+        # Squeeze
+        se = self.global_avg_pool(x).view(batch_size, channels)
+
+        # Excitation
+        se = self.fc1(se)
+        se = self.relu(se)
+        se = self.fc2(se)
+        se = self.sigmoid(se).view(batch_size, channels, 1)
+
+        # Scale the input feature maps (channel-wise attention)
+        return x * se
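
A minimal usage sketch of the reworked encoder, assuming only the signature shown in these hunks and the usual avpool + flatten + fc tail of forward() (only its first lines appear above); values are illustrative:

import torch
from reflectorch.models.encoders.conv_encoder import ConvEncoder

encoder = ConvEncoder(
    in_channels=1,
    hidden_channels=(32, 64, 128),
    kernel_size=5,       # new in 1.4.0; was hard-coded to 3
    dim_embedding=64,    # renamed from dim_latent
    use_se=True,         # adds an SEBlock to each conv stage
)
curves = torch.randn(16, 128)   # (batch, n_points); forward() unsqueezes a channel dim
embedding = encoder(curves)     # three stride-2 stages: 128 -> 64 -> 32 -> 16, then pool + fc
print(embedding.shape)          # torch.Size([16, 64])

With use_batch_norm=True, the two insert() calls give the per-stage order Conv1d -> BatchNorm1d -> SEBlock -> activation.
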

reflectorch/models/encoders/fno.py
@@ -46,28 +46,30 @@ class FnoEncoder(nn.Module):
         :align: center
 
     Args:
-        ch_in (int): number of input channels
+        in_channels (int): number of input channels
        dim_embedding (int): dimension of the output embedding
        modes (int): number of Fourier modes
        width_fno (int): number of channels of the intermediate representations
        n_fno_blocks (int): number of FNO blocks
        activation (str): the activation function
-        fusion_self_attention (bool): if ``True`` a fusion layer is used after the FNO blocks to produce the final embedding
+        fusion_self_attention (bool): whether to use fusion self attention for merging the tokens (instead of mean)
+        fsa_activation (str): the activation function of the fusion self attention block
     """
     def __init__(
             self,
-            ch_in: int = 2,
+            in_channels: int = 2,
             dim_embedding: int = 128,
             modes: int = 32,
             width_fno: int = 64,
             n_fno_blocks: int = 6,
             activation: str = 'gelu',
             fusion_self_attention: bool = False,
+            fsa_activation: str = 'tanh',
    ):
        super().__init__()
 
 
-        self.ch_in = ch_in
+        self.in_channels = in_channels
         self.dim_embedding = dim_embedding
 
         self.modes = modes
@@ -77,13 +79,17 @@ class FnoEncoder(nn.Module):
         self.fusion_self_attention = fusion_self_attention
 
 
-        self.fc0 = nn.Linear(ch_in, width_fno) #(r(q), q)
-        self.spectral_convs = nn.ModuleList([SpectralConv1d(in_channels=width_fno, out_channels=width_fno, modes=modes) for _ in range(n_fno_blocks)])
-        self.w_convs = nn.ModuleList([nn.Conv1d(in_channels=width_fno, out_channels=width_fno, kernel_size=1) for _ in range(n_fno_blocks)])
+        self.fc0 = nn.Linear(in_channels, width_fno) #(r(q), q)
+        self.spectral_convs = nn.ModuleList([
+            SpectralConv1d(in_channels=width_fno, out_channels=width_fno, modes=modes) for _ in range(n_fno_blocks)
+        ])
+        self.w_convs = nn.ModuleList([
+            nn.Conv1d(in_channels=width_fno, out_channels=width_fno, kernel_size=1) for _ in range(n_fno_blocks)
+        ])
         self.fc_out = nn.Linear(width_fno, dim_embedding)
 
         if fusion_self_attention:
-            self.fusion = FusionSelfAttention(width_fno, 2*width_fno)
+            self.fusion = FusionSelfAttention(embed_dim=width_fno, hidden_dim=2*width_fno, activation=fsa_activation)
 
     def forward(self, x):
         """"""
@@ -109,19 +115,20 @@
 
         return x
 
+
 class FusionSelfAttention(nn.Module):
-    def __init__(self,
-                 embed_dim: int = 64,
-                 hidden_dim: int = 64,
-                 activation=nn.Tanh,
-                 ):
+    def __init__(self, embed_dim: int = 64, hidden_dim: int = 64, activation: str = 'gelu'):
         super().__init__()
+        activation = activation_by_name(activation)()
         self.fuser = nn.Sequential(nn.Linear(embed_dim, hidden_dim),
-                                   activation(),
+                                   activation,
                                    nn.Linear(hidden_dim, 1, bias=False))
 
-    def forward(self, c): # (batch_size x seq_len x embed_dim)
+    def forward(self,
+                c: torch.Tensor, # (batch_size x seq_len x embed_dim)
+                mask: torch.Tensor = None, # (batch_size x seq_len)
+                ):
         a = self.fuser(c)
-        alpha = torch.exp(a)
+        alpha = torch.exp(a)*mask.unsqueeze(-1) if mask is not None else torch.exp(a)
         alpha = alpha/alpha.sum(dim=1, keepdim=True)
         return (alpha*c).sum(dim=1) # (batch_size x embed_dim)
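
A sketch of the new optional mask, assuming FusionSelfAttention is importable from this module: masked positions get zero attention weight, and the normalisation runs over the remaining tokens only.

import torch
from reflectorch.models.encoders.fno import FusionSelfAttention

fusion = FusionSelfAttention(embed_dim=64, hidden_dim=128, activation='gelu')
tokens = torch.randn(2, 10, 64)     # (batch_size, seq_len, embed_dim)
mask = torch.ones(2, 10)
mask[:, 7:] = 0.                    # treat the last three positions as padding
pooled = fusion(tokens, mask=mask)  # padded tokens contribute zero weight to the fused embedding
print(pooled.shape)                 # torch.Size([2, 64])
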

reflectorch/models/encoders/integral_kernel_embedding.py
@@ -0,0 +1,390 @@
+from __future__ import annotations
+from typing import Union
+
+import torch
+from torch import nn, Tensor, stack, cat
+from reflectorch.models.activations import activation_by_name
+import reflectorch
+
+### embedding network adapted from the PANPE repository
+
+__all__ = [
+    "IntegralConvEmbedding",
+]
+
+class IntegralConvEmbedding(nn.Module):
+    def __init__(
+        self,
+        z_num: Union[int, tuple[int, ...]],
+        z_range: tuple[float, float] = None,
+        in_dim: int = 2,
+        kernel_coef: int = 16,
+        dim_embedding: int = 256,
+        conv_dims: tuple[int, ...] = (32, 64, 128),
+        num_blocks: int = 4,
+        use_batch_norm: bool = False,
+        use_layer_norm: bool = True,
+        use_fft: bool = False,
+        activation: str = "gelu",
+        conv_activation: str = "lrelu",
+        resnet_activation: str = "relu",
+    ) -> None:
+        super().__init__()
+
+        if isinstance(z_num, int):
+            z_num = (z_num,)
+        num_kernel = len(z_num)
+
+        if z_range is not None:
+            zs = [(z_range[0], z_range[1], nz) for nz in z_num]
+        else:
+            zs = z_num
+
+        self.in_dim = in_dim
+
+        self.kernels = nn.ModuleList(
+            [
+                IntegralKernelBlock(
+                    z,
+                    in_dim,
+                    kernel_coef=kernel_coef,
+                    latent_dim=dim_embedding,
+                    conv_dims=conv_dims,
+                    use_fft=use_fft,
+                    activation=activation,
+                    conv_activation=conv_activation,
+                )
+                for z in zs
+            ]
+        )
+
+        self.fc = reflectorch.models.networks.residual_net.ResidualMLP(
+            dim_in=dim_embedding * num_kernel,
+            dim_out=dim_embedding,
+            layer_width=2 * dim_embedding,
+            num_blocks=num_blocks,
+            use_batch_norm=use_batch_norm,
+            use_layer_norm=use_layer_norm,
+            activation=resnet_activation,
+        )
+
+    def forward(self, q, y, drop_mask=None) -> Tensor:
+        x = cat([kernel(q, y, drop_mask=drop_mask) for kernel in self.kernels], dim=-1)
+        x = self.fc(x)
+
+        return x
+
+
+class IntegralKernelBlock(nn.Module):
+    """
+    Examples:
+        >>> x = torch.rand(2, 100)
+        >>> y = torch.rand(2, 100, 3)
+        >>> block = IntegralKernelBlock((0, 1, 10), in_dim=3, latent_dim=32)
+        >>> output = block(x, y)
+        >>> output.shape
+        torch.Size([2, 32])
+
+        >>> block = IntegralKernelBlock(10, in_dim=3, latent_dim=32)
+        >>> output = block(x, y)
+        >>> output.shape
+        torch.Size([2, 32])
+    """
+
+    def __init__(
+        self,
+        z: tuple[float, float, int] or int,
+        in_dim: int,
+        kernel_coef: int = 2,
+        latent_dim: int = 32,
+        conv_dims: tuple[int, ...] = (32, 64, 128),
+        use_fft: bool = False,
+        activation: str = "gelu",
+        conv_activation: str = "lrelu",
+    ):
+        super().__init__()
+
+        if isinstance(z, int):
+            z_num = z
+            kernel = FullIntegralKernel(z_num, in_dim=in_dim, kernel_coef=kernel_coef)
+        else:
+            kernel = FastIntegralKernel(
+                z, in_dim=in_dim, kernel_coef=kernel_coef, activation=activation
+            )
+            z_num = z[-1]
+
+        assert z_num % 2 == 0, "z_num should be even"
+
+        self.kernel = kernel
+        self.z_num = z_num
+        self.in_dim = in_dim
+        self.latent_dim = latent_dim
+        self.use_fft = use_fft
+
+        self.fc_in_dim = self.latent_dim + self.in_dim * self.z_num
+        if self.use_fft:
+            self.fc_in_dim += self.in_dim * 2 + self.in_dim * self.z_num
+
+        self.conv = reflectorch.models.encoders.conv_encoder.ConvEncoder(
+            dim_avpool=8,
+            hidden_channels=conv_dims,
+            in_channels=in_dim,
+            dim_embedding=latent_dim,
+            activation=conv_activation,
+        )
+        self.fc = FCBlock(
+            in_dim=self.fc_in_dim, hid_dim=self.latent_dim * 2, out_dim=self.latent_dim
+        )
+
+    def forward(self, x: Tensor, y: Tensor, drop_mask: Tensor = None) -> Tensor:
+        x = self.kernel(x, y, drop_mask=drop_mask)
+
+        assert x.shape == (x.shape[0], self.in_dim, self.z_num)
+
+        xc = self.conv(x)  # (batch, latent_dim)
+
+        assert xc.shape == (x.shape[0], self.latent_dim)
+
+        if self.use_fft:
+            fft_x = torch.fft.rfft(x, dim=-1, norm="ortho")  # (batch, in_dim, z_num)
+
+            fft_x = torch.cat(
+                [fft_x.real, fft_x.imag], -1
+            )  # (batch, in_dim, 2 * z_num)
+
+            assert fft_x.shape == (x.shape[0], x.shape[1], self.z_num + 2)
+
+            fft_x = fft_x.flatten(1)  # (batch, in_dim * (z_num + 2))
+
+            x = torch.cat(
+                [x.flatten(1), fft_x, xc], -1
+            )  # (batch, in_dim * z_num * 3 + latent_dim)
+        else:
+            x = torch.cat([x.flatten(1), xc], -1)
+
+        assert (
+            x.shape[1] == self.fc_in_dim
+        ), f"Expected dim {self.fc_in_dim}, got {x.shape[1]}"
+
+        x = self.fc(x)  # (batch, latent_dim)
+
+        return x
+
+
+class FastIntegralKernel(nn.Module):
+    def __init__(
+        self,
+        z: tuple[float, float, int],
+        kernel_coef: int = 16,
+        in_dim: int = 1,
+        activation: str = "gelu",
+    ):
+        super().__init__()
+
+        z = torch.linspace(*z)
+
+        self.kernel = FCBlock(
+            in_dim + 2, kernel_coef * in_dim, in_dim, activation=activation
+        )
+
+        self.register_buffer("z", z)
+
+    def _get_z(self, x: Tensor):
+        # x.shape == (batch_size, num_x)
+        dz = self.z[1] - self.z[0]
+        indices = torch.ceil((x - self.z[0] - dz / 2) / dz).to(torch.int64)
+
+        z = torch.index_select(self.z, 0, indices.flatten()).view(*x.shape)
+
+        return z, indices
+
+    def forward(self, x: Tensor, y: Tensor, drop_mask=None):
+        z, indices = self._get_z(x)
+        xz = torch.stack([x, z], -1)
+        kernel_input = torch.cat([xz, y], -1)
+        output = self.kernel(kernel_input)  # (batch, x_num, in_dim)
+
+        output = compute_means(
+            output * y, indices, self.z.shape[-1], drop_mask=drop_mask
+        )  # (batch, z_num, in_dim)
+
+        output = output.swapaxes(1, 2)  # (batch, in_dim, z_num)
+
+        return output
+
+
+class FullIntegralKernel(nn.Module):
+    def __init__(
+        self,
+        z_num: int,
+        kernel_coef: int = 1,
+        in_dim: int = 1,
+    ):
+        super().__init__()
+
+        self.z_num = z_num
+        self.in_dim = in_dim
+
+        self.kernel = nn.Sequential(
+            nn.Linear(in_dim + 1, z_num * kernel_coef),
+            nn.LayerNorm(z_num * kernel_coef),
+            nn.ReLU(),
+            nn.Linear(z_num * kernel_coef, z_num * in_dim),
+        )
+
+    def forward(self, x: Tensor, y: Tensor, drop_mask=None):
+        # x.shape == (batch_size, num_x)
+        # y.shape == (batch_size, num_x, in_dim)
+        # drop_mask.shape == (batch_size, num_x)
+
+        batch_size, num_x = x.shape
+
+        kernel_input = torch.cat([x.unsqueeze(-1), y], -1)  # (batch, x_num, in_dim + 1)
+        x = self.kernel(kernel_input)  # (batch, x_num, z_num * in_dim)
+        x = x.reshape(
+            *x.shape[:-1], self.z_num, self.in_dim
+        )  # (batch, x_num, z_num, in_dim)
+        # permute to get (batch, z_num, x_num, in_dim)
+        x = x.permute(0, 2, 1, 3)
+
+        y = y.unsqueeze(1)  # (batch, 1, x_num, in_dim)
+
+        assert x.shape == (
+            batch_size,
+            self.z_num,
+            num_x,
+            self.in_dim,
+        )  # (batch, z_num, in_dim, x_num)
+        assert y.shape == (
+            batch_size,
+            1,
+            num_x,
+            self.in_dim,
+        )  # (batch, 1, x_num, in_dim)
+
+        if drop_mask is not None:
+            x = x * y
+            x = x.permute(0, 2, 1, 3)  # (batch, x_num, z_num, in_dim)
+            x = masked_mean(x, drop_mask)
+        else:
+            x = (x * y).mean(-2)  # (batch, z_num, in_dim)
+
+        assert x.shape == (batch_size, self.z_num, self.in_dim), f"{x.shape}"
+
+        x = x.swapaxes(1, 2)  # (batch, in_dim, z_num)
+
+        return x
+
+
+class FCBlock(nn.Module):
+    def __init__(
+        self,
+        in_dim: int = 2,
+        hid_dim: int = 16,
+        out_dim: int = 16,
+        activation: str = "gelu",
+    ):
+        super().__init__()
+
+        self.fc1 = nn.Linear(in_dim, hid_dim)
+        self.layer_norm = nn.LayerNorm(hid_dim)
+        self.activation = activation_by_name(activation)()
+        self.fc2 = nn.Linear(hid_dim, out_dim)
+
+    def forward(self, x: Tensor) -> Tensor:
+        x = self.fc1(x)
+        x = self.layer_norm(x)
+        x = self.activation(x)
+        x = self.fc2(x)
+        return x
+        # return self.kernel(x)
+
+
+def compute_means(x, indices, z: int, drop_mask: Tensor = None):
+    """
+    Compute the mean values of tensor 'x' for each unique index in 'indices' across each batch.
+
+    This function calculates the mean of elements in 'x' that correspond to each unique index in 'indices'.
+    The computation is performed for each batch separately, and the function is optimized to avoid Python loops
+    by using advanced PyTorch operations.
+
+    Parameters:
+        x (torch.Tensor): A tensor of shape (batch_size, n, d) containing the values to be averaged.
+            'x' should be a floating-point tensor.
+        indices (torch.Tensor): An integer tensor of shape (batch_size, n) containing the indices.
+            The values in 'indices' should be in the range [0, z-1].
+        z (int): The number of unique indices. This determines the second dimension of the output tensor.
+        drop_mask (torch.Tensor): A boolean tensor of shape (batch_size, n) containing a mask for the indices to drop.
+            If None, all indices are used.
+
+    Returns:
+        torch.Tensor: A tensor of shape (batch_size, z, d) containing the mean values for each index in each batch.
+            If an index does not appear in a batch, its corresponding mean values are zeros.
+
+    Example:
+        >>> batch_size, n, d, z = 3, 4, 5, 6
+        >>> indices = torch.randint(0, z, (batch_size, n))
+        >>> x = torch.randn(batch_size, n, d)
+        >>> y = compute_means(x, indices, z)
+        >>> print(y.shape)
+        torch.Size([3, 6, 5])
+    """
+
+    batch_size, n, d = x.shape
+    device = x.device
+
+    drop = drop_mask is not None
+
+    # Initialize tensors to hold sums and counts
+    sums = torch.zeros(batch_size, z + int(drop), d, device=device)
+    counts = torch.zeros(batch_size, z + int(drop), device=device)
+
+    if drop_mask is not None:
+        # Set the values of the indices to drop to z
+        indices = indices.masked_fill(~drop_mask, z)
+
+    indices_expanded = indices.unsqueeze(-1).expand_as(x)
+    sums.scatter_add_(1, indices_expanded, x)
+    counts.scatter_add_(1, indices, torch.ones_like(indices, dtype=x.dtype))
+
+    if drop:
+        # Remove the z values from the sums and counts
+        sums = sums[:, :-1]
+        counts = counts[:, :-1]
+
+    # Compute the mean and handle division by zero
+    mean = sums / counts.unsqueeze(-1).clamp(min=1)
+
+    return mean
+
+
+def masked_mean(x, mask):
+    """
+    Computes the mean of tensor x along the x_size dimension,
+    while masking out elements where the corresponding value in the mask is False.
+
+    Args:
+        x (torch.Tensor): A tensor of shape (batch, x_size, z, d).
+        mask (torch.Tensor): A boolean mask of shape (batch, x_size).
+
+    Returns:
+        torch.Tensor: The result tensor of shape (batch, z, d) after applying the mask and computing the mean.
+    """
+    if not mask.dtype == torch.bool:
+        raise TypeError("Mask must be a boolean tensor.")
+
+    # Ensure the mask is broadcastable to the shape of x
+    mask = mask.unsqueeze(-1).unsqueeze(-1)
+    masked_x = x * mask
+
+    # Compute the sum and the count of valid (unmasked) elements along the x_size dimension
+    sum_x = masked_x.sum(dim=1)
+    count_x = mask.sum(dim=1)
+
+    # Avoid division by zero
+    count_x[count_x == 0] = 1
+
+    # Compute the mean
+    mean_x = sum_x / count_x
+
+    return mean_x
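
A usage sketch for the new embedding network, assuming only the constructor shown above; the q values must lie inside z_range for the FastIntegralKernel binning, and each z_num must be even (illustrative values only):

import torch
from reflectorch.models.encoders.integral_kernel_embedding import IntegralConvEmbedding

emb = IntegralConvEmbedding(
    z_num=(64, 128),       # two kernel branches, one per grid resolution
    z_range=(0.0, 1.0),    # giving a z_range selects the FastIntegralKernel path
    in_dim=2,              # two curve channels (illustrative)
    dim_embedding=256,
)
q = torch.rand(8, 100)     # (batch, num_points), values inside z_range
y = torch.rand(8, 100, 2)  # (batch, num_points, in_dim)
out = emb(q, y)            # branch outputs are concatenated, then fused by a ResidualMLP
print(out.shape)           # torch.Size([8, 256])
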

reflectorch/models/networks/__init__.py
@@ -1,4 +1,5 @@
 from reflectorch.models.networks.mlp_networks import (
+    NetworkWithPriors,
     NetworkWithPriorsConvEmb,
     NetworkWithPriorsFnoEmb,
 )
@@ -7,6 +8,7 @@ from reflectorch.models.networks.residual_net import ResidualMLP
 
 __all__ = [
     "ResidualMLP",
+    "NetworkWithPriors",
     "NetworkWithPriorsConvEmb",
     "NetworkWithPriorsFnoEmb",
 ]
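
The practical effect of these two hunks is that the newly exported class can be imported from the package's networks namespace alongside the existing ones; a one-line sketch:

from reflectorch.models.networks import NetworkWithPriors, NetworkWithPriorsConvEmb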