wavedl-1.5.7-py3-none-any.whl → wavedl-1.6.1-py3-none-any.whl
- wavedl/__init__.py +1 -1
- wavedl/hpo.py +451 -451
- wavedl/models/__init__.py +80 -4
- wavedl/models/_pretrained_utils.py +366 -0
- wavedl/models/base.py +48 -0
- wavedl/models/caformer.py +270 -0
- wavedl/models/cnn.py +2 -27
- wavedl/models/convnext.py +113 -51
- wavedl/models/convnext_v2.py +488 -0
- wavedl/models/densenet.py +10 -23
- wavedl/models/efficientnet.py +6 -6
- wavedl/models/efficientnetv2.py +315 -315
- wavedl/models/efficientvit.py +398 -0
- wavedl/models/fastvit.py +252 -0
- wavedl/models/mamba.py +555 -0
- wavedl/models/maxvit.py +254 -0
- wavedl/models/mobilenetv3.py +295 -295
- wavedl/models/regnet.py +406 -406
- wavedl/models/resnet.py +19 -61
- wavedl/models/resnet3d.py +258 -258
- wavedl/models/swin.py +443 -443
- wavedl/models/tcn.py +393 -409
- wavedl/models/unet.py +2 -6
- wavedl/models/unireplknet.py +491 -0
- wavedl/models/vit.py +9 -9
- wavedl/train.py +1430 -1425
- wavedl/utils/config.py +367 -367
- wavedl/utils/cross_validation.py +530 -530
- wavedl/utils/data.py +39 -6
- wavedl/utils/losses.py +216 -216
- wavedl/utils/optimizers.py +216 -216
- wavedl/utils/schedulers.py +251 -251
- {wavedl-1.5.7.dist-info → wavedl-1.6.1.dist-info}/METADATA +150 -82
- wavedl-1.6.1.dist-info/RECORD +46 -0
- wavedl-1.5.7.dist-info/RECORD +0 -38
- {wavedl-1.5.7.dist-info → wavedl-1.6.1.dist-info}/LICENSE +0 -0
- {wavedl-1.5.7.dist-info → wavedl-1.6.1.dist-info}/WHEEL +0 -0
- {wavedl-1.5.7.dist-info → wavedl-1.6.1.dist-info}/entry_points.txt +0 -0
- {wavedl-1.5.7.dist-info → wavedl-1.6.1.dist-info}/top_level.txt +0 -0
wavedl/models/unet.py CHANGED

@@ -22,14 +22,10 @@ from typing import Any
 import torch
 import torch.nn as nn
 
-from wavedl.models.base import BaseModel
+from wavedl.models.base import BaseModel, SpatialShape
 from wavedl.models.registry import register_model
 
 
-# Type alias for spatial shapes
-SpatialShape = tuple[int] | tuple[int, int] | tuple[int, int, int]
-
-
 def _get_layers(dim: int):
     """Get dimension-appropriate layer classes."""
     if dim == 1:

@@ -119,7 +115,7 @@ class UNetRegression(BaseModel):
     Uses U-Net encoder-decoder architecture with skip connections,
     then applies global pooling for standard vector regression output.
 
-    ~31.
+    ~31.0M backbone parameters (2D). Good for leveraging multi-scale features
     and skip connections for regression tasks.
 
     Args:
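The only functional change here is that the SpatialShape alias moved out of unet.py into wavedl.models.base, so all models can share one definition. A minimal sketch of the consolidated alias in use, assuming it keeps the definition shown in the removed lines:

    # Assumes SpatialShape is exported from wavedl.models.base with the same
    # definition the removed lines show:
    #   SpatialShape = tuple[int] | tuple[int, int] | tuple[int, int, int]
    from wavedl.models.base import SpatialShape

    def describe(shape: SpatialShape) -> str:
        # len(shape) gives the spatial dimensionality (1D, 2D, or 3D)
        return f"{len(shape)}D input with extent {shape}"

    print(describe((256, 256)))  # -> "2D input with extent (256, 256)"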
wavedl/models/unireplknet.py ADDED

@@ -0,0 +1,491 @@
"""
UniRepLKNet: Universal Large-Kernel ConvNet for Regression
===========================================================

A dimension-agnostic implementation of UniRepLKNet featuring ultra-large kernels
(up to 31x31) for capturing long-range dependencies. Particularly effective for
wave-based problems where spatial correlations span large distances.

**Key Features**:
- Large kernels (13x13 to 31x31) via efficient decomposition
- Dilated small kernel reparam for efficient training
- SE (Squeeze-and-Excitation) attention
- GRN (Global Response Normalization) from ConvNeXt V2
- Dimension-agnostic: supports 1D, 2D, 3D inputs

**Variants**:
- unireplknet_tiny: 31M params, depths [3,3,18,3], dims [80,160,320,640]
- unireplknet_small: 56M params, depths [3,3,27,3], dims [96,192,384,768]
- unireplknet_base: 97M params, depths [3,3,27,3], dims [128,256,512,1024]

**Why Large Kernels for Wave Problems**:
- Dispersion curves: Long-range frequency-wavenumber correlations
- B-scans: Defect signatures span many pixels
- Time-series: Capture multiple wave periods without deep stacking

Reference:
    Ding, X., et al. (2024). UniRepLKNet: A Universal Perception Large-Kernel
    ConvNet for Audio, Video, Point Cloud, Time-Series and Image Recognition.
    CVPR 2024. https://arxiv.org/abs/2311.15599

Author: Ductho Le (ductho.le@outlook.com)
"""

from typing import Any

import torch
import torch.nn as nn

from wavedl.models._pretrained_utils import (
    LayerNormNd,
    get_conv_layer,
    get_grn_layer,
    get_pool_layer,
)
from wavedl.models.base import BaseModel, SpatialShape
from wavedl.models.registry import register_model


__all__ = [
    "UniRepLKNetBase",
    "UniRepLKNetBaseLarge",
    "UniRepLKNetSmall",
    "UniRepLKNetTiny",
]


# =============================================================================
# LARGE KERNEL CONVOLUTION BLOCK
# =============================================================================


class LargeKernelConv(nn.Module):
    """
    Large kernel depthwise convolution.

    Implements efficient large kernel convolutions following UniRepLKNet.
    Uses a single large depthwise conv for simplicity and reliability.
    """

    def __init__(
        self,
        channels: int,
        kernel_size: int,
        dim: int = 2,
    ):
        super().__init__()
        self.dim = dim
        self.kernel_size = kernel_size

        Conv = get_conv_layer(dim)
        padding = kernel_size // 2

        # Large kernel depthwise conv
        self.conv = Conv(
            channels,
            channels,
            kernel_size=kernel_size,
            padding=padding,
            groups=channels,
            bias=False,
        )

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        return self.conv(x)


class SEBlock(nn.Module):
    """
    Squeeze-and-Excitation block for channel attention.

    Adaptively recalibrates channel-wise feature responses by explicitly
    modeling interdependencies between channels.
    """

    def __init__(self, channels: int, reduction: int = 4):
        super().__init__()
        reduced = max(channels // reduction, 8)
        self.fc1 = nn.Linear(channels, reduced, bias=False)
        self.fc2 = nn.Linear(reduced, channels, bias=False)
        self.act = nn.GELU()

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        # Global average pooling
        if x.ndim == 3:  # 1D: (B, C, L)
            gap = x.mean(dim=2)
        elif x.ndim == 4:  # 2D: (B, C, H, W)
            gap = x.mean(dim=(2, 3))
        else:  # 3D: (B, C, D, H, W)
            gap = x.mean(dim=(2, 3, 4))

        # FC layers
        scale = self.act(self.fc1(gap))
        scale = torch.sigmoid(self.fc2(scale))

        # Reshape for broadcasting
        if x.ndim == 3:
            scale = scale.unsqueeze(-1)
        elif x.ndim == 4:
            scale = scale.unsqueeze(-1).unsqueeze(-1)
        else:
            scale = scale.unsqueeze(-1).unsqueeze(-1).unsqueeze(-1)

        return x * scale


class DropPath(nn.Module):
    """Stochastic Depth (drop path) regularization."""

    def __init__(self, drop_prob: float = 0.0):
        super().__init__()
        self.drop_prob = drop_prob

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        if self.drop_prob == 0.0 or not self.training:
            return x

        keep_prob = 1 - self.drop_prob
        shape = (x.shape[0],) + (1,) * (x.ndim - 1)
        random_tensor = keep_prob + torch.rand(shape, dtype=x.dtype, device=x.device)
        random_tensor.floor_()
        return x.div(keep_prob) * random_tensor


# =============================================================================
# UNIREPLKNET BLOCK
# =============================================================================


class UniRepLKNetBlock(nn.Module):
    """
    UniRepLKNet block with large kernel convolution, SE attention, and GRN.

    Architecture:
        Input → LargeKernelConv → LayerNorm → SE → Linear → GELU → GRN → Linear → Residual

    This combines the effective receptive field of large kernels with the
    feature recalibration of SE attention and the inter-channel competition
    of GRN from ConvNeXt V2.
    """

    def __init__(
        self,
        dim: int,
        spatial_dim: int,
        kernel_size: int = 13,
        drop_path: float = 0.0,
        mlp_ratio: float = 4.0,
    ):
        super().__init__()
        self.spatial_dim = spatial_dim

        GRN = get_grn_layer(spatial_dim)

        # Large kernel depthwise conv
        self.large_kernel = LargeKernelConv(
            dim, kernel_size=kernel_size, dim=spatial_dim
        )

        # Layer norm (applied in channels-last format)
        self.norm = nn.LayerNorm(dim, eps=1e-6)

        # SE attention
        self.se = SEBlock(dim)

        # MLP with expansion
        hidden_dim = int(dim * mlp_ratio)
        self.pwconv1 = nn.Linear(dim, hidden_dim)
        self.act = nn.GELU()
        self.grn = GRN(hidden_dim)
        self.pwconv2 = nn.Linear(hidden_dim, dim)

        # Stochastic depth
        self.drop_path = DropPath(drop_path) if drop_path > 0.0 else nn.Identity()

    def _to_channels_last(self, x: torch.Tensor) -> torch.Tensor:
        """Convert from channels-first to channels-last."""
        if self.spatial_dim == 1:
            return x.permute(0, 2, 1)  # (B, C, L) -> (B, L, C)
        elif self.spatial_dim == 2:
            return x.permute(0, 2, 3, 1)  # (B, C, H, W) -> (B, H, W, C)
        else:
            return x.permute(0, 2, 3, 4, 1)  # (B, C, D, H, W) -> (B, D, H, W, C)

    def _to_channels_first(self, x: torch.Tensor) -> torch.Tensor:
        """Convert from channels-last to channels-first."""
        if self.spatial_dim == 1:
            return x.permute(0, 2, 1)  # (B, L, C) -> (B, C, L)
        elif self.spatial_dim == 2:
            return x.permute(0, 3, 1, 2)  # (B, H, W, C) -> (B, C, H, W)
        else:
            return x.permute(0, 4, 1, 2, 3)  # (B, D, H, W, C) -> (B, C, D, H, W)

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        residual = x

        # Large kernel conv (channels-first)
        x = self.large_kernel(x)

        # SE attention (channels-first)
        x = self.se(x)

        # LayerNorm + MLP (channels-last)
        x = self._to_channels_last(x)
        x = self.norm(x)
        x = self.pwconv1(x)
        x = self.act(x)

        # GRN (channels-first)
        x = self._to_channels_first(x)
        x = self.grn(x)

        # Final projection (channels-last)
        x = self._to_channels_last(x)
        x = self.pwconv2(x)
        x = self._to_channels_first(x)

        # Residual + drop path
        x = residual + self.drop_path(x)
        return x


# =============================================================================
# UNIREPLKNET BASE CLASS
# =============================================================================


class UniRepLKNetBase(BaseModel):
    """
    UniRepLKNet base class for regression.

    Dimension-agnostic implementation supporting 1D, 2D, and 3D inputs.
    Features large kernels for capturing long-range dependencies in wave data.

    Architecture:
        1. Stem: 4x downsampling conv
        2. 4 stages with UniRepLKNet blocks
        3. Downsampling between stages
        4. Global pooling + regression head
    """

    def __init__(
        self,
        in_shape: SpatialShape,
        out_size: int,
        depths: list[int],
        dims: list[int],
        kernel_sizes: list[int] | None = None,
        drop_path_rate: float = 0.1,
        dropout_rate: float = 0.3,
        **kwargs,
    ):
        super().__init__(in_shape, out_size)

        self.dim = len(in_shape)
        self.depths = depths
        self.dims = dims

        # Default kernel sizes: larger in early stages, smaller in later stages
        # Early stages: large receptive field for low-level features
        # Later stages: smaller kernels sufficient for high-level features
        if kernel_sizes is None:
            kernel_sizes = [31, 29, 17, 13]

        Conv = get_conv_layer(self.dim)
        Pool = get_pool_layer(self.dim)

        # Stem: aggressive 4x downsampling (like ConvNeXt)
        self.stem = nn.Sequential(
            Conv(1, dims[0], kernel_size=4, stride=4),
            LayerNormNd(dims[0], self.dim),
        )

        # Stochastic depth decay
        dp_rates = [x.item() for x in torch.linspace(0, drop_path_rate, sum(depths))]

        # Build stages
        self.stages = nn.ModuleList()
        self.downsamples = nn.ModuleList()
        cur = 0

        for i in range(len(depths)):
            # Adjust kernel size for 1D (can use larger kernels)
            # Ensure kernel size is always odd for proper same-padding
            kernel_size = kernel_sizes[i]
            if self.dim == 1:
                kernel_size = min(kernel_size * 2 - 1, 63)  # Keep odd for 1D

            stage = nn.Sequential(
                *[
                    UniRepLKNetBlock(
                        dim=dims[i],
                        spatial_dim=self.dim,
                        kernel_size=kernel_size,
                        drop_path=dp_rates[cur + j],
                    )
                    for j in range(depths[i])
                ]
            )
            self.stages.append(stage)
            cur += depths[i]

            # Downsample between stages (except after last)
            if i < len(depths) - 1:
                downsample = nn.Sequential(
                    LayerNormNd(dims[i], self.dim),
                    Conv(dims[i], dims[i + 1], kernel_size=2, stride=2),
                )
                self.downsamples.append(downsample)

        # Global pooling and head
        self.norm = nn.LayerNorm(dims[-1], eps=1e-6)
        self.global_pool = Pool(1)
        self.head = nn.Sequential(
            nn.Dropout(dropout_rate),
            nn.Linear(dims[-1], dims[-1] // 2),
            nn.GELU(),
            nn.Dropout(dropout_rate * 0.5),
            nn.Linear(dims[-1] // 2, out_size),
        )

        # Initialize weights
        self._init_weights()

    def _init_weights(self):
        """Initialize weights with truncated normal."""
        for m in self.modules():
            if isinstance(m, (nn.Conv1d, nn.Conv2d, nn.Conv3d, nn.Linear)):
                nn.init.trunc_normal_(m.weight, std=0.02)
                if m.bias is not None:
                    nn.init.zeros_(m.bias)
            elif isinstance(m, nn.LayerNorm):
                nn.init.ones_(m.weight)
                nn.init.zeros_(m.bias)

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        """
        Forward pass.

        Args:
            x: Input tensor (B, 1, *in_shape)

        Returns:
            Output tensor (B, out_size)
        """
        x = self.stem(x)

        for i, stage in enumerate(self.stages):
            x = stage(x)
            if i < len(self.downsamples):
                x = self.downsamples[i](x)

        # Global pooling
        x = self.global_pool(x)
        x = x.flatten(1)

        # Final norm and head
        x = self.norm(x)
        x = self.head(x)

        return x

    @classmethod
    def get_default_config(cls) -> dict[str, Any]:
        return {
            "depths": [3, 3, 18, 3],
            "dims": [80, 160, 320, 640],
            "kernel_sizes": [31, 29, 17, 13],
            "drop_path_rate": 0.1,
            "dropout_rate": 0.3,
        }


# =============================================================================
# REGISTERED VARIANTS
# =============================================================================


@register_model("unireplknet_tiny")
class UniRepLKNetTiny(UniRepLKNetBase):
    """
    UniRepLKNet Tiny: ~30.8M backbone parameters.

    Large kernels [31, 29, 17, 13] for capturing long-range wave patterns.
    Depths [3,3,18,3], Dims [80,160,320,640].
    Supports 1D, 2D, 3D inputs.

    Example:
        >>> model = UniRepLKNetTiny(in_shape=(256, 256), out_size=3)
        >>> x = torch.randn(4, 1, 256, 256)
        >>> out = model(x)  # (4, 3)
    """

    def __init__(self, in_shape: SpatialShape, out_size: int, **kwargs):
        super().__init__(
            in_shape=in_shape,
            out_size=out_size,
            depths=[3, 3, 18, 3],
            dims=[80, 160, 320, 640],
            kernel_sizes=[31, 29, 17, 13],
            **kwargs,
        )

    def __repr__(self) -> str:
        return (
            f"UniRepLKNet_Tiny({self.dim}D, in_shape={self.in_shape}, "
            f"out_size={self.out_size})"
        )


@register_model("unireplknet_small")
class UniRepLKNetSmall(UniRepLKNetBase):
    """
    UniRepLKNet Small: ~56.0M backbone parameters.

    Large kernels [31, 29, 17, 13] for capturing long-range wave patterns.
    Depths [3,3,27,3], Dims [96,192,384,768].
    Supports 1D, 2D, 3D inputs.
    """

    def __init__(self, in_shape: SpatialShape, out_size: int, **kwargs):
        super().__init__(
            in_shape=in_shape,
            out_size=out_size,
            depths=[3, 3, 27, 3],
            dims=[96, 192, 384, 768],
            kernel_sizes=[31, 29, 17, 13],
            **kwargs,
        )

    def __repr__(self) -> str:
        return (
            f"UniRepLKNet_Small({self.dim}D, in_shape={self.in_shape}, "
            f"out_size={self.out_size})"
        )


@register_model("unireplknet_base")
class UniRepLKNetBaseLarge(UniRepLKNetBase):
    """
    UniRepLKNet Base: ~97.6M backbone parameters.

    Large kernels [31, 29, 17, 13] for capturing long-range wave patterns.
    Depths [3,3,27,3], Dims [128,256,512,1024].
    Supports 1D, 2D, 3D inputs.
    """

    def __init__(self, in_shape: SpatialShape, out_size: int, **kwargs):
        super().__init__(
            in_shape=in_shape,
            out_size=out_size,
            depths=[3, 3, 27, 3],
            dims=[128, 256, 512, 1024],
            kernel_sizes=[31, 29, 17, 13],
            **kwargs,
        )

    def __repr__(self) -> str:
        return (
            f"UniRepLKNet_Base({self.dim}D, in_shape={self.in_shape}, "
            f"out_size={self.out_size})"
        )
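The Tiny variant's docstring example extends naturally into a quick smoke test of the new module. A sketch, assuming the package layout shown above (the exact total parameter count is not stated in the diff; the regression head adds a small amount on top of the ~30.8M backbone):

    import torch
    from wavedl.models.unireplknet import UniRepLKNetTiny

    model = UniRepLKNetTiny(in_shape=(256, 256), out_size=3)  # 2D input (H, W)
    x = torch.randn(4, 1, 256, 256)  # (B, 1, H, W), matching forward()'s contract
    out = model(x)
    assert out.shape == (4, 3)

    # Rough size check against the documented ~30.8M backbone figure
    n_params = sum(p.numel() for p in model.parameters())
    print(f"{n_params / 1e6:.1f}M total parameters")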
wavedl/models/vit.py CHANGED

@@ -10,9 +10,9 @@ Supports both 1D (signals) and 2D (images) inputs via configurable patch embedding
 - 2D: Images/spectrograms → patches are grid squares
 
 **Variants**:
-- vit_tiny: Smallest (~5.
-- vit_small: Light (~
-- vit_base: Standard (~
+- vit_tiny: Smallest (~5.4M backbone params, embed_dim=192, depth=12, heads=3)
+- vit_small: Light (~21.4M backbone params, embed_dim=384, depth=12, heads=6)
+- vit_base: Standard (~85.3M backbone params, embed_dim=768, depth=12, heads=12)
 
 References:
     Dosovitskiy, A., et al. (2021). An Image is Worth 16x16 Words:

@@ -27,12 +27,12 @@ from typing import Any
 import torch
 import torch.nn as nn
 
-from wavedl.models.base import BaseModel
+from wavedl.models.base import BaseModel, SpatialShape1D, SpatialShape2D
 from wavedl.models.registry import register_model
 
 
-#
-SpatialShape =
+# ViT supports 1D and 2D only
+SpatialShape = SpatialShape1D | SpatialShape2D
 
 
 class PatchEmbed(nn.Module):

@@ -365,7 +365,7 @@ class ViTTiny(ViTBase):
     """
     ViT-Tiny: Smallest Vision Transformer variant.
 
-    ~5.
+    ~5.4M backbone parameters. Good for: Quick experiments, smaller datasets.
 
     Args:
         in_shape: (L,) for 1D or (H, W) for 2D

@@ -398,7 +398,7 @@ class ViTSmall(ViTBase):
     """
     ViT-Small: Light Vision Transformer variant.
 
-    ~
+    ~21.4M backbone parameters. Good for: Balanced performance.
 
     Args:
         in_shape: (L,) for 1D or (H, W) for 2D

@@ -429,7 +429,7 @@ class ViTBase_(ViTBase):
     """
     ViT-Base: Standard Vision Transformer variant.
 
-    ~
+    ~85.3M backbone parameters. Good for: High accuracy, larger datasets.
 
     Args:
         in_shape: (L,) for 1D or (H, W) for 2D