wavedl 1.5.3__tar.gz → 1.5.4__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (43)
  1. {wavedl-1.5.3/src/wavedl.egg-info → wavedl-1.5.4}/PKG-INFO +10 -9
  2. {wavedl-1.5.3 → wavedl-1.5.4}/README.md +4 -4
  3. {wavedl-1.5.3 → wavedl-1.5.4}/pyproject.toml +6 -3
  4. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/__init__.py +1 -1
  5. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/models/swin.py +31 -10
  6. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/train.py +32 -4
  7. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/utils/data.py +27 -0
  8. {wavedl-1.5.3 → wavedl-1.5.4/src/wavedl.egg-info}/PKG-INFO +10 -9
  9. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl.egg-info/requires.txt +5 -3
  10. {wavedl-1.5.3 → wavedl-1.5.4}/LICENSE +0 -0
  11. {wavedl-1.5.3 → wavedl-1.5.4}/setup.cfg +0 -0
  12. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/hpc.py +0 -0
  13. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/hpo.py +0 -0
  14. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/models/__init__.py +0 -0
  15. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/models/_template.py +0 -0
  16. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/models/base.py +0 -0
  17. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/models/cnn.py +0 -0
  18. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/models/convnext.py +0 -0
  19. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/models/densenet.py +0 -0
  20. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/models/efficientnet.py +0 -0
  21. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/models/efficientnetv2.py +0 -0
  22. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/models/mobilenetv3.py +0 -0
  23. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/models/registry.py +0 -0
  24. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/models/regnet.py +0 -0
  25. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/models/resnet.py +0 -0
  26. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/models/resnet3d.py +0 -0
  27. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/models/tcn.py +0 -0
  28. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/models/unet.py +0 -0
  29. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/models/vit.py +0 -0
  30. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/test.py +0 -0
  31. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/utils/__init__.py +0 -0
  32. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/utils/config.py +0 -0
  33. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/utils/constraints.py +0 -0
  34. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/utils/cross_validation.py +0 -0
  35. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/utils/distributed.py +0 -0
  36. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/utils/losses.py +0 -0
  37. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/utils/metrics.py +0 -0
  38. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/utils/optimizers.py +0 -0
  39. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl/utils/schedulers.py +0 -0
  40. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl.egg-info/SOURCES.txt +0 -0
  41. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl.egg-info/dependency_links.txt +0 -0
  42. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl.egg-info/entry_points.txt +0 -0
  43. {wavedl-1.5.3 → wavedl-1.5.4}/src/wavedl.egg-info/top_level.txt +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.2
2
2
  Name: wavedl
3
- Version: 1.5.3
3
+ Version: 1.5.4
4
4
  Summary: A Scalable Deep Learning Framework for Wave-Based Inverse Problems
5
5
  Author: Ductho Le
6
6
  License: MIT
@@ -37,11 +37,12 @@ Requires-Dist: wandb>=0.15.0
37
37
  Requires-Dist: optuna>=3.0.0
38
38
  Requires-Dist: onnx>=1.14.0
39
39
  Requires-Dist: onnxruntime>=1.15.0
40
- Requires-Dist: pytest>=7.0.0
41
- Requires-Dist: pytest-xdist>=3.5.0
42
- Requires-Dist: ruff>=0.8.0
43
- Requires-Dist: pre-commit>=3.5.0
44
40
  Requires-Dist: triton>=2.0.0; sys_platform == "linux"
41
+ Provides-Extra: dev
42
+ Requires-Dist: pytest>=7.0.0; extra == "dev"
43
+ Requires-Dist: pytest-xdist>=3.5.0; extra == "dev"
44
+ Requires-Dist: ruff>=0.8.0; extra == "dev"
45
+ Requires-Dist: pre-commit>=3.5.0; extra == "dev"
45
46
 
46
47
  <div align="center">
47
48
 
@@ -204,7 +205,7 @@ Deploy models anywhere:
204
205
  pip install wavedl
205
206
  ```
206
207
 
207
- This installs everything you need: training, inference, HPO, ONNX export, and dev tools.
208
+ This installs everything you need: training, inference, HPO, ONNX export.
208
209
 
209
210
  #### From Source (for development)
210
211
 
@@ -336,7 +337,7 @@ class MyModel(BaseModel):
336
337
  **Step 2: Train**
337
338
 
338
339
  ```bash
339
- wavedl-hpc --import my_model --model my_model --data_path train.npz
340
+ wavedl-hpc --import my_model.py --model my_model --data_path train.npz
340
341
  ```
341
342
 
342
343
  WaveDL handles everything else: training loop, logging, checkpoints, multi-GPU, early stopping, etc.
@@ -512,7 +513,7 @@ print('\\n✓ All pretrained weights cached!')
512
513
  | Argument | Default | Description |
513
514
  |----------|---------|-------------|
514
515
  | `--model` | `cnn` | Model architecture |
515
- | `--import` | - | Python modules to import (for custom models) |
516
+ | `--import` | - | Python file(s) to import for custom models (supports multiple) |
516
517
  | `--batch_size` | `128` | Per-GPU batch size |
517
518
  | `--lr` | `1e-3` | Learning rate |
518
519
  | `--epochs` | `1000` | Maximum epochs |
@@ -1223,6 +1224,6 @@ This research was enabled in part by support provided by [Compute Ontario](https
1223
1224
  [![Google Scholar](https://img.shields.io/badge/Google_Scholar-4285F4?style=plastic&logo=google-scholar&logoColor=white)](https://scholar.google.ca/citations?user=OlwMr9AAAAAJ)
1224
1225
  [![ResearchGate](https://img.shields.io/badge/ResearchGate-00CCBB?style=plastic&logo=researchgate&logoColor=white)](https://www.researchgate.net/profile/Ductho-Le)
1225
1226
 
1226
- <sub>Released under the MIT License</sub>
1227
+ <sub>May your signals be strong and your attenuation low 👋</sub>
1227
1228
 
1228
1229
  </div>
@@ -159,7 +159,7 @@ Deploy models anywhere:
159
159
  pip install wavedl
160
160
  ```
161
161
 
162
- This installs everything you need: training, inference, HPO, ONNX export, and dev tools.
162
+ This installs everything you need: training, inference, HPO, ONNX export.
163
163
 
164
164
  #### From Source (for development)
165
165
 
@@ -291,7 +291,7 @@ class MyModel(BaseModel):
291
291
  **Step 2: Train**
292
292
 
293
293
  ```bash
294
- wavedl-hpc --import my_model --model my_model --data_path train.npz
294
+ wavedl-hpc --import my_model.py --model my_model --data_path train.npz
295
295
  ```
296
296
 
297
297
  WaveDL handles everything else: training loop, logging, checkpoints, multi-GPU, early stopping, etc.
@@ -467,7 +467,7 @@ print('\\n✓ All pretrained weights cached!')
467
467
  | Argument | Default | Description |
468
468
  |----------|---------|-------------|
469
469
  | `--model` | `cnn` | Model architecture |
470
- | `--import` | - | Python modules to import (for custom models) |
470
+ | `--import` | - | Python file(s) to import for custom models (supports multiple) |
471
471
  | `--batch_size` | `128` | Per-GPU batch size |
472
472
  | `--lr` | `1e-3` | Learning rate |
473
473
  | `--epochs` | `1000` | Maximum epochs |
@@ -1178,6 +1178,6 @@ This research was enabled in part by support provided by [Compute Ontario](https
1178
1178
  [![Google Scholar](https://img.shields.io/badge/Google_Scholar-4285F4?style=plastic&logo=google-scholar&logoColor=white)](https://scholar.google.ca/citations?user=OlwMr9AAAAAJ)
1179
1179
  [![ResearchGate](https://img.shields.io/badge/ResearchGate-00CCBB?style=plastic&logo=researchgate&logoColor=white)](https://www.researchgate.net/profile/Ductho-Le)
1180
1180
 
1181
- <sub>Released under the MIT License</sub>
1181
+ <sub>May your signals be strong and your attenuation low 👋</sub>
1182
1182
 
1183
1183
  </div>
@@ -70,13 +70,16 @@ dependencies = [
70
70
  # ONNX export
71
71
  "onnx>=1.14.0",
72
72
  "onnxruntime>=1.15.0",
73
- # Development tools
73
+ # torch.compile backend (Linux only)
74
+ "triton>=2.0.0; sys_platform == 'linux'",
75
+ ]
76
+
77
+ [project.optional-dependencies]
78
+ dev = [
74
79
  "pytest>=7.0.0",
75
80
  "pytest-xdist>=3.5.0",
76
81
  "ruff>=0.8.0",
77
82
  "pre-commit>=3.5.0",
78
- # torch.compile backend (Linux only)
79
- "triton>=2.0.0; sys_platform == 'linux'",
80
83
  ]
81
84
 
82
85
  [project.scripts]
@@ -18,7 +18,7 @@ For inference:
18
18
  # or: python -m wavedl.test --checkpoint best_checkpoint --data_path test.npz
19
19
  """
20
20
 
21
- __version__ = "1.5.3"
21
+ __version__ = "1.5.4"
22
22
  __author__ = "Ductho Le"
23
23
  __email__ = "ductho.le@outlook.com"
24
24
 
@@ -191,22 +191,33 @@ class SwinTransformerBase(BaseModel):
191
191
  Returns:
192
192
  List of parameter group dictionaries
193
193
  """
194
- # Separate parameters: head (full LR) vs backbone (decayed LR)
194
+ # Separate parameters into 4 groups for proper LR decay:
195
+ # 1. Head params with decay (full LR)
196
+ # 2. Backbone params with decay (0.1× LR)
197
+ # 3. Head bias/norm without decay (full LR)
198
+ # 4. Backbone bias/norm without decay (0.1× LR)
195
199
  head_params = []
196
200
  backbone_params = []
197
- no_decay_params = []
201
+ head_no_decay = []
202
+ backbone_no_decay = []
198
203
 
199
204
  for name, param in self.backbone.named_parameters():
200
205
  if not param.requires_grad:
201
206
  continue
202
207
 
203
- # No weight decay for bias and normalization
204
- if "bias" in name or "norm" in name:
205
- no_decay_params.append(param)
206
- elif "head" in name:
207
- head_params.append(param)
208
+ is_head = "head" in name
209
+ is_no_decay = "bias" in name or "norm" in name
210
+
211
+ if is_head:
212
+ if is_no_decay:
213
+ head_no_decay.append(param)
214
+ else:
215
+ head_params.append(param)
208
216
  else:
209
- backbone_params.append(param)
217
+ if is_no_decay:
218
+ backbone_no_decay.append(param)
219
+ else:
220
+ backbone_params.append(param)
210
221
 
211
222
  groups = []
212
223
 
@@ -229,15 +240,25 @@ class SwinTransformerBase(BaseModel):
229
240
  }
230
241
  )
231
242
 
232
- if no_decay_params:
243
+ if head_no_decay:
233
244
  groups.append(
234
245
  {
235
- "params": no_decay_params,
246
+ "params": head_no_decay,
236
247
  "lr": base_lr,
237
248
  "weight_decay": 0.0,
238
249
  }
239
250
  )
240
251
 
252
+ if backbone_no_decay:
253
+ # Backbone bias/norm also gets 0.1× LR to match intended decay
254
+ groups.append(
255
+ {
256
+ "params": backbone_no_decay,
257
+ "lr": base_lr * 0.1,
258
+ "weight_decay": 0.0,
259
+ }
260
+ )
261
+
241
262
  return groups if groups else [{"params": self.parameters(), "lr": base_lr}]
242
263
 
243
264
 
@@ -122,6 +122,7 @@ import matplotlib.pyplot as plt
122
122
  import numpy as np
123
123
  import pandas as pd
124
124
  import torch
125
+ import torch.distributed as dist
125
126
  from accelerate import Accelerator
126
127
  from accelerate.utils import set_seed
127
128
  from sklearn.metrics import r2_score
@@ -470,15 +471,19 @@ def main():
470
471
  try:
471
472
  # Handle both module names (my_model) and file paths (./my_model.py)
472
473
  if module_name.endswith(".py"):
473
- # Import from file path
474
+ # Import from file path with unique module name
474
475
  import importlib.util
475
476
 
477
+ # Derive unique module name from filename to avoid collisions
478
+ base_name = os.path.splitext(os.path.basename(module_name))[0]
479
+ unique_name = f"wavedl_custom_{base_name}"
480
+
476
481
  spec = importlib.util.spec_from_file_location(
477
- "custom_module", module_name
482
+ unique_name, module_name
478
483
  )
479
484
  if spec and spec.loader:
480
485
  module = importlib.util.module_from_spec(spec)
481
- sys.modules["custom_module"] = module
486
+ sys.modules[unique_name] = module
482
487
  spec.loader.exec_module(module)
483
488
  print(f"✓ Imported custom module from: {module_name}")
484
489
  else:
@@ -1250,9 +1255,32 @@ def main():
1250
1255
  )
1251
1256
 
1252
1257
  # Learning rate scheduling (epoch-based schedulers only)
1258
+ # NOTE: For ReduceLROnPlateau with DDP, we must step only on main process
1259
+ # to avoid patience counter being incremented by all GPU processes.
1260
+ # Then we sync the new LR to all processes to keep them consistent.
1253
1261
  if not scheduler_step_per_batch:
1254
1262
  if args.scheduler == "plateau":
1255
- scheduler.step(avg_val_loss)
1263
+ # Step only on main process to avoid multi-GPU patience bug
1264
+ if accelerator.is_main_process:
1265
+ scheduler.step(avg_val_loss)
1266
+
1267
+ # Sync LR across all processes after main process updates it
1268
+ accelerator.wait_for_everyone()
1269
+
1270
+ # Broadcast new LR from rank 0 to all processes
1271
+ if dist.is_initialized():
1272
+ if accelerator.is_main_process:
1273
+ new_lr = optimizer.param_groups[0]["lr"]
1274
+ else:
1275
+ new_lr = 0.0
1276
+ new_lr_tensor = torch.tensor(
1277
+ new_lr, device=accelerator.device, dtype=torch.float32
1278
+ )
1279
+ dist.broadcast(new_lr_tensor, src=0)
1280
+ # Update LR on non-main processes
1281
+ if not accelerator.is_main_process:
1282
+ for param_group in optimizer.param_groups:
1283
+ param_group["lr"] = new_lr_tensor.item()
1256
1284
  else:
1257
1285
  scheduler.step()
1258
1286
 
@@ -793,6 +793,14 @@ def load_test_data(
793
793
  raise KeyError(
794
794
  f"Input key not found. Tried: {custom_input_keys}. Found: {keys}"
795
795
  )
796
+ # OOM guard: warn if dataset is very large
797
+ n_samples = f[inp_key].shape[0]
798
+ if n_samples > 100000:
799
+ raise ValueError(
800
+ f"Dataset has {n_samples:,} samples. load_test_data() loads "
801
+ f"everything into RAM which may cause OOM. For large inference "
802
+ f"sets, use a DataLoader with HDF5Source.load_mmap() instead."
803
+ )
796
804
  inp = f[inp_key][:]
797
805
  outp = f[out_key][:] if out_key else None
798
806
  elif format == "mat":
@@ -805,6 +813,14 @@ def load_test_data(
805
813
  raise KeyError(
806
814
  f"Input key not found. Tried: {custom_input_keys}. Found: {keys}"
807
815
  )
816
+ # OOM guard: warn if dataset is very large (MAT is transposed)
817
+ n_samples = f[inp_key].shape[-1]
818
+ if n_samples > 100000:
819
+ raise ValueError(
820
+ f"Dataset has {n_samples:,} samples. load_test_data() loads "
821
+ f"everything into RAM which may cause OOM. For large inference "
822
+ f"sets, use a DataLoader with MATSource.load_mmap() instead."
823
+ )
808
824
  inp = mat_source._load_dataset(f, inp_key)
809
825
  if out_key:
810
826
  outp = mat_source._load_dataset(f, out_key)
@@ -1126,6 +1142,17 @@ def prepare_data(
1126
1142
 
1127
1143
  if not cache_exists:
1128
1144
  if accelerator.is_main_process:
1145
+ # Delete stale cache files to force regeneration
1146
+ # This prevents silent reuse of old data when metadata invalidates cache
1147
+ for stale_file in [CACHE_FILE, SCALER_FILE]:
1148
+ if os.path.exists(stale_file):
1149
+ try:
1150
+ os.remove(stale_file)
1151
+ logger.debug(f" Removed stale cache: {stale_file}")
1152
+ except OSError as e:
1153
+ logger.warning(
1154
+ f" Failed to remove stale cache {stale_file}: {e}"
1155
+ )
1129
1156
  # RANK 0: Create cache (can take a long time for large datasets)
1130
1157
  # Other ranks will wait at the barrier below
1131
1158
 
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.2
2
2
  Name: wavedl
3
- Version: 1.5.3
3
+ Version: 1.5.4
4
4
  Summary: A Scalable Deep Learning Framework for Wave-Based Inverse Problems
5
5
  Author: Ductho Le
6
6
  License: MIT
@@ -37,11 +37,12 @@ Requires-Dist: wandb>=0.15.0
37
37
  Requires-Dist: optuna>=3.0.0
38
38
  Requires-Dist: onnx>=1.14.0
39
39
  Requires-Dist: onnxruntime>=1.15.0
40
- Requires-Dist: pytest>=7.0.0
41
- Requires-Dist: pytest-xdist>=3.5.0
42
- Requires-Dist: ruff>=0.8.0
43
- Requires-Dist: pre-commit>=3.5.0
44
40
  Requires-Dist: triton>=2.0.0; sys_platform == "linux"
41
+ Provides-Extra: dev
42
+ Requires-Dist: pytest>=7.0.0; extra == "dev"
43
+ Requires-Dist: pytest-xdist>=3.5.0; extra == "dev"
44
+ Requires-Dist: ruff>=0.8.0; extra == "dev"
45
+ Requires-Dist: pre-commit>=3.5.0; extra == "dev"
45
46
 
46
47
  <div align="center">
47
48
 
@@ -204,7 +205,7 @@ Deploy models anywhere:
204
205
  pip install wavedl
205
206
  ```
206
207
 
207
- This installs everything you need: training, inference, HPO, ONNX export, and dev tools.
208
+ This installs everything you need: training, inference, HPO, ONNX export.
208
209
 
209
210
  #### From Source (for development)
210
211
 
@@ -336,7 +337,7 @@ class MyModel(BaseModel):
336
337
  **Step 2: Train**
337
338
 
338
339
  ```bash
339
- wavedl-hpc --import my_model --model my_model --data_path train.npz
340
+ wavedl-hpc --import my_model.py --model my_model --data_path train.npz
340
341
  ```
341
342
 
342
343
  WaveDL handles everything else: training loop, logging, checkpoints, multi-GPU, early stopping, etc.
@@ -512,7 +513,7 @@ print('\\n✓ All pretrained weights cached!')
512
513
  | Argument | Default | Description |
513
514
  |----------|---------|-------------|
514
515
  | `--model` | `cnn` | Model architecture |
515
- | `--import` | - | Python modules to import (for custom models) |
516
+ | `--import` | - | Python file(s) to import for custom models (supports multiple) |
516
517
  | `--batch_size` | `128` | Per-GPU batch size |
517
518
  | `--lr` | `1e-3` | Learning rate |
518
519
  | `--epochs` | `1000` | Maximum epochs |
@@ -1223,6 +1224,6 @@ This research was enabled in part by support provided by [Compute Ontario](https
1223
1224
  [![Google Scholar](https://img.shields.io/badge/Google_Scholar-4285F4?style=plastic&logo=google-scholar&logoColor=white)](https://scholar.google.ca/citations?user=OlwMr9AAAAAJ)
1224
1225
  [![ResearchGate](https://img.shields.io/badge/ResearchGate-00CCBB?style=plastic&logo=researchgate&logoColor=white)](https://www.researchgate.net/profile/Ductho-Le)
1225
1226
 
1226
- <sub>Released under the MIT License</sub>
1227
+ <sub>May your signals be strong and your attenuation low 👋</sub>
1227
1228
 
1228
1229
  </div>
@@ -14,10 +14,12 @@ wandb>=0.15.0
14
14
  optuna>=3.0.0
15
15
  onnx>=1.14.0
16
16
  onnxruntime>=1.15.0
17
+
18
+ [:sys_platform == "linux"]
19
+ triton>=2.0.0
20
+
21
+ [dev]
17
22
  pytest>=7.0.0
18
23
  pytest-xdist>=3.5.0
19
24
  ruff>=0.8.0
20
25
  pre-commit>=3.5.0
21
-
22
- [:sys_platform == "linux"]
23
- triton>=2.0.0
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes