PyPI - lt-tensor - Versions diffs - 0.0.1a22__py3-none-any.whl → 0.0.1a27__py3-none-any.whl - Mend

lt-tensor 0.0.1a22__py3-none-any.whl → 0.0.1a27__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (17)

lt_tensor/config_templates.py +9 -5
lt_tensor/misc_utils.py +15 -3
lt_tensor/model_base.py +57 -78
lt_tensor/model_zoo/audio_models/diffwave/__init__.py +41 -14
lt_tensor/model_zoo/audio_models/hifigan/__init__.py +40 -82
lt_tensor/model_zoo/audio_models/istft/__init__.py +41 -83
lt_tensor/model_zoo/convs.py +124 -0
lt_tensor/model_zoo/residual.py +1 -136
lt_tensor/processors/__init__.py +2 -2
lt_tensor/processors/audio.py +267 -200
{lt_tensor-0.0.1a22.dist-info → lt_tensor-0.0.1a27.dist-info}/METADATA +1 -1
{lt_tensor-0.0.1a22.dist-info → lt_tensor-0.0.1a27.dist-info}/RECORD +15 -16
lt_tensor/model_zoo/audio_models/bigvgan/__init__.py +0 -536
lt_tensor/model_zoo/audio_models/bigvgan/cuda/__init__.py +0 -160
{lt_tensor-0.0.1a22.dist-info → lt_tensor-0.0.1a27.dist-info}/WHEEL +0 -0
{lt_tensor-0.0.1a22.dist-info → lt_tensor-0.0.1a27.dist-info}/licenses/LICENSE +0 -0
{lt_tensor-0.0.1a22.dist-info → lt_tensor-0.0.1a27.dist-info}/top_level.txt +0 -0

lt_tensor/model_zoo/audio_models/istft/__init__.py CHANGED Viewed

@@ -1,11 +1,11 @@
 __all__ = ["iSTFTNetGenerator", "iSTFTNetConfig"]
 from lt_utils.common import *
 from lt_tensor.torch_commons import *
-from lt_tensor.model_zoo.residual import ConvNets
+from lt_tensor.model_zoo.convs import ConvNets
 from torch.nn import functional as F
 from lt_tensor.config_templates import ModelConfig
+from lt_tensor.misc_utils import get_config, get_weights
 from lt_utils.file_ops import load_json, is_file, is_dir, is_path_valid
-from huggingface_hub import hf_hub_download
 class iSTFTNetConfig(ModelConfig):
@@ -39,7 +39,7 @@ class iSTFTNetConfig(ModelConfig):
             [1, 3, 5],
         ],
         activation: nn.Module = nn.LeakyReLU(0.1),
-        resblock: int = 0,
+        resblock: Union[int, str] = "1",
         gen_istft_n_fft: int = 16,
         sampling_rate: Number = 24000,
         *args,
@@ -59,7 +59,11 @@ class iSTFTNetConfig(ModelConfig):
         }
         super().__init__(**settings)
+    def post_process(self):
+        if isinstance(self.resblock, str):
+            self.resblock = 0 if self.resblock == "1" else 1
 def get_padding(ks, d):
     return int((ks * d - d) / 2)
@@ -271,15 +275,15 @@ class iSTFTNetGenerator(ConvNets):
     def load_weights(
         self,
         path,
-        raise_if_not_exists=False,
         strict=False,
         assign=False,
-        weights_only=True,
+        weights_only=False,
         mmap=None,
+        raise_if_not_exists=False,
         **pickle_load_args,
     ):
         try:
-            return super().load_weights(
+            incompatible_keys = super().load_weights(
                 path,
                 raise_if_not_exists,
                 strict,
@@ -288,6 +292,18 @@ class iSTFTNetGenerator(ConvNets):
                 mmap,
                 **pickle_load_args,
             )
+            if incompatible_keys:
+                self.remove_norms()
+                incompatible_keys = super().load_weights(
+                    path,
+                    raise_if_not_exists,
+                    strict,
+                    assign,
+                    weights_only,
+                    mmap,
+                    **pickle_load_args,
+                )
+            return incompatible_keys
         except RuntimeError:
             self.remove_norms()
             return super().load_weights(
@@ -303,95 +319,37 @@ class iSTFTNetGenerator(ConvNets):
     @classmethod
     def from_pretrained(
         cls,
-        model_id: str,
-        map_location: str = "cpu",
-        local_files_only: bool = False,
-        strict: bool = False,
+        model_file: PathLike,
+        model_config: Union[iSTFTNetConfig, Dict[str, Any]],
         *,
-        subfolder: str | None = None,
-        repo_type: str | None = None,
-        revision: str | None = None,
-        cache_dir: str | Path | None = None,
-        force_download: bool = False,
-        proxies: Dict | None = None,
-        token: bool | str | None = None,
-        resume_download: bool | None = None,
-        local_dir_use_symlinks: bool | Literal["auto"] = "auto",
+        strict: bool = False,
+        map_location: str = "cpu",
+        weights_only: bool = False,
         **kwargs,
     ):
-        """Load Pytorch pretrained weights and return the loaded model."""
-        hub_kwargs = dict(
-            repo_id=model_id,
-            subfolder=subfolder,
-            repo_type=repo_type,
-            revision=revision,
-            cache_dir=cache_dir,
-            force_download=force_download,
-            proxies=proxies,
-            resume_download=resume_download,
-            token=token,
-            local_files_only=local_files_only,
-            local_dir_use_symlinks=local_dir_use_symlinks,
-        )
-        # Download and load hyperparameters (h) used by BigVGAN
-        _model_path = Path(model_id)
-        config_file = None
-        if is_path_valid(model_id):
-            if is_file(model_id):
-                _p_conf = _model_path.parent / "config.json"
-            else:
-                _p_conf = _model_path / "config.json"
-            if is_file(_p_conf):
-                print("Loading config.json from local directory")
-                config_file = Path(model_id, "config.json")
-            else:
-                if not local_files_only:
-                    print(f"Loading config from {model_id}")
-                    config_file = hf_hub_download(filename="config.json", **hub_kwargs)
-        else:
-            if not local_files_only:
-                print(f"Loading config from {model_id}")
-                config_file = hf_hub_download(filename="config.json", **hub_kwargs)
-        if config_file is not None:
-            model = cls(iSTFTNetConfig(**load_json(config_file)))
-        else:
-            model = cls()
-        # Download and load pretrained generator weight
-        _retrieve_kwargs = dict(
-            **hub_kwargs,
-            filename="generator.pt",
+        is_file(model_file, validate=True)
+        model_state_dict = torch.load(
+            model_file, weights_only=weights_only, map_location=map_location
         )
-        path = Path(model_id)
-        if path.exists():
-            if path.is_dir():
-                path = path / "generator.pt"
-                if path.exists():
-                    print("Loading weights from local directory")
-                    model_file = str(path)
-                else:
-                    print(f"Loading weights from {model_id}")
-                    model_file = hf_hub_download(**_retrieve_kwargs)
-            else:
-                print("Loading weights from local directory")
-                model_file = str(path)
+        if isinstance(model_config, iSTFTNetConfig):
+            h = model_config
         else:
-            print(f"Loading weights from {model_id}")
-            model_file = hf_hub_download(**_retrieve_kwargs)
-        checkpoint_dict = torch.load(model_file, map_location=map_location)
+            h = iSTFTNetConfig(**model_config)
+        model = cls(h)
         try:
-            model.load_state_dict(checkpoint_dict, strict=strict)
+            incompatible_keys = model.load_state_dict(model_state_dict, strict=strict)
+            if incompatible_keys:
+                model.remove_norms()
+                model.load_state_dict(model_state_dict, strict=strict)
         except RuntimeError:
             print(
                 f"[INFO] the pretrained checkpoint does not contain weight norm. Loading the checkpoint after removing weight norm!"
             )
             model.remove_norms()
-            model.load_state_dict(checkpoint_dict, strict=strict)
+            model.load_state_dict(model_state_dict, strict=strict)
         return model

lt_tensor/model_zoo/convs.py ADDED Viewed

@@ -0,0 +1,124 @@
+__all__ = ["ConvNets", "Conv1dEXT"]
+import math
+from lt_utils.common import *
+import torch.nn.functional as F
+from lt_tensor.torch_commons import *
+from lt_tensor.model_base import Model
+from lt_tensor.misc_utils import log_tensor
+from lt_tensor.model_zoo.fusion import AdaFusion1D, AdaIN1D
+def spectral_norm_select(module: nn.Module, enabled: bool):
+    if enabled:
+        return spectral_norm(module)
+    return module
+def get_weight_norm(norm_type: Optional[Literal["weight", "spectral"]] = None):
+    if not norm_type:
+        return lambda x: x
+    if norm_type == "weight":
+        return lambda x: weight_norm(x)
+    return lambda x: spectral_norm(x)
+def remove_norm(module, name: str = "weight"):
+    try:
+        try:
+            remove_parametrizations(module, name, leave_parametrized=False)
+        except:
+            # many times will fail with 'leave_parametrized'
+            remove_parametrizations(module, name)
+    except ValueError:
+        pass  # not parametrized
+class ConvNets(Model):
+    def __init__(self, *args, **kwargs):
+        super().__init__(*args, **kwargs)
+    def remove_norms(self, name: str = "weight"):
+        for module in self.modules():
+            if "Conv" in module.__class__.__name__:
+                remove_norm(module, name)
+    @staticmethod
+    def init_weights(
+        m: nn.Module,
+        norm: Optional[Literal["spectral", "weight"]] = None,
+        mean=0.0,
+        std=0.02,
+        name: str = "weight",
+        n_power_iterations: int = 1,
+        eps: float = 1e-9,
+        dim_sn: Optional[int] = None,
+        dim_wn: int = 0,
+    ):
+        if "Conv" in m.__class__.__name__:
+            if norm is not None:
+                try:
+                    if norm == "spectral":
+                        m.apply(
+                            lambda m: spectral_norm(
+                                m,
+                                n_power_iterations=n_power_iterations,
+                                eps=eps,
+                                name=name,
+                                dim=dim_sn,
+                            )
+                        )
+                    else:
+                        m.apply(lambda m: weight_norm(m, name=name, dim=dim_wn))
+                except ValueError:
+                    pass
+            m.weight.data.normal_(mean, std)
+class Conv1dEXT(ConvNets):
+    def __init__(
+        self,
+        in_channels: int,
+        out_channels: Optional[int] = None,
+        kernel_size: Union[int, Tuple[int, ...]] = 1,
+        stride: Union[int, Tuple[int, ...]] = 1,
+        padding: Union[int, Tuple[int, ...]] = 0,
+        dilation: Union[int, Tuple[int, ...]] = 1,
+        groups: int = 1,
+        bias: bool = True,
+        padding_mode: str = "zeros",
+        device: Optional[Any] = None,
+        dtype: Optional[Any] = None,
+        apply_norm: Optional[Literal["weight", "spectral"]] = None,
+        activation: nn.Module = nn.Identity(),
+        *args,
+        **kwargs,
+    ):
+        super().__init__(*args, **kwargs)
+        if not out_channels:
+            out_channels = in_channels
+        cnn_kwargs = dict(
+            in_channels=in_channels,
+            out_channels=out_channels,
+            kernel_size=kernel_size,
+            stride=stride,
+            padding=padding,
+            dilation=dilation,
+            groups=groups,
+            bias=bias,
+            padding_mode=padding_mode,
+            device=device,
+            dtype=dtype,
+        )
+        if apply_norm is None:
+            self.cnn = nn.Conv1d(**cnn_kwargs)
+        else:
+            if apply_norm == "spectral":
+                self.cnn = spectral_norm(nn.Conv1d(**cnn_kwargs))
+            else:
+                self.cnn = weight_norm(nn.Conv1d(**cnn_kwargs))
+        self.activation = activation
+        self.cnn.apply(self.init_weights)
+    def forward(self, input: Tensor):
+        return self.cnn(self.activation(input))

lt_tensor/model_zoo/residual.py CHANGED Viewed

@@ -2,12 +2,10 @@ __all__ = [
     "spectral_norm_select",
     "get_weight_norm",
     "ResBlock1D",
-    "ResBlock2D",
     "ResBlock1DShuffled",
     "AdaResBlock1D",
     "ResBlocks1D",
     "ResBlock1D2",
-    "ShuffleBlock2D",
 ]
 import math
 from lt_utils.common import *
@@ -16,73 +14,7 @@ from lt_tensor.torch_commons import *
 from lt_tensor.model_base import Model
 from lt_tensor.misc_utils import log_tensor
 from lt_tensor.model_zoo.fusion import AdaFusion1D, AdaIN1D
-def spectral_norm_select(module: nn.Module, enabled: bool):
-    if enabled:
-        return spectral_norm(module)
-    return module
-def get_weight_norm(norm_type: Optional[Literal["weight", "spectral"]] = None):
-    if not norm_type:
-        return lambda x: x
-    if norm_type == "weight":
-        return lambda x: weight_norm(x)
-    return lambda x: spectral_norm(x)
-def remove_norm(module, name: str = "weight"):
-    try:
-        try:
-            remove_parametrizations(module, name, leave_parametrized=False)
-        except:
-            # many times will fail with 'leave_parametrized'
-            remove_parametrizations(module, name)
-    except ValueError:
-        pass  # not parametrized
-class ConvNets(Model):
-    def __init__(self, *args, **kwargs):
-        super().__init__(*args, **kwargs)
-    def remove_norms(self, name: str = "weight"):
-        for module in self.modules():
-            if "Conv" in module.__class__.__name__:
-                remove_norm(module, name)
-    @staticmethod
-    def init_weights(
-        m: nn.Module,
-        norm: Optional[Literal["spectral", "weight"]] = None,
-        mean=0.0,
-        std=0.02,
-        name: str = "weight",
-        n_power_iterations: int = 1,
-        eps: float = 1e-9,
-        dim_sn: Optional[int] = None,
-        dim_wn: int = 0,
-    ):
-        if "Conv" in m.__class__.__name__:
-            if norm is not None:
-                try:
-                    if norm == "spectral":
-                        m.apply(
-                            lambda m: spectral_norm(
-                                m,
-                                n_power_iterations=n_power_iterations,
-                                eps=eps,
-                                name=name,
-                                dim=dim_sn,
-                            )
-                        )
-                    else:
-                        m.apply(lambda m: weight_norm(m, name=name, dim=dim_wn))
-                except ValueError:
-                    pass
-            m.weight.data.normal_(mean, std)
+from lt_tensor.model_zoo.convs import ConvNets
 def get_padding(ks, d):
@@ -151,7 +83,6 @@ class ResBlock1DShuffled(ConvNets):
         self.last_index = len(self.conv_nets) - 1
     def _get_conv_layer(self, id, ch, k, stride, d, actv):
-        get_padding = lambda ks, d: int((ks * d - d) / 2)
         return nn.Sequential(
             actv,  # 1
             weight_norm(
@@ -172,72 +103,6 @@ class ResBlock1DShuffled(ConvNets):
         return x
-class ResBlock2D(Model):
-    def __init__(
-        self,
-        in_channels: int,
-        out_channels: Optional[int] = None,
-        hidden_dim: int = 32,
-        downscale: bool = False,
-        activation: nn.Module = nn.LeakyReLU(0.2),
-    ):
-        super().__init__()
-        stride = 2 if downscale else 1
-        if out_channels is None:
-            out_channels = in_channels
-        self.block = nn.Sequential(
-            nn.Conv2d(in_channels, hidden_dim, 3, stride, 1),
-            activation,
-            nn.Conv2d(hidden_dim, hidden_dim, 7, 1, 3),
-            activation,
-            nn.Conv2d(hidden_dim, out_channels, 3, 1, 1),
-        )
-        self.skip = nn.Identity()
-        if downscale or in_channels != out_channels:
-            self.skip = spectral_norm_select(
-                nn.Conv2d(in_channels, out_channels, 1, stride)
-            )
-        # on less to be handled every cycle
-        self.sqrt_2 = math.sqrt(2)
-    def forward(self, x: Tensor):
-        return x + ((self.block(x) + self.skip(x)) / self.sqrt_2)
-class ShuffleBlock2D(ConvNets):
-    def __init__(
-        self,
-        channels: int,
-        out_channels: Optional[int] = None,
-        hidden_dim: int = 32,
-        downscale: bool = False,
-        activation: nn.Module = nn.LeakyReLU(0.1),
-    ):
-        super().__init__()
-        if out_channels is None:
-            out_channels = channels
-        self.shuffle = nn.ChannelShuffle(groups=2)
-        self.ch_split = lambda tensor: torch.split(tensor, 1, dim=1)
-        self.activation = activation
-        self.resblock_2d = ResBlock2D(
-            channels, out_channels, hidden_dim, downscale, activation
-        )
-    def shuffle_channels(self, tensor: torch.Tensor):
-        with torch.no_grad():
-            x = F.channel_shuffle(tensor.transpose(1, -1), tensor.shape[1]).transpose(
-                -1, 1
-            )
-        return self.ch_split(x)
-    def forward(self, x: torch.Tensor):
-        ch1, ch2 = self.shuffle_channels(x)
-        ch2 = self.resblock_2d(ch2)
-        return torch.cat((ch1, ch2), dim=1)
 class AdaResBlock1D(ConvNets):
     def __init__(
         self,

lt_tensor/processors/__init__.py CHANGED Viewed

@@ -1,3 +1,3 @@
-from .audio import AudioProcessor
+from .audio import AudioProcessor, AudioProcessorConfig
-__all__ = ["AudioProcessor"]
+__all__ = ["AudioProcessor", "AudioProcessorConfig"]

lt-tensor 0.0.1a22__py3-none-any.whl → 0.0.1a27__py3-none-any.whl

lt-tensor 0.0.1a22__py3-none-any.whl → 0.0.1a27__py3-none-any.whl