flaxdiff 0.1.35.4__tar.gz → 0.1.35.6__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (45)
  1. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/PKG-INFO +1 -1
  2. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/models/attention.py +13 -6
  3. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/models/simple_unet.py +17 -11
  4. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/models/simple_vit.py +10 -2
  5. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff.egg-info/PKG-INFO +1 -1
  6. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/setup.py +1 -1
  7. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/README.md +0 -0
  8. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/__init__.py +0 -0
  9. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/data/__init__.py +0 -0
  10. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/data/online_loader.py +0 -0
  11. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/models/__init__.py +0 -0
  12. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/models/autoencoder/__init__.py +0 -0
  13. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/models/autoencoder/autoencoder.py +0 -0
  14. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/models/autoencoder/diffusers.py +0 -0
  15. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/models/autoencoder/simple_autoenc.py +0 -0
  16. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/models/common.py +0 -0
  17. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/models/favor_fastattn.py +0 -0
  18. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/predictors/__init__.py +0 -0
  19. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/samplers/__init__.py +0 -0
  20. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/samplers/common.py +0 -0
  21. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/samplers/ddim.py +0 -0
  22. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/samplers/ddpm.py +0 -0
  23. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/samplers/euler.py +0 -0
  24. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/samplers/heun_sampler.py +0 -0
  25. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/samplers/multistep_dpm.py +0 -0
  26. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/samplers/rk4_sampler.py +0 -0
  27. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/schedulers/__init__.py +0 -0
  28. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/schedulers/common.py +0 -0
  29. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/schedulers/continuous.py +0 -0
  30. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/schedulers/cosine.py +0 -0
  31. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/schedulers/discrete.py +0 -0
  32. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/schedulers/exp.py +0 -0
  33. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/schedulers/karras.py +0 -0
  34. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/schedulers/linear.py +0 -0
  35. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/schedulers/sqrt.py +0 -0
  36. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/trainer/__init__.py +0 -0
  37. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/trainer/autoencoder_trainer.py +0 -0
  38. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/trainer/diffusion_trainer.py +0 -0
  39. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/trainer/simple_trainer.py +0 -0
  40. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/utils.py +0 -0
  41. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff.egg-info/SOURCES.txt +0 -0
  42. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff.egg-info/dependency_links.txt +0 -0
  43. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff.egg-info/requires.txt +0 -0
  44. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff.egg-info/top_level.txt +0 -0
  45. {flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/setup.cfg +0 -0
{flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/PKG-INFO

@@ -1,6 +1,6 @@
  Metadata-Version: 2.1
  Name: flaxdiff
- Version: 0.1.35.4
+ Version: 0.1.35.6
  Summary: A versatile and easy to understand Diffusion library
  Author: Ashish Kumar Singh
  Author-email: ashishkmr472@gmail.com
{flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/models/attention.py

@@ -11,6 +11,7 @@ import einops
  import functools
  import math
  from .common import kernel_init
+ import jax.experimental.pallas.ops.tpu.flash_attention
  
  class EfficientAttention(nn.Module):
      """
@@ -303,27 +304,30 @@ class TransformerBlock(nn.Module):
      only_pure_attention:bool = False
      force_fp32_for_softmax: bool = True
      kernel_init: Callable = kernel_init(1.0)
+     norm_inputs: bool = True
+     explicitly_add_residual: bool = True
  
      @nn.compact
      def __call__(self, x, context=None):
          inner_dim = self.heads * self.dim_head
          C = x.shape[-1]
-         normed_x = nn.RMSNorm(epsilon=1e-5, dtype=self.dtype)(x)
+         if self.norm_inputs:
+             x = nn.RMSNorm(epsilon=1e-5, dtype=self.dtype)(x)
          if self.use_projection == True:
              if self.use_linear_attention:
                  projected_x = nn.Dense(features=inner_dim,
                      use_bias=False, precision=self.precision,
                      kernel_init=self.kernel_init,
-                     dtype=self.dtype, name=f'project_in')(normed_x)
+                     dtype=self.dtype, name=f'project_in')(x)
              else:
                  projected_x = nn.Conv(
                      features=inner_dim, kernel_size=(1, 1),
                      kernel_init=self.kernel_init,
                      strides=(1, 1), padding='VALID', use_bias=False, dtype=self.dtype,
                      precision=self.precision, name=f'project_in_conv',
-                 )(normed_x)
+                 )(x)
          else:
-             projected_x = normed_x
+             projected_x = x
              inner_dim = C
  
          context = projected_x if context is None else context
@@ -356,6 +360,9 @@ class TransformerBlock(nn.Module):
                  strides=(1, 1), padding='VALID', use_bias=False, dtype=self.dtype,
                  precision=self.precision, name=f'project_out_conv',
              )(projected_x)
-
-         out = x + projected_x
+
+         if self.only_pure_attention or self.explicitly_add_residual:
+             projected_x = x + projected_x
+
+         out = projected_x
          return out
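
Together, the attention.py changes make both the input normalization and the final residual add configurable: RMSNorm is applied only when norm_inputs is set (and now overwrites x instead of producing a separate normed_x), and the block input is added back to the output whenever only_pure_attention or explicitly_add_residual holds. A hedged construction example follows; the field names come from this diff, the concrete values are illustrative assumptions.

# Illustrative only: field names are taken from this diff, values are assumptions.
from flaxdiff.models.attention import TransformerBlock

block = TransformerBlock(
    heads=8,
    dim_head=64,
    use_projection=False,
    only_pure_attention=False,
    norm_inputs=True,              # RMSNorm the input before projecting
    explicitly_add_residual=True,  # add the block input back onto the output
)
# params = block.init(jax.random.PRNGKey(0), x)  # x: (batch, seq_len, channels)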
{flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/models/simple_unet.py

@@ -50,7 +50,7 @@ class Unet(nn.Module):
              features=self.feature_depths[0],
              kernel_size=(3, 3),
              strides=(1, 1),
-             kernel_init=self.kernel_init(1.0),
+             kernel_init=self.kernel_init(scale=1.0),
              dtype=self.dtype,
              precision=self.precision
          )(x)
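
The kernel_init change repeated throughout this file is purely a call-site change: scale is now passed by keyword instead of positionally. That only requires the factory imported from flaxdiff/models/common.py (and stored as self.kernel_init) to expose a scale parameter by name; below is a minimal sketch of such a factory, stated as an assumption rather than the library's actual implementation.

# Assumed shape of the kernel_init factory; the real one lives in
# flaxdiff/models/common.py and may differ in mode/distribution.
import flax.linen as nn

def kernel_init(scale: float = 1.0):
    # Variance-scaling initializer whose magnitude is set by `scale`;
    # scale=0.0 is clamped so the initializer stays well defined.
    return nn.initializers.variance_scaling(
        scale=max(scale, 1e-10), mode="fan_avg", distribution="uniform")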
@@ -65,7 +65,7 @@ class Unet(nn.Module):
                      down_conv_type,
                      name=f"down_{i}_residual_{j}",
                      features=dim_in,
-                     kernel_init=self.kernel_init(1.0),
+                     kernel_init=self.kernel_init(scale=1.0),
                      kernel_size=(3, 3),
                      strides=(1, 1),
                      activation=self.activation,
@@ -83,7 +83,9 @@ class Unet(nn.Module):
                      precision=attention_config.get("precision", self.precision),
                      only_pure_attention=attention_config.get("only_pure_attention", True),
                      force_fp32_for_softmax=attention_config.get("force_fp32_for_softmax", False),
-                     kernel_init=self.kernel_init(1.0),
+                     norm_inputs=attention_config.get("norm_inputs", True),
+                     explicitly_add_residual=attention_config.get("explicitly_add_residual", True),
+                     kernel_init=self.kernel_init(scale=1.0),
                      name=f"down_{i}_attention_{j}")(x, textcontext)
              # print("down residual for feature level", i, "is of shape", x.shape, "features", dim_in)
              downs.append(x)
@@ -106,7 +108,7 @@ class Unet(nn.Module):
              middle_conv_type,
              name=f"middle_res1_{j}",
              features=middle_dim_out,
-             kernel_init=self.kernel_init(1.0),
+             kernel_init=self.kernel_init(scale=1.0),
              kernel_size=(3, 3),
              strides=(1, 1),
              activation=self.activation,
@@ -125,13 +127,15 @@ class Unet(nn.Module):
              precision=middle_attention.get("precision", self.precision),
              only_pure_attention=middle_attention.get("only_pure_attention", True),
              force_fp32_for_softmax=middle_attention.get("force_fp32_for_softmax", False),
-             kernel_init=self.kernel_init(1.0),
+             norm_inputs=middle_attention.get("norm_inputs", True),
+             explicitly_add_residual=middle_attention.get("explicitly_add_residual", True),
+             kernel_init=self.kernel_init(scale=1.0),
              name=f"middle_attention_{j}")(x, textcontext)
          x = ResidualBlock(
              middle_conv_type,
              name=f"middle_res2_{j}",
              features=middle_dim_out,
-             kernel_init=self.kernel_init(1.0),
+             kernel_init=self.kernel_init(scale=1.0),
              kernel_size=(3, 3),
              strides=(1, 1),
              activation=self.activation,
@@ -153,7 +157,7 @@ class Unet(nn.Module):
                      up_conv_type,# if j == 0 else "separable",
                      name=f"up_{i}_residual_{j}",
                      features=dim_out,
-                     kernel_init=self.kernel_init(1.0),
+                     kernel_init=self.kernel_init(scale=1.0),
                      kernel_size=kernel_size,
                      strides=(1, 1),
                      activation=self.activation,
@@ -171,7 +175,9 @@ class Unet(nn.Module):
                      precision=attention_config.get("precision", self.precision),
                      only_pure_attention=attention_config.get("only_pure_attention", True),
                      force_fp32_for_softmax=middle_attention.get("force_fp32_for_softmax", False),
-                     kernel_init=self.kernel_init(1.0),
+                     norm_inputs=attention_config.get("norm_inputs", True),
+                     explicitly_add_residual=attention_config.get("explicitly_add_residual", True),
+                     kernel_init=self.kernel_init(scale=1.0),
                      name=f"up_{i}_attention_{j}")(x, textcontext)
              # print("Upscaling ", i, x.shape)
              if i != len(feature_depths) - 1:
@@ -190,7 +196,7 @@ class Unet(nn.Module):
              features=self.feature_depths[0],
              kernel_size=(3, 3),
              strides=(1, 1),
-             kernel_init=self.kernel_init(1.0),
+             kernel_init=self.kernel_init(scale=1.0),
              dtype=self.dtype,
              precision=self.precision
          )(x)
@@ -201,7 +207,7 @@ class Unet(nn.Module):
              conv_type,
              name="final_residual",
              features=self.feature_depths[0],
-             kernel_init=self.kernel_init(1.0),
+             kernel_init=self.kernel_init(scale=1.0),
              kernel_size=(3,3),
              strides=(1, 1),
              activation=self.activation,
@@ -220,7 +226,7 @@ class Unet(nn.Module):
              kernel_size=(3, 3),
              strides=(1, 1),
              # activation=jax.nn.mish
-             kernel_init=self.kernel_init(0.0),
+             kernel_init=self.kernel_init(scale=0.0),
              dtype=self.dtype,
              precision=self.precision
          )(x)
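
The two new TransformerBlock switches are read from the same per-level attention_config dictionaries as the existing keys and default to True when absent. An illustrative config for one feature level follows; only norm_inputs and explicitly_add_residual are new in this release, and the other values are shown purely for context.

# Keys mirror the attention_config.get(...) calls in the hunks above.
attention_config = {
    "only_pure_attention": True,
    "force_fp32_for_softmax": False,
    "norm_inputs": True,              # new in 0.1.35.6; True when omitted
    "explicitly_add_residual": True,  # new in 0.1.35.6; True when omitted
}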
{flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff/models/simple_vit.py

@@ -69,6 +69,8 @@ class UViT(nn.Module):
      precision: PrecisionLike = None
      kernel_init: Callable = partial(kernel_init, scale=1.0)
      add_residualblock_output: bool = False
+     norm_inputs: bool = False
+     explicitly_add_residual: bool = True
  
      def setup(self):
          if self.norm_groups > 0:
@@ -110,16 +112,20 @@ class UViT(nn.Module):
          for i in range(self.num_layers // 2):
              x = TransformerBlock(heads=self.num_heads, dim_head=self.emb_features // self.num_heads,
                  dtype=self.dtype, precision=self.precision, use_projection=self.use_projection,
-                 use_flash_attention=self.use_flash_attention, use_self_and_cross=self.use_self_and_cross, force_fp32_for_softmax=self.force_fp32_for_softmax,
+                 use_flash_attention=self.use_flash_attention, use_self_and_cross=False, force_fp32_for_softmax=self.force_fp32_for_softmax,
                  only_pure_attention=False,
+                 norm_inputs=self.norm_inputs,
+                 explicitly_add_residual=self.explicitly_add_residual,
                  kernel_init=self.kernel_init())(x)
              skips.append(x)
  
          # Middle block
          x = TransformerBlock(heads=self.num_heads, dim_head=self.emb_features // self.num_heads,
              dtype=self.dtype, precision=self.precision, use_projection=self.use_projection,
-             use_flash_attention=self.use_flash_attention, use_self_and_cross=self.use_self_and_cross, force_fp32_for_softmax=self.force_fp32_for_softmax,
+             use_flash_attention=self.use_flash_attention, use_self_and_cross=False, force_fp32_for_softmax=self.force_fp32_for_softmax,
              only_pure_attention=False,
+             norm_inputs=self.norm_inputs,
+             explicitly_add_residual=self.explicitly_add_residual,
              kernel_init=self.kernel_init())(x)
  
          # # Out blocks
@@ -131,6 +137,8 @@ class UViT(nn.Module):
                  dtype=self.dtype, precision=self.precision, use_projection=self.use_projection,
                  use_flash_attention=self.use_flash_attention, use_self_and_cross=self.use_self_and_cross, force_fp32_for_softmax=self.force_fp32_for_softmax,
                  only_pure_attention=False,
+                 norm_inputs=self.norm_inputs,
+                 explicitly_add_residual=self.explicitly_add_residual,
                  kernel_init=self.kernel_init())(x)
  
          # print(f'Shape of x after transformer blocks: {x.shape}')
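
UViT exposes the same two switches as module fields (defaulting to norm_inputs=False here) and forwards them to every TransformerBlock; the in and middle blocks now also hard-code use_self_and_cross=False, while the out blocks keep the configurable value. A hedged construction example follows, with field names from this diff and the remaining hyperparameters as assumptions.

# Illustrative only: field names appear in this diff, the values are assumptions.
from flaxdiff.models.simple_vit import UViT

model = UViT(
    num_layers=12,
    num_heads=8,
    emb_features=512,
    norm_inputs=False,             # new field; skip the per-block RMSNorm
    explicitly_add_residual=True,  # new field; keep the explicit skip-add
)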
{flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/flaxdiff.egg-info/PKG-INFO

@@ -1,6 +1,6 @@
  Metadata-Version: 2.1
  Name: flaxdiff
- Version: 0.1.35.4
+ Version: 0.1.35.6
  Summary: A versatile and easy to understand Diffusion library
  Author: Ashish Kumar Singh
  Author-email: ashishkmr472@gmail.com
{flaxdiff-0.1.35.4 → flaxdiff-0.1.35.6}/setup.py

@@ -11,7 +11,7 @@ required_packages=[
  setup(
      name='flaxdiff',
      packages=find_packages(),
-     version='0.1.35.4',
+     version='0.1.35.6',
      description='A versatile and easy to understand Diffusion library',
      long_description=open('README.md').read(),
      long_description_content_type='text/markdown',
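
Since setup.py changes only the version string, picking up the behaviour above is a matter of installing the newer release, for example with pip install flaxdiff==0.1.35.6.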