hyper-connections 0.0.16.tar.gz → 0.0.18.tar.gz
This diff covers publicly available package versions released to one of the supported registries. It is provided for informational purposes only and reflects the changes between the two versions as they appear in the public registry.
- {hyper_connections-0.0.16 → hyper_connections-0.0.18}/PKG-INFO +1 -1
- {hyper_connections-0.0.16 → hyper_connections-0.0.18}/hyper_connections/hyper_connections.py +7 -2
- {hyper_connections-0.0.16 → hyper_connections-0.0.18}/hyper_connections/hyper_connections_with_multi_branch_inputs.py +38 -9
- {hyper_connections-0.0.16 → hyper_connections-0.0.18}/pyproject.toml +1 -1
- {hyper_connections-0.0.16 → hyper_connections-0.0.18}/.github/workflows/python-publish.yml +0 -0
- {hyper_connections-0.0.16 → hyper_connections-0.0.18}/.gitignore +0 -0
- {hyper_connections-0.0.16 → hyper_connections-0.0.18}/LICENSE +0 -0
- {hyper_connections-0.0.16 → hyper_connections-0.0.18}/README.md +0 -0
- {hyper_connections-0.0.16 → hyper_connections-0.0.18}/hyper-connections.png +0 -0
- {hyper_connections-0.0.16 → hyper_connections-0.0.18}/hyper_connections/__init__.py +0 -0
{hyper_connections-0.0.16 → hyper_connections-0.0.18}/hyper_connections/hyper_connections.py
RENAMED

```diff
@@ -86,7 +86,8 @@ class HyperConnections(Module):
         branch: Module | None = None,
         layer_index = None,
         tanh = True,
-        channel_first = False
+        channel_first = False,
+        dropout = 0.
     ):
         """
         Appendix J, Algorithm2 in - https://arxiv.org/abs/2409.19606
@@ -116,6 +117,10 @@ class HyperConnections(Module):
         self.dynamic_beta_fn = nn.Parameter(torch.zeros(dim))
         self.dynamic_beta_scale = nn.Parameter(torch.ones(()) * 1e-2)
 
+        # dropouts
+
+        self.dropout = nn.Dropout(dropout)
+
         # channel first option
 
         self.channel_first = channel_first
@@ -184,7 +189,7 @@ class HyperConnections(Module):
         if self.channel_first:
             output = rearrange(output, 'b ... d -> b d ...')
 
-        return output
+        return self.dropout(output)
 
     def decorate_branch(self, branch: Callable):
         assert not exists(self.branch), 'branch was already wrapped on init'
```
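The net effect is a new `dropout` argument applied to the mixed output before it is returned. A minimal usage sketch, assuming the constructor signature shown above; the top-level import and the streams-folded-into-batch tensor layout are assumptions drawn from the package's usual conventions, not confirmed by this diff:

```python
import torch
import torch.nn.functional as F

from hyper_connections import HyperConnections  # assumed re-export from __init__.py

# hypothetical setup: 4 residual streams, feature dimension 512
hyper_conn = HyperConnections(
    4,
    dim = 512,
    dropout = 0.1  # new in this release; defaults to 0., preserving old behavior
)

# residual streams folded into the batch dimension: (streams * batch, seq, dim) - assumed layout
residual = torch.randn(4 * 2, 16, 512)

# with no branch wrapped on init, forward returns the branch input plus a
# callback that mixes the branch output back into the residual streams
branch_input, add_residual = hyper_conn(residual)

branch_output = F.silu(branch_input)    # stand-in for a real branch module
residual = add_residual(branch_output)  # per the diff, dropout hits the mixed output
```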
{hyper_connections-0.0.16 → hyper_connections-0.0.18}/hyper_connections/hyper_connections_with_multi_branch_inputs.py
RENAMED

```diff
@@ -6,8 +6,8 @@ from random import randrange
 
 import torch
 from torch import nn
-from torch.nn import Module
 import torch.nn.functional as F
+from torch.nn import Module, ModuleList
 from torch.utils._pytree import tree_flatten, tree_unflatten
 
 from einops import rearrange, repeat, reduce, einsum
@@ -22,6 +22,9 @@ def exists(v):
 def default(v, d):
     return v if exists(v) else d
 
+def divisible_by(num, den):
+    return (num % den) == 0
+
 def identity(t):
     return t
 
@@ -35,10 +38,11 @@ class HyperConnections(Module):
         num_residual_streams,
         *,
         dim,
-        branch: Module | None = None,
+        branch: Module | tuple[Module, ...] | list[Module] | None = None,
         layer_index = None,
         tanh = True,
         channel_first = False,
+        dropout = 0.,
         num_branch_inputs = 1 # residuals will be linearly combined to multiple inputs, fed through the branch, then linearly combined back out to residuals
     ):
         """
@@ -46,7 +50,15 @@ class HyperConnections(Module):
         """
         super().__init__()
 
-        self.branch = branch
+        self.branches = None
+
+        if isinstance(branch, Module):
+            branch = [branch]
+
+        if exists(branch):
+            assert divisible_by(num_branch_inputs, len(branch))
+
+            self.branches = ModuleList(branch)
 
         # activation, seemingly results were wishy washy depending on using tanh or not
 
@@ -78,6 +90,10 @@ class HyperConnections(Module):
         self.dynamic_beta_fn = nn.Parameter(torch.zeros(dim, num_branch_inputs))
         self.dynamic_beta_scale = nn.Parameter(torch.ones(()) * 1e-2)
 
+        # dropout
+
+        self.dropout = nn.Dropout(dropout)
+
         # channel first option
 
         self.channel_first = channel_first
@@ -153,15 +169,24 @@ class HyperConnections(Module):
         if self.channel_first:
             output = rearrange(output, 'b ... d -> b d ...')
 
-        return output
+        return self.dropout(output)
 
-    def decorate_branch(self, branch: Callable):
-        assert not exists(self.branch), 'branch was already wrapped on init'
+    def decorate_branch(self, branch: Callable | tuple[Callable, ...] | list[Callable]):
+        assert not exists(self.branches), 'branch was already wrapped on init'
 
         def forward_and_add_residual(residual, *args, **kwargs):
             branch_input, add_residual = self.forward(residual)
 
-            branch_output = self.branch(branch_input, *args, **kwargs)
+            if callable(branch):
+                branches = [branch]
+            else:
+                branches = branch
+
+            branch_inputs = rearrange(branch_input, '(br b) ... -> br b ...', br = len(branches))
+
+            branch_outputs = [fn(x, *args, **kwargs) for fn, x in zip(branches, branch_inputs)]
+
+            branch_output = torch.cat(branch_outputs)
 
             residual = add_residual(branch_output)
 
@@ -180,9 +205,13 @@ class HyperConnections(Module):
 
             return tree_unflatten((branch_out, *rest), tree_spec)
 
-        if not exists(self.branch):
+        if not exists(self.branches):
             return branch_input, add_residual_fn
 
-        branch_output = self.branch(branch_input, *branch_args, **branch_kwargs)
+        branch_inputs = rearrange(branch_input, '(br b) ... -> br b ...', br = len(self.branches))
+
+        branch_outputs = [fn(x, *branch_args, **branch_kwargs) for fn, x in zip(self.branches, branch_inputs)]
+
+        branch_output = torch.cat(branch_outputs)
 
         return add_residual_fn(branch_output)
```
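Taken together, the multi-branch variant now accepts a tuple or list of branch modules (stored in a `ModuleList`), requires `num_branch_inputs` to be divisible by the branch count, and both `forward` and `decorate_branch` split the combined branch input across the branches along the batch dimension, concatenating the outputs before mixing them back into the residual streams. A minimal sketch under those semantics; the import path and tensor layout are assumptions, not confirmed by this diff:

```python
import torch
from torch import nn

# class name and file path per this diff; whether it is re-exported elsewhere is unknown
from hyper_connections.hyper_connections_with_multi_branch_inputs import HyperConnections

# hypothetical setup: two branch modules sharing two branch inputs
# (2 % 2 == 0, satisfying the new divisible_by(num_branch_inputs, len(branch)) assert)
hyper_conn = HyperConnections(
    4,                 # num_residual_streams
    dim = 512,
    branch = [nn.Linear(512, 512), nn.Linear(512, 512)],  # new: list of Modules accepted
    num_branch_inputs = 2,
    dropout = 0.1
)

# residual streams folded into the batch dimension: (streams * batch, seq, dim) - assumed layout
residual = torch.randn(4 * 2, 16, 512)

# with branches wrapped on init, forward runs each branch on its slice of the
# branch input, concatenates the outputs, and adds them back to the residuals
residual = hyper_conn(residual)
```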
{hyper_connections-0.0.16 → hyper_connections-0.0.18}/.github/workflows/python-publish.yml
File without changes

{hyper_connections-0.0.16 → hyper_connections-0.0.18}/.gitignore
File without changes

{hyper_connections-0.0.16 → hyper_connections-0.0.18}/LICENSE
File without changes

{hyper_connections-0.0.16 → hyper_connections-0.0.18}/README.md
File without changes

{hyper_connections-0.0.16 → hyper_connections-0.0.18}/hyper-connections.png
File without changes

{hyper_connections-0.0.16 → hyper_connections-0.0.18}/hyper_connections/__init__.py
File without changes