hippoformer 0.0.5__py3-none-any.whl → 0.0.6__py3-none-any.whl
This diff compares the contents of two publicly released package versions as they appear in their public registry. It is provided for informational purposes only.
- hippoformer/hippoformer.py +56 -3
- {hippoformer-0.0.5.dist-info → hippoformer-0.0.6.dist-info}/METADATA +2 -1
- hippoformer-0.0.6.dist-info/RECORD +6 -0
- hippoformer-0.0.5.dist-info/RECORD +0 -6
- {hippoformer-0.0.5.dist-info → hippoformer-0.0.6.dist-info}/WHEEL +0 -0
- {hippoformer-0.0.5.dist-info → hippoformer-0.0.6.dist-info}/licenses/LICENSE +0 -0
hippoformer/hippoformer.py
CHANGED
@@ -7,7 +7,8 @@ from torch.nn import Module
 from torch.jit import ScriptModule, script_method
 from torch.func import vmap, grad, functional_call
 
-from 
+from einx import multiply
+from einops import repeat, rearrange, pack, unpack
 from einops.layers.torch import Rearrange
 
 from x_mlps_pytorch import create_mlp
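The new `einx` dependency supplies pattern-driven elementwise ops. A minimal sketch of the `multiply` call used later in this diff; the tensor names and shapes below are illustrative, not taken from the package:

```python
# Illustrative only: einx.multiply broadcasts the second operand over the
# trailing dims matched by '...' in the first. Shapes here are made up.
import torch
from einx import multiply

grad = torch.randn(2, 5, 64, 16)   # (batch, time, *param_shape)
lr   = torch.randn(2, 5)           # one learned scalar per (batch, time) step

scaled = multiply('b t ..., b t', grad, lr)
assert scaled.shape == grad.shape  # lr is broadcast across the parameter dims
```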
@@ -22,6 +23,16 @@ def exists(v):
 def default(v, d):
     return v if exists(v) else d
 
+def pack_with_inverse(t, pattern):
+    packed, packed_shape = pack([t], pattern)
+
+    def inverse(out, inv_pattern = None):
+        inv_pattern = default(inv_pattern, pattern)
+        unpacked, = unpack(out, packed_shape, inv_pattern)
+        return unpacked
+
+    return packed, inverse
+
 def l2norm(t):
     return F.normalize(t, dim = -1)
 
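For reference, the new helper flattens everything matched by `*` with `einops.pack` and returns a closure that undoes the flattening. A small usage sketch, with hypothetical shapes, assuming `pack_with_inverse` from the hunk above is in scope:

```python
# Hypothetical shapes; assumes pack_with_inverse (and its einops imports) are in scope.
import torch

grad = torch.randn(2, 5, 64, 16)                   # (batch, time, *param_shape)
flat, inverse = pack_with_inverse(grad, 'b t *')   # flat: (2, 5, 1024)

flat = flat * 2                                    # any op that preserves the packed layout
restored = inverse(flat)                           # back to (2, 5, 64, 16)
assert restored.shape == grad.shape
```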
@@ -121,7 +132,8 @@ class mmTEM(Module):
         loss_weight_inference = 1.,
         loss_weight_consistency = 1.,
         loss_weight_relational = 1.,
-        integration_ratio_learned = True
+        integration_ratio_learned = True,
+        assoc_scan_kwargs: dict = dict()
     ):
         super().__init__()
 
@@ -150,6 +162,9 @@ class mmTEM(Module):
         self.to_keys = nn.Linear(dim_joint_rep, dim, bias = False)
         self.to_values = nn.Linear(dim_joint_rep, dim, bias = False)
 
+        self.to_learned_optim_hparams = nn.Linear(dim_joint_rep, 3, bias = False) # for learning rate, forget gate, and momentum
+        self.assoc_scan = AssocScan(*assoc_scan_kwargs)
+
         self.meta_memory_mlp = create_mlp(
             dim = dim * 2,
             depth = meta_mlp_depth,
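The `AssocScan` module (from the `assoc-scan` dependency) is used in the forward pass below to accumulate per-timestep updates. As a rough reference, the recurrence it parallelizes can be written as a plain loop; this is a sketch of the math only, not the package's API, and the gate/input convention is an assumption:

```python
import torch

def gated_scan_reference(inputs, gates, init = None):
    # h_t = gates_t * h_{t-1} + inputs_t, computed sequentially over the time dim.
    # inputs, gates: (batch, time, width); init: (batch, width) or None.
    batch, _, width = inputs.shape
    h = init if init is not None else torch.zeros(batch, width, dtype = inputs.dtype, device = inputs.device)
    outs = []
    for x_t, g_t in zip(inputs.unbind(dim = 1), gates.unbind(dim = 1)):
        h = g_t * h + x_t
        outs.append(h)
    return torch.stack(outs, dim = 1)   # (batch, time, width)
```

An associative scan computes the same prefix recurrence with logarithmic parallel depth, which is why the updates below are expressed through `self.assoc_scan` rather than an explicit loop over time.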
@@ -217,6 +232,8 @@ class mmTEM(Module):
         actions,
         return_losses = False
     ):
+        batch = actions.shape[0]
+
         structural_codes = self.path_integrator(actions)
 
         encoded_sensory = self.sensory_encoder(sensory)
@@ -272,7 +289,43 @@ class mmTEM(Module):
         keys = self.to_keys(joint_code_to_store)
         values = self.to_values(joint_code_to_store)
 
-
+        lr, forget, beta = self.to_learned_optim_hparams(joint_code_to_store).unbind(dim = -1)
+
+        params = dict(self.meta_memory_mlp.named_parameters())
+        grads = self.per_sample_grad_fn(params, keys, values)
+
+        # update the meta mlp parameters
+
+        init_momentums = {k: zeros_like(v) for k, v in params.items()}
+        next_params = dict()
+
+        for (
+            (key, param),
+            (_, grad),
+            (_, init_momentum)
+        ) in zip(
+            params.items(),
+            grads.items(),
+            init_momentums.items()
+        ):
+
+            grad, inverse_pack = pack_with_inverse(grad, 'b t *')
+
+            grad = multiply('b t ..., b t', grad, lr)
+
+            expanded_beta = repeat(beta, 'b t -> b t w', w = grad.shape[-1])
+
+            init_momentum = repeat(init_momentum, '... -> b ...', b = batch)
+
+            update = self.assoc_scan(grad, expanded_beta.sigmoid(), init_momentum)
+
+            expanded_forget = repeat(forget, 'b t -> b t w', w = grad.shape[-1])
+
+            acc_update = self.assoc_scan(update, expanded_forget.sigmoid())
+
+            acc_update = inverse_pack(acc_update)
+
+            next_params[key] = param - acc_update[:, -1]
 
         # losses
 
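The forward pass above calls `self.per_sample_grad_fn(params, keys, values)`, which is not defined in this diff. Given the `vmap`, `grad`, and `functional_call` imports added at the top of the file, a typical construction looks like the sketch below; the MLP, the MSE store loss, and all shapes are assumptions for illustration, not the package's exact definition:

```python
# Sketch only: building a per-sample gradient function with torch.func.
# The memory_mlp, store_loss, and shapes here are assumptions; the actual
# per_sample_grad_fn inside mmTEM is not shown in this diff.
import torch
import torch.nn.functional as F
from torch import nn
from torch.func import vmap, grad, functional_call

memory_mlp = nn.Sequential(nn.Linear(16, 64), nn.SiLU(), nn.Linear(64, 16))

def store_loss(params, key, value):
    pred = functional_call(memory_mlp, params, (key,))
    return F.mse_loss(pred, value)

# gradient w.r.t. params (first argument), mapped over the batch and time dims of keys / values
per_sample_grad_fn = vmap(vmap(grad(store_loss), in_dims = (None, 0, 0)), in_dims = (None, 0, 0))

params = {k: v.detach() for k, v in memory_mlp.named_parameters()}
keys   = torch.randn(2, 5, 16)    # (batch, time, dim)
values = torch.randn(2, 5, 16)

grads = per_sample_grad_fn(params, keys, values)
print(grads['0.weight'].shape)    # torch.Size([2, 5, 64, 16]) -- one gradient per (batch, time) step
```

Each gradient then carries a leading (batch, time) prefix, which is what the `'b t *'` packing and the gated scans above operate on.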
{hippoformer-0.0.5.dist-info → hippoformer-0.0.6.dist-info}/METADATA
CHANGED
@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: hippoformer
-Version: 0.0.5
+Version: 0.0.6
 Summary: hippoformer
 Project-URL: Homepage, https://pypi.org/project/hippoformer/
 Project-URL: Repository, https://github.com/lucidrains/hippoformer
@@ -36,6 +36,7 @@ Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
 Requires-Python: >=3.9
 Requires-Dist: assoc-scan
 Requires-Dist: einops>=0.8.1
+Requires-Dist: einx>=0.3.0
 Requires-Dist: torch>=2.4
 Requires-Dist: x-mlps-pytorch
 Provides-Extra: examples
hippoformer-0.0.6.dist-info/RECORD
ADDED
@@ -0,0 +1,6 @@
+hippoformer/__init__.py,sha256=A7N8GsRAZH4yP-L5hb7IVDnNjnhfjNyolg5MZ6vnGyE,71
+hippoformer/hippoformer.py,sha256=b6EXU2VXh_ZD7brxpCVNuU-m7cE-zXRR-sOmqfofPCg,10839
+hippoformer-0.0.6.dist-info/METADATA,sha256=ufTBdu8ZGggxwfgzphYV56jjaGdI5sLCE_iZF5Bku6s,2800
+hippoformer-0.0.6.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
+hippoformer-0.0.6.dist-info/licenses/LICENSE,sha256=1yCiA9b5nhslTavxPjsQAO-wpOnwJR9-l8LTVi7GJuk,1066
+hippoformer-0.0.6.dist-info/RECORD,,
hippoformer-0.0.5.dist-info/RECORD
DELETED
@@ -1,6 +0,0 @@
-hippoformer/__init__.py,sha256=A7N8GsRAZH4yP-L5hb7IVDnNjnhfjNyolg5MZ6vnGyE,71
-hippoformer/hippoformer.py,sha256=PP2KmTygOP6MyYuhmr_8iEBbywIaTW4TpoIycYRugMo,9142
-hippoformer-0.0.5.dist-info/METADATA,sha256=83iG4F_6ibQy6XSCWht-aF2ZVYmiEq-KSF4XR9YaBtY,2773
-hippoformer-0.0.5.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
-hippoformer-0.0.5.dist-info/licenses/LICENSE,sha256=1yCiA9b5nhslTavxPjsQAO-wpOnwJR9-l8LTVi7GJuk,1066
-hippoformer-0.0.5.dist-info/RECORD,,
{hippoformer-0.0.5.dist-info → hippoformer-0.0.6.dist-info}/WHEEL
File without changes
{hippoformer-0.0.5.dist-info → hippoformer-0.0.6.dist-info}/licenses/LICENSE
File without changes