PyPI - hippoformer - Versions diffs - 0.0.8__tar.gz → 0.0.9__tar.gz - Mend

hippoformer 0.0.8.tar.gz → 0.0.9.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (11)

{hippoformer-0.0.8 → hippoformer-0.0.9}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: hippoformer
-Version: 0.0.8
+Version: 0.0.9
 Summary: hippoformer
 Project-URL: Homepage, https://pypi.org/project/hippoformer/
 Project-URL: Repository, https://github.com/lucidrains/hippoformer

{hippoformer-0.0.8 → hippoformer-0.0.9}/hippoformer/hippoformer.py RENAMED Viewed

@@ -38,6 +38,40 @@ def pack_with_inverse(t, pattern):
 def l2norm(t):
     return F.normalize(t, dim = -1)
+# Muon - Jordan et al from oss community - applied to the latest version of titans
+def newtonschulz5(
+    t,
+    steps = 5,
+    eps = 1e-7,
+    coefs = (3.4445, -4.7750, 2.0315)
+):
+    not_weights = t.ndim <= 3
+    if not_weights:
+        return t
+    shape = t.shape
+    should_transpose = shape[-2] > shape[-1]
+    if should_transpose:
+        t = t.transpose(-1, -2)
+    t, inv_pack = pack_with_inverse(t, '* i j')
+    t = t / t.norm(dim = (-1, -2), keepdim = True).clamp(min = eps)
+    a, b, c = coefs
+    for _ in range(steps):
+        A = t @ t.transpose(-1, -2)
+        B = b * A + c * A @ A
+        t = a * t + B @ t
+    if should_transpose:
+        t = t.transpose(-1, -2)
+    return inv_pack(t)
 # sensory encoder decoder for 2d
 grid_sensory_enc_dec = (
@@ -209,6 +243,7 @@ class mmTEM(Module):
         loss_weight_consistency = 1.,
         loss_weight_relational = 1.,
         integration_ratio_learned = True,
+        muon_update = False,
         assoc_scan_kwargs: dict = dict()
     ):
         super().__init__()
@@ -287,6 +322,10 @@ class mmTEM(Module):
         self.loss_weight_consistency = loss_weight_consistency
         self.register_buffer('zero', tensor(0.), persistent = False)
+        # update with muon
+        self.muon_update = muon_update
         # there is an integration ratio for error correction, but unclear what value this is fixed to or whether it is learned
         self.integration_ratio = nn.Parameter(tensor(0.), requires_grad = integration_ratio_learned)
@@ -416,6 +455,13 @@ class mmTEM(Module):
             update = self.assoc_scan(grad, expanded_beta.sigmoid(), momentum)
+            # maybe muon
+            if self.muon_update:
+                update = newtonschulz5(update)
+            # with forget gating
             expanded_forget = repeat(forget, 'b t -> b t w', w = grad.shape[-1])
             acc_update = self.assoc_scan(update, expanded_forget.sigmoid())

{hippoformer-0.0.8 → hippoformer-0.0.9}/pyproject.toml RENAMED Viewed

@@ -1,6 +1,6 @@
 [project]
 name = "hippoformer"
-version = "0.0.8"
+version = "0.0.9"
 description = "hippoformer"
 authors = [
     { name = "Phil Wang", email = "lucidrains@gmail.com" }

{hippoformer-0.0.8 → hippoformer-0.0.9}/tests/test_hippoformer.py RENAMED Viewed

@@ -16,8 +16,10 @@ def test_path_integrate():
     assert structure_codes.shape == (2, 16, 64)
 @param('sensory_type', ('naive', '2d', '3d'))
+@param('muon_update', (True, False))
 def test_mm_tem(
-    sensory_type
+    sensory_type,
+    muon_update
 ):
     import torch
     from hippoformer.hippoformer import mmTEM
@@ -52,7 +54,8 @@ def test_mm_tem(
         dim_sensory = 11,
         dim_action = 7,
         dim_structure = 32,
-        dim_encoded_sensory = 32
+        dim_encoded_sensory = 32,
+        muon_update = muon_update
     )
     actions = torch.randn(2, 16, 7)

{hippoformer-0.0.8 → hippoformer-0.0.9}/.github/workflows/python-publish.yml RENAMED Viewed

File without changes

{hippoformer-0.0.8 → hippoformer-0.0.9}/.github/workflows/test.yml RENAMED Viewed

File without changes

{hippoformer-0.0.8 → hippoformer-0.0.9}/.gitignore RENAMED Viewed

File without changes

{hippoformer-0.0.8 → hippoformer-0.0.9}/LICENSE RENAMED Viewed

File without changes

{hippoformer-0.0.8 → hippoformer-0.0.9}/README.md RENAMED Viewed

File without changes

{hippoformer-0.0.8 → hippoformer-0.0.9}/hippoformer/__init__.py RENAMED Viewed

File without changes

{hippoformer-0.0.8 → hippoformer-0.0.9}/hippoformer-fig6.png RENAMED Viewed

File without changes

hippoformer 0.0.8.tar.gz → 0.0.9.tar.gz

hippoformer 0.0.8.tar.gz → 0.0.9.tar.gz