alphagenome-pytorch 0.0.3-py3-none-any.whl → 0.0.5-py3-none-any.whl

This diff shows the published contents of the alphagenome-pytorch 0.0.3 and 0.0.5 wheels as they appear in the public registry.
--- a/alphagenome_pytorch/alphagenome.py
+++ b/alphagenome_pytorch/alphagenome.py
@@ -2,11 +2,11 @@ from __future__ import annotations
 from functools import partial
 
 import torch
-from torch import nn, cat, stack, arange
+from torch import nn, cat, stack, arange, logspace
 import torch.nn.functional as F
 from torch.nn import Linear, Sequential, Module, ModuleList
 
-import einx
+from einx import add, multiply, greater
 from einops.layers.torch import Rearrange, Reduce
 from einops import rearrange, repeat, einsum
 
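The second import change swaps the bare `import einx` for direct imports of the einx ops this file uses. einx ops take an axis-pattern string and broadcast their arguments by named axes; a minimal sketch of the two patterns that appear below (tensors and sizes here are invented):

```python
# minimal sketch of the einx named-axis ops used in this diff; sizes are invented
import torch
from einx import add, greater

q = torch.randn(2, 4, 8)                      # (b, i, d)
k = torch.randn(2, 6, 8)                      # (b, j, d)

# pairwise 'outer sum': out[b, i, j, d] = q[b, i, d] + k[b, j, d]
outer = add('b i d, b j d -> b i j d', q, k)
assert outer.shape == (2, 4, 6, 8)

widths = torch.tensor([1., 2., 4.])           # (j,)
dists = torch.tensor([0., 3.])                # (i,)

# broadcasted comparison: mask[i, j] = widths[j] > dists[i]
mask = greater('j, i -> i j', widths, dists)
assert mask.shape == (2, 3)
```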
@@ -15,6 +15,7 @@ from einops import rearrange, repeat, einsum
 # b - batch
 # h - heads
 # n - sequence
+# p - relative positions
 # d - feature dimension
 
 # constants
@@ -41,6 +42,12 @@ def default(v, d):
 def softclamp(t, value = 5.):
     return (t / value).tanh() * value
 
+def relative_shift(t):
+    *leading_dims, seq_len, dim = t.shape
+    t = F.pad(t, (1, 0), value = 0.)
+    t = t.reshape(*leading_dims, dim + 1, seq_len)
+    return t[..., 1:, :].reshape(*leading_dims, seq_len, dim)
+
 # rotary, but with attenuation of short relative distance frequencies
 
 class RotaryEmbedding(Module):
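The new `relative_shift` is the standard pad-and-reshape trick (as used in Transformer-XL and Enformer) that turns logits indexed by relative offset into logits indexed by key position without an explicit gather. A toy check of what it does, assuming the input's last axis holds offsets -(n-1)..(n-1):

```python
# toy check of the pad-and-reshape trick: for an (n, 2n - 1) matrix whose
# columns index relative offsets -(n-1)..(n-1), row i / column j of the
# shifted result (for j < n) holds the entry for offset j - i
import torch
import torch.nn.functional as F

def relative_shift(t):
    *leading_dims, seq_len, dim = t.shape
    t = F.pad(t, (1, 0), value = 0.)
    t = t.reshape(*leading_dims, dim + 1, seq_len)
    return t[..., 1:, :].reshape(*leading_dims, seq_len, dim)

n = 3
t = torch.arange(n * (2 * n - 1)).reshape(n, 2 * n - 1).float()
shifted = relative_shift(t)

for i in range(n):
    for j in range(n):
        assert shifted[i, j] == t[i, (j - i) + (n - 1)]
```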
@@ -51,7 +58,7 @@ class RotaryEmbedding(Module):
     ):
         super().__init__()
         num_freqs = dim // 2
-        inv_freq = 1. / (arange(num_freqs).float() + torch.logspace(1, max_positions - num_freqs + 1, num_freqs))
+        inv_freq = 1. / (arange(num_freqs).float() + logspace(1, max_positions - num_freqs + 1, num_freqs))
         self.register_buffer('inv_freq', inv_freq)
 
     def forward(
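Only the import style changes here, but it is worth recalling that `torch.logspace` is base-10: it returns `steps` values spaced evenly in exponent from `10**start` to `10**end`, so this frequency ladder is geometric, not linear.

```python
# torch.logspace(start, end, steps) is base-10 by default
import torch

print(torch.logspace(1, 3, 3))  # tensor([  10.,  100., 1000.])
```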
@@ -70,6 +77,32 @@ def rotate_half(x):
 def apply_rotary_pos_emb(pos, t):
     return t * pos.cos() + rotate_half(t) * pos.sin()
 
+# 'central mask features' - relative positions for constituting pairwise rep
+
+class RelativePosFeatures(Module):
+    def __init__(self, pool_size = 16):
+        super().__init__()
+        self.pool_size = pool_size
+
+    def forward(self, single):
+
+        _, seq_len, dim = single.shape
+
+        seq_len //= self.pool_size
+        half_dim = dim // 2
+
+        rel_pos = arange(2 * seq_len - 1) - (seq_len - 1)
+
+        center_widths = (
+            arange(half_dim) +
+            logspace(1, seq_len - half_dim + 1, half_dim + 1)[:-1] # endpoint = False
+        )
+
+        abs_rel_pos, rel_pos_sign = rel_pos.abs(), rel_pos.sign()
+        embeds = greater('j, i -> i j', center_widths, abs_rel_pos).float()
+
+        return cat((embeds, multiply('i, i j', rel_pos_sign, embeds)), dim = -1)
+
 # prenorm and sandwich norm - they use sandwich norm for single rep, prenorm for pairwise rep
 
 class NormWrapper(Module):
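`RelativePosFeatures` produces the 'central mask' features: for each of the `2L - 1` pooled relative offsets (`L = seq_len // pool_size`) it emits `dim // 2` binary indicators of whether the offset falls inside a ladder of center widths, concatenated with the same indicators multiplied by the offset's sign. A hypothetical shape check, reusing the class defined above with invented sizes:

```python
# hypothetical shape check; assumes RelativePosFeatures (defined above) is in scope
import torch

single = torch.randn(1, 256, 64)                 # (batch, seq, dim), sizes invented
feats = RelativePosFeatures(pool_size = 16)(single)

# pooled length L = 256 // 16 = 16, so 2L - 1 = 31 relative offsets,
# each with dim // 2 = 32 mask bits plus their 32 sign-weighted copies
assert feats.shape == (31, 64)
```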
@@ -90,10 +123,11 @@ class NormWrapper(Module):
     def forward(
         self,
         x,
+        *args,
         **kwargs
     ):
         x = self.pre_rmsnorm(x)
-        out = self.block(x, **kwargs)
+        out = self.block(x, *args, **kwargs)
         out = self.post_block_dropout(out)
         return self.post_rmsnorm(out)
 
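This `*args` pass-through is what lets the new positional `rel_pos_feats` argument reach `SingleToPairwise` below, assuming (as the surrounding code suggests) that the tower's blocks are wrapped in `NormWrapper`.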
@@ -210,7 +244,7 @@ class SingleToPairwise(Module):
 
         dim_inner = heads * dim_pairwise
 
-        self.split_heads = Rearrange('b n (h d) -> b n h d', h = heads)
+        self.split_heads = Rearrange('... (h d) -> ... h d', h = heads)
 
         self.to_outer_sum = Sequential(
             nn.GELU(),
@@ -220,7 +254,16 @@ class SingleToPairwise(Module):
         self.to_qk = LinearNoBias(dim, dim_inner * 2)
         self.qk_to_pairwise = Linear(heads, dim_pairwise)
 
-    def forward(self, single):
+        # relative position related
+
+        self.to_rel_pos_encoding = Linear(dim, heads * dim_pairwise)
+        self.qk_rel_pos_bias = nn.Parameter(torch.zeros(2, 1, 1, heads, dim_pairwise))
+
+    def forward(
+        self,
+        single,
+        rel_pos_feats = None
+    ):
 
         single = self.avg_pool(single)
 
@@ -229,11 +272,29 @@ class SingleToPairwise(Module):
 
         sim = einsum(q, k, 'b i h d, b j h d -> b i j h')
 
+        if exists(rel_pos_feats):
+            rel_pos_encoding = self.to_rel_pos_encoding(rel_pos_feats)
+            rel_pos_encoding = self.split_heads(rel_pos_encoding)
+
+            q_rel_bias, k_rel_bias = self.qk_rel_pos_bias
+
+            rel_q = relative_shift(einsum(q + q_rel_bias, rel_pos_encoding, 'b n h d, p h d -> b n p h'))
+            rel_k = relative_shift(einsum(k + k_rel_bias, rel_pos_encoding, 'b n h d, p h d -> b n p h'))
+
+            _, seq, rel_pos_seq, _ = rel_q.shape
+            crop_padding = (rel_pos_seq - seq) // 2
+
+            rel_q, rel_k = tuple(t[..., crop_padding:(crop_padding + seq), :] for t in (rel_q, rel_k))
+
+            rel_sim = add('b i j d, b j i d -> b i j d', rel_q, rel_k) * 0.5
+
+            sim = sim + rel_sim
+
         pairwise_from_sim = self.qk_to_pairwise(sim)
 
         outer_q, outer_k = self.to_outer_sum(single).chunk(2, dim = -1)
 
-        outer_sum = einx.add('b i d, b j d -> b i j d', outer_q, outer_k)
+        outer_sum = add('b i d, b j d -> b i j d', outer_q, outer_k)
 
         return outer_sum
 
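The new branch scores each (biased) query and key against a learned encoding of every relative offset, realigns the result with `relative_shift`, then center-crops the offset axis back to the sequence length so it lines up with `sim`'s key axis; the `rel_sim` line then averages the query contribution with the transposed key contribution to keep the bias symmetric. A sketch of the shapes with invented sizes, reusing `relative_shift` from earlier in this diff:

```python
# shape trace of the relative-position branch; sizes invented
# (assumes relative_shift, defined earlier in this diff, is in scope)
import torch
from einops import einsum

b, n, h, d = 1, 8, 2, 4                          # batch, pooled seq, heads, dim_pairwise
q = torch.randn(b, n, h, d)
rel_pos_encoding = torch.randn(2 * n - 1, h, d)  # one (h, d) encoding per offset

rel_q = einsum(q, rel_pos_encoding, 'b n h d, p h d -> b n p h')
assert rel_q.shape == (b, n, 2 * n - 1, h)

rel_q = relative_shift(rel_q)                    # same shape, offsets realigned
crop = ((2 * n - 1) - n) // 2                    # crop_padding in the code above
rel_q = rel_q[..., crop:crop + n, :]
assert rel_q.shape == (b, n, n, h)               # now matches sim's (b, i, j, h)
```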
@@ -304,6 +365,7 @@ class TransformerTower(Module):
         dim_pairwise = None,
         pairwise_every_num_single_blocks = 2, # how often to do a pairwise block
         single_to_pairwise_heads = 32, # they did 32
+        pool_size = 16,
         attn_kwargs: dict = dict(),
         ff_kwargs: dict = dict()
     ):
@@ -314,6 +376,8 @@ class TransformerTower(Module):
 
         self.pairwise_every = pairwise_every_num_single_blocks
 
+        self.rel_pos_features = RelativePosFeatures(pool_size)
+
         self.rotary_emb = RotaryEmbedding(dim_head_qk, max_positions = max_positions)
 
         for layer_index in range(depth):
@@ -330,7 +394,7 @@ class TransformerTower(Module):
             single_to_pairwise, pairwise_attn, pairwise_ff = None, None, None
 
             if divisible_by(layer_index, self.pairwise_every):
-                single_to_pairwise = SingleToPairwise(dim = dim, dim_pairwise = dim_pairwise, heads = single_to_pairwise_heads)
+                single_to_pairwise = SingleToPairwise(dim = dim, dim_pairwise = dim_pairwise, heads = single_to_pairwise_heads, pool_size = pool_size)
                 pairwise_attn = PairwiseRowAttention(dim_pairwise)
                 pairwise_ff = FeedForward(dim = dim_pairwise, expansion_factor = ff_expansion_factor)
 
@@ -360,6 +424,8 @@ class TransformerTower(Module):
 
         pairwise = None
 
+        rel_pos_feats = self.rel_pos_features(single)
+
         rotary_emb = self.rotary_emb(seq_len)
 
         for (
@@ -374,7 +440,7 @@ class TransformerTower(Module):
             single = ff(single) + single
 
             if exists(maybe_single_to_pair):
-                pairwise = maybe_single_to_pair(single) + default(pairwise, 0.)
+                pairwise = maybe_single_to_pair(single, rel_pos_feats) + default(pairwise, 0.)
                 pairwise = maybe_pairwise_attn(pairwise) + pairwise
                 pairwise = maybe_pairwise_ff(pairwise) + pairwise
 
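Putting the source changes together: the tower now builds the relative position features once per forward pass and threads them into every `SingleToPairwise` block. A hypothetical usage sketch; the keyword names are the ones visible in this diff, but the values, the `dim`/`depth` arguments, and the import path are assumptions, not confirmed by it:

```python
# hypothetical usage sketch; dim, depth, all values, and the import path
# are assumptions - only the keyword names are visible in this diff
import torch
from alphagenome_pytorch.alphagenome import TransformerTower

tower = TransformerTower(
    dim = 768,
    depth = 8,
    dim_pairwise = 128,
    pairwise_every_num_single_blocks = 2,
    single_to_pairwise_heads = 32,
    pool_size = 16   # new in 0.0.5; must match the RelativePosFeatures pooling
)

single = torch.randn(1, 512, 768)   # (batch, sequence, dim)
out = tower(single)                 # rel pos features are computed once per forward
```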
--- a/alphagenome_pytorch-0.0.3.dist-info/METADATA
+++ b/alphagenome_pytorch-0.0.5.dist-info/METADATA
@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: alphagenome-pytorch
-Version: 0.0.3
+Version: 0.0.5
 Summary: AlphaGenome
 Project-URL: Homepage, https://pypi.org/project/alphagenome-pytorch/
 Project-URL: Repository, https://github.com/lucidrains/alphagenome
--- /dev/null
+++ b/alphagenome_pytorch-0.0.5.dist-info/RECORD
@@ -0,0 +1,6 @@
+alphagenome_pytorch/__init__.py,sha256=7plC_YRm0UapNCl9hJEhFxXE-ELGKVy-DtuO5GUQxGI,101
+alphagenome_pytorch/alphagenome.py,sha256=5uxmx-x-6KSu-2aUF4AxM-rYSxXuwnr-0meTNhu2vUM,14086
+alphagenome_pytorch-0.0.5.dist-info/METADATA,sha256=0W6pkI9-RvNCOixhC1ius8a4-cwpTx7gsA370FLmnsY,3386
+alphagenome_pytorch-0.0.5.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
+alphagenome_pytorch-0.0.5.dist-info/licenses/LICENSE,sha256=1yCiA9b5nhslTavxPjsQAO-wpOnwJR9-l8LTVi7GJuk,1066
+alphagenome_pytorch-0.0.5.dist-info/RECORD,,
--- a/alphagenome_pytorch-0.0.3.dist-info/RECORD
+++ /dev/null
@@ -1,6 +0,0 @@
-alphagenome_pytorch/__init__.py,sha256=7plC_YRm0UapNCl9hJEhFxXE-ELGKVy-DtuO5GUQxGI,101
-alphagenome_pytorch/alphagenome.py,sha256=ynMieMVxKkL-BFr9yyAku4J48P4gaRAc0z0GmThTot0,11818
-alphagenome_pytorch-0.0.3.dist-info/METADATA,sha256=uKEwowc-D-OO5pZ_JU176e1AIB7o_-pKbKJRiyF0WO0,3386
-alphagenome_pytorch-0.0.3.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
-alphagenome_pytorch-0.0.3.dist-info/licenses/LICENSE,sha256=1yCiA9b5nhslTavxPjsQAO-wpOnwJR9-l8LTVi7GJuk,1066
-alphagenome_pytorch-0.0.3.dist-info/RECORD,,