@@ -151,10 +151,7 @@ def repeat_consecutive_with_lens(
     lens: Int['b n'],
 ) -> Float['b m ...'] | Bool['b m']:
 
-    is_bool = feats.dtype == torch.bool
-    feats = feats.float()
-
-    device = feats.device
+    device, dtype = feats.device, feats.dtype
 
     batch, seq, *dims = feats.shape
 
@@ -174,25 +171,38 @@ def repeat_consecutive_with_lens(
     # create output tensor + a sink position on the very right (index max_len)
 
     total_lens = lens.sum(dim = -1)
+    output_mask = lens_to_mask(total_lens)
+
     max_len = total_lens.amax()
 
-    output = torch.zeros((batch, max_len + 1, *dims), device = device)
+    output_indices = torch.zeros((batch, max_len + 1), device = device, dtype = torch.long)
 
     indices.masked_fill_(~mask, max_len) # scatter to sink position for padding
     indices = rearrange(indices, 'b n w -> b (n w)')
 
-    feats = repeat(feats, 'b n ... -> b (n w) ...', w = window_size)
-
     # scatter
 
-    output = einx.set_at('b [m] ..., b nw, b nw ... -> b [m] ...', output, indices, feats)
+    seq_arange = torch.arange(seq, device = device)
+    seq_arange = repeat(seq_arange, 'n -> (n w)', w = window_size)
+
+    output_indices = einx.set_at('b [m], b nw, nw -> b [m]', output_indices, indices, seq_arange)
 
     # remove sink
 
-    output = output[:, :-1]
+    output_indices = output_indices[:, :-1]
+
+    # gather
+
+    output = einx.get_at('b [n] ..., b m -> b m ...', feats, output_indices)
+
+    # final mask
+
+    mask_value = False if dtype == torch.bool else 0
 
-    if is_bool:
-        output = output.bool()
+    output = einx.where(
+        'b n, b n ..., -> b n ...',
+        output_mask, output, mask_value
+    )
 
     return output
 
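For readers reviewing the change, here is a minimal reference sketch of the behaviour `repeat_consecutive_with_lens` is expected to produce: the feature at each position `i` is repeated `lens[..., i]` times back to back, and rows are padded with zeros (or `False` for boolean inputs) up to the longest total length in the batch. It uses plain `torch.repeat_interleave` instead of the windowed einx scatter/gather above, and the helper name `repeat_consecutive_reference` is illustrative only, not part of the repository.

```python
import torch

def repeat_consecutive_reference(feats, lens):
    # feats: (batch, seq, ...), lens: (batch, seq) of non-negative integers
    batch = feats.shape[0]
    total_lens = lens.sum(dim = -1)
    max_len = int(total_lens.amax().item())

    # zeros (False for bool feats) so padded positions come out masked
    output = torch.zeros((batch, max_len, *feats.shape[2:]), dtype = feats.dtype, device = feats.device)

    for b in range(batch):
        # repeat each position lens[b, i] times, consecutively
        repeated = torch.repeat_interleave(feats[b], lens[b], dim = 0)
        output[b, :repeated.shape[0]] = repeated

    return output

feats = torch.tensor([[1., 2., 3.]])   # (batch = 1, seq = 3)
lens  = torch.tensor([[2, 0, 3]])
print(repeat_consecutive_reference(feats, lens))   # tensor([[1., 1., 3., 3., 3.]])
```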