Commit 62863ac

~7% speedup (1.57 to 1.69 it/s) from switching to += in ldm.modules.attention (#482)
Tested on an 8 GB NVIDIA eGPU setup, so YMMV. 512x512 output; max VRAM stays the same.
1 parent 79ac0f3 commit 62863ac

File tree

1 file changed: +3, -3 lines


ldm/modules/attention.py

Lines changed: 3 additions & 3 deletions
@@ -235,9 +235,9 @@ def forward(self, x, context=None):

     def _forward(self, x, context=None):
         x = x.contiguous() if x.device.type == 'mps' else x
-        x = self.attn1(self.norm1(x)) + x
-        x = self.attn2(self.norm2(x), context=context) + x
-        x = self.ff(self.norm3(x)) + x
+        x += self.attn1(self.norm1(x))
+        x += self.attn2(self.norm2(x), context=context)
+        x += self.ff(self.norm3(x))
         return x