Skip to content

Commit bfc1dd4

Browse files
committed
Fix: enable memory-efficient attention on ROCm
by calling the CK implementation
1 parent 74b6752 commit bfc1dd4

File tree

1 file changed

+2
-5
lines changed

1 file changed

+2
-5
lines changed

src/diffusers/models/attention_processor.py

Lines changed: 2 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -399,11 +399,8 @@ def set_use_memory_efficient_attention_xformers(
399399
else:
400400
try:
401401
# Make sure we can run the memory efficient attention
402-
_ = xformers.ops.memory_efficient_attention(
403-
torch.randn((1, 2, 40), device="cuda"),
404-
torch.randn((1, 2, 40), device="cuda"),
405-
torch.randn((1, 2, 40), device="cuda"),
406-
)
402+
q = torch.randn((1, 2, 40), device="cuda", dtype=torch.float16)
403+
_ = xformers.ops.memory_efficient_attention(q, q, q)
407404
except Exception as e:
408405
raise e
409406

0 commit comments

Comments
 (0)