Implement attention mask on xformers.
parent af94eb14e3
commit 3ad0191bfb
@@ -294,11 +294,14 @@ def attention_xformers(q, k, v, heads, mask=None):
         (q, k, v),
     )
 
     # actually compute the attention, what we cannot get enough of
-    out = xformers.ops.memory_efficient_attention(q, k, v, attn_bias=None)
+    if mask is not None:
+        pad = 8 - q.shape[1] % 8
+        mask_out = torch.empty([q.shape[0], q.shape[1], q.shape[1] + pad], dtype=q.dtype, device=q.device)
+        mask_out[:, :, :mask.shape[-1]] = mask
+        mask = mask_out[:, :, :mask.shape[-1]]
 
-    if exists(mask):
-        raise NotImplementedError
+    out = xformers.ops.memory_efficient_attention(q, k, v, attn_bias=mask)
     out = (
         out.unsqueeze(0)
         .reshape(b, heads, -1, dim_head)
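For context on the change: instead of raising NotImplementedError when a mask is supplied, the mask is now copied into a buffer whose last dimension is padded past the next multiple of 8, and a trimmed view of that buffer is passed as attn_bias to xformers.ops.memory_efficient_attention, presumably so the bias storage meets xformers' alignment expectations. Below is a minimal sketch of that padding pattern, not code from the commit; pad_attn_mask and the (batch * heads, q_len, kv_len) mask layout are assumptions made for illustration.

import torch
import xformers.ops

def pad_attn_mask(mask: torch.Tensor, q_len: int) -> torch.Tensor:
    # Allocate a buffer whose last dimension is padded past the next
    # multiple of 8, copy the mask into it, then return a view trimmed
    # back to the original width so the underlying storage stays aligned.
    pad = 8 - q_len % 8
    mask_out = torch.empty(
        [mask.shape[0], q_len, q_len + pad], dtype=mask.dtype, device=mask.device
    )
    mask_out[:, :, :mask.shape[-1]] = mask
    return mask_out[:, :, :mask.shape[-1]]

# Usage sketch, assuming q, k, v are already reshaped to (batch * heads, seq, dim_head):
# bias = pad_attn_mask(mask, q.shape[1])
# out = xformers.ops.memory_efficient_attention(q, k, v, attn_bias=bias)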