wan: Delete the self attention output before cross attention

This saves VRAM in cases where the cross attention and FFN form the
VRAM peak.
Rattus 2025-09-27 21:38:40 +10:00
parent 8866a22dcb
commit 98ca6030f3


@@ -237,6 +237,7 @@ class WanAttentionBlock(nn.Module):
                           freqs, transformer_options=transformer_options)
         x = torch.addcmul(x, y, repeat_e(e[2], x))
+        del y
         # cross-attention & ffn
         x = x + self.cross_attn(self.norm3(x), context, context_img_len=context_img_len, transformer_options=transformer_options)
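
Below is a minimal, hypothetical sketch of the pattern this diff applies, not the actual ComfyUI WanAttentionBlock: the self-attention output tensor is explicitly dropped with del once it has been folded into the residual stream, so the caching allocator can reuse its memory while the cross attention and FFN (the usual peak) run. The module layout, the plain residual add in place of the addcmul modulation, and all names and shapes here are illustrative assumptions.

    import torch
    import torch.nn as nn

    class BlockSketch(nn.Module):
        # Hypothetical stand-in for WanAttentionBlock; layer names and shapes are illustrative.
        def __init__(self, dim, heads):
            super().__init__()
            self.norm1 = nn.LayerNorm(dim)
            self.norm3 = nn.LayerNorm(dim)
            self.self_attn = nn.MultiheadAttention(dim, heads, batch_first=True)
            self.cross_attn = nn.MultiheadAttention(dim, heads, batch_first=True)
            self.ffn = nn.Sequential(nn.Linear(dim, 4 * dim), nn.GELU(), nn.Linear(4 * dim, dim))

        def forward(self, x, context):
            q = self.norm1(x)
            y, _ = self.self_attn(q, q, q)   # self-attention output, a temporary tensor
            x = x + y                        # the real block folds y in via torch.addcmul with a modulation term
            del y                            # drop the reference so its VRAM can be reclaimed
            # cross-attention & ffn: typically where the block's VRAM peak sits
            x = x + self.cross_attn(self.norm3(x), context, context)[0]
            x = x + self.ffn(x)
            return x

Without the del, y stays referenced for the rest of forward(), so its allocation is still held when the cross attention and FFN allocate their activations; dropping it first lowers that peak.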