Fix performance regression caused by duplicated Flash Attention call

2025-07-14 03:30:10 +00:00 · 2025-05-27 16:14:07 +08:00 · 2025-05-27 16:14:07 +08:00 · 2fc28056fa
commit 2fc28056fa
parent 3c7c6f8b29
1 changed file with 0 additions and 7 deletions
--- a/wan/distributed/xdit_context_parallel.py
+++ b/wan/distributed/xdit_context_parallel.py
@@ -304,13 +304,6 @@ def usp_attn_forward(self,
            value=half(v),
            window_size=self.window_size)
    x = xFuserLongContextAttention()(
        None,
        query=half(q),
        key=half(k),
        value=half(v),
        window_size=self.window_size)
    # TODO: padding after attention.
    # x = torch.cat([x, x.new_zeros(b, s - x.size(1), n, d)], dim=1)