fix performance regression caused by duplicated Flash Attention code

songrui.771 2025-05-27 16:14:07 +08:00
parent 3c7c6f8b29
commit 2fc28056fa


@@ -304,13 +304,6 @@ def usp_attn_forward(self,
         value=half(v),
         window_size=self.window_size)
-    x = xFuserLongContextAttention()(
-        None,
-        query=half(q),
-        key=half(k),
-        value=half(v),
-        window_size=self.window_size)
     # TODO: padding after attention.
     # x = torch.cat([x, x.new_zeros(b, s - x.size(1), n, d)], dim=1)
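For context, below is a minimal sketch of the de-duplicated forward path. `xFuserLongContextAttention`, `half`, `q`, `k`, `v`, and `self.window_size` are taken from the diff above; the import path and the simplified wrapper function are illustrative assumptions, not the repository's exact code.

# Sketch only: illustrates why the duplicated call was a performance regression.
# Invoking xFuserLongContextAttention twice recomputes the same attention output,
# so the long-context Flash Attention kernel runs twice per forward pass for no benefit.
# The import path below is an assumption about the xfuser package layout.
from xfuser.core.long_ctx_attention import xFuserLongContextAttention


def usp_attn_forward_sketch(self, q, k, v, half):
    # After this commit the attention output is computed exactly once.
    x = xFuserLongContextAttention()(
        None,
        query=half(q),
        key=half(k),
        value=half(v),
        window_size=self.window_size)
    # TODO kept from the original source: padding after attention.
    # x = torch.cat([x, x.new_zeros(b, s - x.size(1), n, d)], dim=1)
    return x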