Merge pull request #370 from sfinktah/sfink-debug

Fix for AMD error when not using tiled VAE decoding
2026-01-12 01:03:44 +00:00 · 2025-06-18 00:41:27 +02:00 · 2025-06-18 00:41:27 +02:00 · e8dc653604
commit e8dc653604
parent b562190b93 4ca0666aa5
1 changed file with 21 additions and 3 deletions
--- a/wan/modules/vae.py
+++ b/wan/modules/vae.py
@@ -33,9 +33,27 @@ class CausalConv3d(nn.Conv3d):
            padding[4] -= cache_x.shape[2]
            cache_x = None
        x = F.pad(x, padding)
-        x = super().forward(x)
+        try:
-
+            out = super().forward(x)
-        return x
+            return out
+        except RuntimeError as e:
+            if "miopenStatus" in str(e):
+                print("⚠️ MIOpen fallback: AMD gets upset when trying to work with large areas, and so CPU will be "
+                      "used for this decoding (which is very slow). Consider using tiled VAE Decoding.")
+                x_cpu = x.float().cpu()
+                weight_cpu = self.weight.float().cpu()
+                bias_cpu = self.bias.float().cpu() if self.bias is not None else None
+                print(f"[Fallback] x shape: {x_cpu.shape}, weight shape: {weight_cpu.shape}")
+                out = F.conv3d(x_cpu, weight_cpu, bias_cpu,
+                               self.stride, (0, 0, 0),  # avoid double padding here
+                               self.dilation, self.groups)
+                out = out.to(x.device)
+                if x.dtype in (torch.float16, torch.bfloat16):
+                    out = out.half()
+                if x.dtype != out.dtype:
+                    out = out.to(x.dtype)
+                return out
+            raise
 class RMS_norm(nn.Module):