From 5cb67c67e8d08badf7a64b76c2eded903982bf1b Mon Sep 17 00:00:00 2001 From: Bakhtiyor Sulaymonov Date: Thu, 27 Feb 2025 18:55:10 +0500 Subject: [PATCH] Fix MPS compatibility for I2V by adjusting device usage and dtype --- wan/configs/wan_i2v_14B.py | 2 +- wan/image2video.py | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/wan/configs/wan_i2v_14B.py b/wan/configs/wan_i2v_14B.py index 12e8e20..a666719 100644 --- a/wan/configs/wan_i2v_14B.py +++ b/wan/configs/wan_i2v_14B.py @@ -14,7 +14,7 @@ i2v_14B.t5_tokenizer = 'google/umt5-xxl' # clip i2v_14B.clip_model = 'clip_xlm_roberta_vit_h_14' -i2v_14B.clip_dtype = torch.float16 +i2v_14B.clip_dtype = torch.float32 i2v_14B.clip_checkpoint = 'models_clip_open-clip-xlm-roberta-large-vit-huge-14.pth' i2v_14B.clip_tokenizer = 'xlm-roberta-large' diff --git a/wan/image2video.py b/wan/image2video.py index 55d3f57..6bff1b8 100644 --- a/wan/image2video.py +++ b/wan/image2video.py @@ -244,7 +244,7 @@ class WanI2V: y = self.vae.encode([ torch.concat([ torch.nn.functional.interpolate( - img[None].cpu(), size=(h, w), mode='bicubic').transpose( + img[None], size=(h, w), mode='bicubic').transpose( 0, 1), torch.zeros(3, 80, h, w) ],