diff --git a/examples/bag.jpg b/examples/bag.jpg deleted file mode 100644 index 5f20514..0000000 Binary files a/examples/bag.jpg and /dev/null differ diff --git a/examples/girl.png b/examples/girl.png new file mode 100644 index 0000000..006321b Binary files /dev/null and b/examples/girl.png differ diff --git a/examples/heben.png b/examples/heben.png deleted file mode 100644 index 67ee4e5..0000000 Binary files a/examples/heben.png and /dev/null differ diff --git a/examples/snake.png b/examples/snake.png new file mode 100644 index 0000000..b23e1cc Binary files /dev/null and b/examples/snake.png differ diff --git a/generate.py b/generate.py index e4267ee..b7005ca 100644 --- a/generate.py +++ b/generate.py @@ -42,12 +42,12 @@ EXAMPLE_PROMPT = { "examples/flf2v_input_last_frame.png", }, "vace-1.3B": { - "src_ref_images": 'examples/bag.jpg,examples/heben.png', - "prompt": "优雅的女士在精品店仔细挑选包包,她身穿一袭黑色修身连衣裙,搭配珍珠项链,展现出成熟女性的魅力。手中拿着一款复古风格的棕色皮质半月形手提包,正细致地观察其工艺与质地。店内灯光柔和,木质装潢营造出温馨而高级的氛围。中景,侧拍捕捉女士挑选瞬间,展现其品味与气质。" + "src_ref_images": 'examples/girl.png,examples/snake.png', + "prompt": "在一个欢乐而充满节日气氛的场景中,穿着鲜艳红色春服的小女孩正与她的可爱卡通蛇嬉戏。她的春服上绣着金色吉祥图案,散发着喜庆的气息,脸上洋溢着灿烂的笑容。蛇身呈现出亮眼的绿色,形状圆润,宽大的眼睛让它显得既友善又幽默。小女孩欢快地用手轻轻抚摸着蛇的头部,共同享受着这温馨的时刻。周围五彩斑斓的灯笼和彩带装饰着环境,阳光透过洒在她们身上,营造出一个充满友爱与幸福的新年氛围。" }, "vace-14B": { - "src_ref_images": 'examples/bag.jpg,examples/heben.png', - "prompt": "优雅的女士在精品店仔细挑选包包,她身穿一袭黑色修身连衣裙,搭配珍珠项链,展现出成熟女性的魅力。手中拿着一款复古风格的棕色皮质半月形手提包,正细致地观察其工艺与质地。店内灯光柔和,木质装潢营造出温馨而高级的氛围。中景,侧拍捕捉女士挑选瞬间,展现其品味与气质。" + "src_ref_images": 'examples/girl.png,examples/snake.png', + "prompt": "在一个欢乐而充满节日气氛的场景中,穿着鲜艳红色春服的小女孩正与她的可爱卡通蛇嬉戏。她的春服上绣着金色吉祥图案,散发着喜庆的气息,脸上洋溢着灿烂的笑容。蛇身呈现出亮眼的绿色,形状圆润,宽大的眼睛让它显得既友善又幽默。小女孩欢快地用手轻轻抚摸着蛇的头部,共同享受着这温馨的时刻。周围五彩斑斓的灯笼和彩带装饰着环境,阳光透过洒在她们身上,营造出一个充满友爱与幸福的新年氛围。" } } diff --git a/tests/test.sh b/tests/test.sh index bf40cd7..6dd0986 100644 --- a/tests/test.sh +++ b/tests/test.sh @@ -105,9 +105,16 @@ function i2v_14B_720p() { torchrun --nproc_per_node=$GPUS $PY_FILE --task i2v-14B --ckpt_dir $I2V_14B_CKPT_DIR --size 720*1280 --dit_fsdp --t5_fsdp --ulysses_size $GPUS } +function vace_1_3B() { + VACE_1_3B_CKPT_DIR="$MODEL_DIR/VACE-Wan2.1-1.3B-Preview/" + torchrun --nproc_per_node=$GPUS $PY_FILE --ulysses_size $GPUS --task vace-1.3B --size 480*832 --ckpt_dir $VACE_1_3B_CKPT_DIR + +} + t2i_14B t2v_1_3B t2v_14B i2v_14B_480p i2v_14B_720p +vace_1_3B diff --git a/wan/distributed/xdit_context_parallel.py b/wan/distributed/xdit_context_parallel.py index 73ea8b6..e0be6c7 100644 --- a/wan/distributed/xdit_context_parallel.py +++ b/wan/distributed/xdit_context_parallel.py @@ -110,7 +110,7 @@ def usp_dit_forward( t: [B]. context: A list of text embeddings each with shape [L, C]. """ - if self.model_type != 'vace': + if self.model_type == 'i2v': assert clip_fea is not None and y is not None # params device = self.patch_embedding.weight.device