run_wan_i2v_audio.sh 1.28 KB
Newer Older
wangshankun's avatar
wangshankun committed
1
2
3
#!/bin/bash

# set paths first
4
5
# Root of the LightX2V checkout; base.sh, the config JSON, the input assets and
# the output directory used by this script are all resolved relative to it.
lightx2v_path='/mtc/gushiqiao/llmc_workspace/LightX2V'
# Model directory handed to the inference entry point via --model_path.
model_path='/data/nvme0/gushiqiao/models/Lightx2v_models/Wan2.1-R2V721-Audio-14B-720P'
sandy's avatar
sandy committed
6

7
8

# Limit the CUDA devices visible to processes started from this script to
# device index 2.
CUDA_VISIBLE_DEVICES=2
export CUDA_VISIBLE_DEVICES
wangshankun's avatar
wangshankun committed
9

helloyongyang's avatar
helloyongyang committed
10
11
# Set environment variables by sourcing base.sh from the LightX2V checkout.
# The path is quoted so that a checkout location containing whitespace or glob
# characters is not word-split (extra words would otherwise be passed to the
# sourced file as positional parameters).
source "${lightx2v_path}/scripts/base/base.sh"
12
13
14
15

# PyTorch/CUDA settings exported to child processes:
#   TORCH_CUDA_ARCH_LIST    - CUDA architecture list, set to "9.0".
#   PYTORCH_CUDA_ALLOC_CONF - CUDA allocator configuration; turns on
#                             expandable_segments.
TORCH_CUDA_ARCH_LIST=9.0
PYTORCH_CUDA_ALLOC_CONF='expandable_segments:True'
export TORCH_CUDA_ARCH_LIST PYTORCH_CUDA_ALLOC_CONF

helloyongyang's avatar
helloyongyang committed
16
17
18
# Runtime switches exported to child processes. Their consumer is not visible
# in this script (presumably lightx2v reads them - TODO confirm): graph mode is
# set to "false" and the sensitive-layer dtype to the literal string "None".
ENABLE_GRAPH_MODE=false
SENSITIVE_LAYER_DTYPE=None
export ENABLE_GRAPH_MODE SENSITIVE_LAYER_DTYPE

wangshankun's avatar
wangshankun committed
19
20
21
22
# Run lightx2v.infer with the wan2.1_audio model class on task i2v.
# The arguments are collected in an array so that every expansion is quoted
# (paths with whitespace or glob characters stay a single argument, and an
# empty model_path is still passed as the value of --model_path instead of
# silently disappearing) and so that no line-continuation backslashes are
# needed.
infer_args=(
  --model_cls wan2.1_audio
  --task i2v
  --model_path "${model_path}"
  --config_json "${lightx2v_path}/configs/audio_driven/wan_i2v_audio.json"
  --prompt "The video features a old lady is saying something and knitting a sweater."
  # Negative prompt: passed through verbatim as one comma-separated argument.
  --negative_prompt "色调艳丽,过曝,静态,细节模糊不清,字幕,风格,作品,画作,画面,静止,整体发灰,最差质量,低质量,JPEG压缩残留,丑陋的,残缺的,多余的手指,画得不好的手部,画得不好的脸部,畸形的,毁容的,形态畸形的肢体,手指融合,静止不动的画面,杂乱的背景,三条腿,背景人很多,倒着走"
  # Input image and driving audio, both taken from the checkout's assets.
  --image_path "${lightx2v_path}/assets/inputs/audio/15.png"
  --audio_path "${lightx2v_path}/assets/inputs/audio/15.wav"
  --save_video_path "${lightx2v_path}/save_results/output_lightx2v_wan_i2v_audio.mp4"
)

python -m lightx2v.infer "${infer_args[@]}"