infer.py 4.24 KB
Newer Older
helloyongyang's avatar
helloyongyang committed
1
import argparse
2

PengGao's avatar
PengGao committed
3
4
import torch.distributed as dist
from loguru import logger
5

PengGao's avatar
PengGao committed
6
from lightx2v.common.ops import *
PengGao's avatar
PengGao committed
7
from lightx2v.models.runners.cogvideox.cogvidex_runner import CogvideoxRunner  # noqa: F401
PengGao's avatar
PengGao committed
8
from lightx2v.models.runners.graph_runner import GraphRunner
PengGao's avatar
PengGao committed
9
from lightx2v.models.runners.hunyuan.hunyuan_runner import HunyuanRunner  # noqa: F401
10
from lightx2v.models.runners.qwen_image.qwen_image_runner import QwenImageRunner  # noqa: F401
sandy's avatar
sandy committed
11
from lightx2v.models.runners.wan.wan_audio_runner import Wan22AudioRunner, WanAudioRunner  # noqa: F401
PengGao's avatar
PengGao committed
12
13
14
15
from lightx2v.models.runners.wan.wan_causvid_runner import WanCausVidRunner  # noqa: F401
from lightx2v.models.runners.wan.wan_distill_runner import WanDistillRunner  # noqa: F401
from lightx2v.models.runners.wan.wan_runner import Wan22MoeRunner, WanRunner  # noqa: F401
from lightx2v.models.runners.wan.wan_skyreels_v2_df_runner import WanSkyreelsV2DFRunner  # noqa: F401
gushiqiao's avatar
gushiqiao committed
16
from lightx2v.models.runners.wan.wan_vace_runner import WanVaceRunner  # noqa: F401
PengGao's avatar
PengGao committed
17
18
19
from lightx2v.utils.envs import *
from lightx2v.utils.profiler import ProfilingContext
from lightx2v.utils.registry_factory import RUNNER_REGISTER
helloyongyang's avatar
helloyongyang committed
20
from lightx2v.utils.set_config import print_config, set_config, set_parallel_config
PengGao's avatar
PengGao committed
21
from lightx2v.utils.utils import seed_all
lijiaqi2's avatar
lijiaqi2 committed
22
23


helloyongyang's avatar
helloyongyang committed
24
25
26
27
28
def init_runner(config):
    """Build and initialise the runner selected by ``config.model_cls``.

    The random state is seeded through ``seed_all(config.seed)`` first. The
    runner class is then looked up in ``RUNNER_REGISTER``, instantiated with
    ``config`` and has ``init_modules()`` called on it. When
    ``CHECK_ENABLE_GRAPH_MODE()`` is truthy the initialised runner is wrapped
    in a ``GraphRunner`` before being returned.

    Args:
        config: Configuration object exposing at least ``seed`` and
            ``model_cls``.

    Returns:
        The initialised runner, or a ``GraphRunner`` wrapping it when graph
        mode is enabled.
    """
    seed_all(config.seed)

    # Query the graph-mode switch before the runner is constructed.
    graph_mode = CHECK_ENABLE_GRAPH_MODE()

    runner_cls = RUNNER_REGISTER[config.model_cls]
    base_runner = runner_cls(config)
    base_runner.init_modules()

    return GraphRunner(base_runner) if graph_mode else base_runner


37
def _build_arg_parser():
    """Create the command-line parser for the inference entry point.

    Returns:
        argparse.ArgumentParser: Parser exposing the model selection, task,
        path, prompt and source-media options consumed by ``set_config``.
    """
    parser = argparse.ArgumentParser()
    parser.add_argument(
        "--model_cls",
        type=str,
        required=True,
        choices=[
            "wan2.1",
            "hunyuan",
            "wan2.1_distill",
            "wan2.1_causvid",
            "wan2.1_skyreels_v2_df",
            "wan2.1_vace",
            "cogvideox",
            "wan2.1_audio",
            "wan2.2_moe",
            "wan2.2",
            "wan2.2_moe_audio",
            "wan2.2_audio",
            "wan2.2_moe_distill",
            "qwen_image",
        ],
        # NOTE: the option is required, so this default is never applied; it
        # is kept only so the declared interface stays unchanged.
        default="wan2.1",
    )

    parser.add_argument("--task", type=str, choices=["t2v", "i2v", "t2i", "i2i", "flf2v", "vace"], default="t2v")
    parser.add_argument("--model_path", type=str, required=True)
    parser.add_argument("--config_json", type=str, required=True)
    parser.add_argument("--use_prompt_enhancer", action="store_true")

    parser.add_argument("--prompt", type=str, default="", help="The input prompt for text-to-video generation")
    parser.add_argument("--negative_prompt", type=str, default="")

    parser.add_argument("--image_path", type=str, default="", help="The path to input image file for image-to-video (i2v) task")
    parser.add_argument("--last_frame_path", type=str, default="", help="The path to last frame file for first-last-frame-to-video (flf2v) task")
    parser.add_argument("--audio_path", type=str, default="", help="The path to input audio file for audio-to-video (a2v) task")

    parser.add_argument(
        "--src_ref_images",
        type=str,
        default=None,
        help="The file list of the source reference images. Separated by ','. Default None.",
    )
    parser.add_argument(
        "--src_video",
        type=str,
        default=None,
        help="The file of the source video. Default None.",
    )
    parser.add_argument(
        "--src_mask",
        type=str,
        default=None,
        help="The file of the source mask. Default None.",
    )

    parser.add_argument("--save_video_path", type=str, default="./output_lightx2v.mp4", help="The path to save video path/file")
    return parser


def main():
    """Parse the command line, build the config and run the pipeline.

    When ``config.parallel`` is truthy an NCCL process group is initialised
    and the CUDA device for this process is selected before the runner is
    built. The process group, if one was initialised, is always destroyed on
    exit, including when the pipeline raises.
    """
    # Imported here so this function does not depend on `torch` being leaked
    # into the module namespace by one of the wildcard imports.
    import os

    import torch

    args = _build_arg_parser().parse_args()

    # set config
    config = set_config(args)

    try:
        if config.parallel:
            dist.init_process_group(backend="nccl")
            # Prefer the per-node LOCAL_RANK exported by the launcher: the
            # global rank exceeds the local GPU count on multi-node jobs.
            # Without LOCAL_RANK the global rank is used, as before.
            local_rank = int(os.environ.get("LOCAL_RANK", dist.get_rank()))
            torch.cuda.set_device(local_rank)
            set_parallel_config(config)

        print_config(config)

        with ProfilingContext("Total Cost"):
            runner = init_runner(config)
            runner.run_pipeline()
    finally:
        # Clean up distributed process group, even if the run failed.
        if dist.is_initialized():
            dist.destroy_process_group()
            logger.info("Distributed process group cleaned up")

Xinchi Huang's avatar
Xinchi Huang committed
115
116

# Run the command-line entry point only when executed as a script.
if __name__ == "__main__":
    main()