import argparse

import torch
import torch.distributed as dist
from loguru import logger

from lightx2v.common.ops import *
from lightx2v.models.runners.hunyuan_video.hunyuan_video_15_distill_runner import HunyuanVideo15DistillRunner  # noqa: F401
from lightx2v.models.runners.hunyuan_video.hunyuan_video_15_runner import HunyuanVideo15Runner  # noqa: F401
from lightx2v.models.runners.qwen_image.qwen_image_runner import QwenImageRunner  # noqa: F401
from lightx2v.models.runners.wan.wan_animate_runner import WanAnimateRunner  # noqa: F401
from lightx2v.models.runners.wan.wan_audio_runner import Wan22AudioRunner, WanAudioRunner  # noqa: F401
from lightx2v.models.runners.wan.wan_distill_runner import WanDistillRunner  # noqa: F401
from lightx2v.models.runners.wan.wan_matrix_game2_runner import WanSFMtxg2Runner  # noqa: F401
from lightx2v.models.runners.wan.wan_runner import Wan22MoeRunner, WanRunner  # noqa: F401
from lightx2v.models.runners.wan.wan_sf_runner import WanSFRunner  # noqa: F401
from lightx2v.models.runners.wan.wan_vace_runner import WanVaceRunner  # noqa: F401
from lightx2v.utils.envs import *
from lightx2v.utils.input_info import set_input_info
from lightx2v.utils.profiler import *
from lightx2v.utils.registry_factory import RUNNER_REGISTER
from lightx2v.utils.set_config import print_config, set_config, set_parallel_config
from lightx2v.utils.utils import seed_all
from lightx2v_platform.base.global_var import AI_DEVICE
from lightx2v_platform.registry_factory import PLATFORM_DEVICE_REGISTER


def init_runner(config):
    """Create and initialise the runner selected by ``config["model_cls"]``.

    Gradient tracking is switched off through ``torch.set_grad_enabled(False)``
    before the runner is built; that call is not scoped to this function, so
    the setting stays in effect after it returns.

    Args:
        config: Mapping-like configuration. ``config["model_cls"]`` is used as
            the lookup key into ``RUNNER_REGISTER``, and the whole object is
            passed to the runner constructor.

    Returns:
        The runner instance, after its ``init_modules()`` has been called.
    """
    torch.set_grad_enabled(False)
    runner_cls = RUNNER_REGISTER[config["model_cls"]]
    runner = runner_cls(config)
    runner.init_modules()
    return runner


def main():
    """Command-line entry point: parse arguments, build a runner, run it.

    Steps, in order:
      1. Parse the command line (see ``_build_parser``).
      2. Seed the random generators with ``seed_all(args.seed)``.
      3. Build the config with ``set_config(args)``.
      4. If ``config["parallel"]`` is truthy, initialise the parallel
         environment of the platform device registered for ``AI_DEVICE`` and
         apply ``set_parallel_config``.
      5. Print the config, then create the runner and run its pipeline inside
         a ``ProfilingContext4DebugL1("Total Cost")`` block.
      6. Destroy the ``torch.distributed`` process group if one is initialised.

    Raises:
        SystemExit: Raised by ``argparse`` for ``--help`` or invalid arguments.
        RuntimeError: If parallel mode is requested but no platform device is
            registered for ``AI_DEVICE``.
    """
    args = _build_parser().parse_args()

    seed_all(args.seed)

    # set config
    config = set_config(args)

    if config["parallel"]:
        platform_device = PLATFORM_DEVICE_REGISTER.get(AI_DEVICE, None)
        if platform_device is None:
            # Fail with a clear message instead of an AttributeError on None.
            raise RuntimeError(f"No platform device is registered for AI_DEVICE={AI_DEVICE!r}; cannot initialize the parallel environment.")
        platform_device.init_parallel_env()
        set_parallel_config(config)

    print_config(config)

    with ProfilingContext4DebugL1("Total Cost"):
        runner = init_runner(config)
        input_info = set_input_info(args)
        runner.run_pipeline(input_info)

    # Clean up distributed process group
    if dist.is_initialized():
        dist.destroy_process_group()
        logger.info("Distributed process group cleaned up")


def _build_parser():
    """Return the ``argparse`` parser describing every CLI option of this script."""
    parser = argparse.ArgumentParser()
    parser.add_argument("--seed", type=int, default=42, help="The seed for random generator")
    # NOTE: ``required=True`` means the ``default`` below is never used; both
    # are kept so the command-line contract stays exactly as it was.
    parser.add_argument(
        "--model_cls",
        type=str,
        required=True,
        choices=[
            "wan2.1",
            "wan2.1_distill",
            "wan2.1_vace",
            "wan2.1_sf",
            "wan2.1_sf_mtxg2",
            "seko_talk",
            "wan2.2_moe",
            "wan2.2",
            "wan2.2_moe_audio",
            "wan2.2_audio",
            "wan2.2_moe_distill",
            "qwen_image",
            "wan2.2_animate",
            "hunyuan_video_1.5",
            "hunyuan_video_1.5_distill",
        ],
        default="wan2.1",
    )

    parser.add_argument("--task", type=str, choices=["t2v", "i2v", "t2i", "i2i", "flf2v", "vace", "animate", "s2v"], default="t2v")
    parser.add_argument("--model_path", type=str, required=True)
    parser.add_argument("--sf_model_path", type=str, required=False)
    parser.add_argument("--config_json", type=str, required=True)
    parser.add_argument("--use_prompt_enhancer", action="store_true")

    parser.add_argument("--prompt", type=str, default="", help="The input prompt for text-to-video generation")
    parser.add_argument("--negative_prompt", type=str, default="")

    parser.add_argument("--image_path", type=str, default="", help="The path to input image file for image-to-video (i2v) task")
    parser.add_argument("--last_frame_path", type=str, default="", help="The path to last frame file for first-last-frame-to-video (flf2v) task")
    parser.add_argument("--audio_path", type=str, default="", help="The path to input audio file or directory for audio-to-video (s2v) task")

    # [Warning] For vace task, need refactor.
    # All source-input options share type=str and default=None, so they are
    # declared as (flag, help) pairs and registered in the original order.
    source_options = (
        ("--src_ref_images", "The file list of the source reference images. Separated by ','. Default None."),
        ("--src_video", "The file of the source video. Default None."),
        ("--src_mask", "The file of the source mask. Default None."),
        ("--src_pose_path", "The file of the source pose. Default None."),
        ("--src_face_path", "The file of the source face. Default None."),
        ("--src_bg_path", "The file of the source background. Default None."),
        ("--src_mask_path", "The file of the source mask. Default None."),
    )
    for flag, help_text in source_options:
        parser.add_argument(flag, type=str, default=None, help=help_text)

    parser.add_argument("--save_result_path", type=str, default=None, help="The path to save video path/file")
    parser.add_argument("--return_result_tensor", action="store_true", help="Whether to return result tensor. (Useful for comfyui)")
    return parser


# Run the CLI only when this file is executed as a script, not when imported.
if __name__ == "__main__":
    main()