infer.sh 623 Bytes
Newer Older
chenzk's avatar
v1.0  
chenzk committed
1
# Text query
dcuai's avatar
dcuai committed
2
# Image + written prompt: feeds asset/vita_log2.png to the demo together with
# a text question (the Chinese string reads "Please describe this picture.").
# The HIP_VISIBLE_DEVICES=0,1 prefix applies to this single command only.
HIP_VISIBLE_DEVICES=0,1 python video_audio_demo.py \
  --model_path vita/VITA_ckpt \
  --image_path asset/vita_log2.png \
  --model_type mixtral-8x7b \
  --conv_mode mixtral_two \
  --question "请描述这张图片。"
chenzk's avatar
v1.0  
chenzk committed
3
# Audio query
dcuai's avatar
dcuai committed
4
# Image + audio prompt: same checkpoint, image, model type and conversation
# mode as the text example, but the prompt is supplied as the audio file
# asset/q1.wav via --audio_path instead of a --question string.
# The HIP_VISIBLE_DEVICES=0,1 prefix applies to this single command only.
HIP_VISIBLE_DEVICES=0,1 python video_audio_demo.py \
  --model_path vita/VITA_ckpt \
  --image_path asset/vita_log2.png \
  --model_type mixtral-8x7b \
  --conv_mode mixtral_two \
  --audio_path asset/q1.wav
chenzk's avatar
v1.0  
chenzk committed
5
# Noisy audio query
dcuai's avatar
dcuai committed
6
# Image + audio prompt using asset/q2.wav; every other flag matches the
# q1.wav invocation.
# NOTE(review): q2.wav is presumably the noisy recording this example is
# labelled for -- confirm against the asset itself.
# The HIP_VISIBLE_DEVICES=0,1 prefix applies to this single command only.
HIP_VISIBLE_DEVICES=0,1 python video_audio_demo.py \
  --model_path vita/VITA_ckpt \
  --image_path asset/vita_log2.png \
  --model_type mixtral-8x7b \
  --conv_mode mixtral_two \
  --audio_path asset/q2.wav