infer.sh 157 Bytes
Newer Older
Xuanlei Zhao's avatar
Xuanlei Zhao committed
1
2
3
4
5
6
7
# Launch settings for the inference run.
# NUM_GPU is passed to torchrun's --nproc_per_node (processes started on this node).
NUM_GPU=2
# MODEL is passed to infer.py as --model_name.
MODEL="mistralai/Mixtral-8x7B-v0.1"

# Run infer.py under torchrun in standalone (single-node) mode with the "ep"
# plugin (presumably expert parallelism -- TODO confirm against infer.py).
#
# Expansions are double-quoted so the values can never be word-split or
# glob-expanded. The last argument intentionally has no trailing backslash:
# a dangling continuation would splice whatever line follows into this command.
torchrun --standalone --nproc_per_node "$NUM_GPU" infer.py \
    --model_name "$MODEL" \
    --plugin "ep"