#!/bin/bash
# run_GPT-MOE.sh
for para in $*
do
    if [[ $para == --profiling* ]];then
        profiling=${para#*=}
        export GPU_FLUSH_ON_EXECUTION=1
        export HIP_DIRECT_DISPATCH=0
    fi
done

mpirun -np 512 --hostfile hostfile_gptmoe \
              --allow-run-as-root \
              --bind-to none \
              --mca plm_rsh_no_tree_spawn 1 \
              train_GPT-MOE_567B.sh node002 --profiling=$profiling > output.log 2>&1

wait

rm -rf CKPT
#rm -rf mixtral_dataset/my-mixtral_text_document