run-13b-sft.sh 350 Bytes
Newer Older
qianyj's avatar
qianyj committed
1
2
3
4
5
echo "START TIME: $(date)"
# Path of the hostfile used below to size the job.
hostfile=./hostfile

# Print the number of distinct hosts named in the hostfile given as $1.
# A host is identified by the first whitespace-separated field of a line;
# blank lines and lines whose first field starts with '#' are ignored, so
# stray empty lines or comments do not inflate the count.
# Outputs: the count on stdout (0 when the file cannot be read).
# Returns: 0 on success, 1 when the file is missing or unreadable.
count_unique_hosts() {
  if [ ! -r "$1" ]; then
    printf 'error: cannot read hostfile: %s\n' "$1" >&2
    printf '0\n'
    return 1
  fi
  awk 'NF && $1 !~ /^#/ && !seen[$1]++ { n++ } END { print n + 0 }' "$1"
}

# Total process count handed to mpirun: distinct hosts times 8
# (presumably 8 ranks per node - confirm against the launch command).
np=$(count_unique_hosts "$hostfile")
# Referencing np by name (not $np) keeps the arithmetic valid even if np is empty.
np=$((np * 8))
zhaoying1's avatar
zhaoying1 committed
6
7
# Print the first usable line of the hostfile given as $1, skipping blank
# lines and lines whose first field starts with '#'.
# Returns: 1 (printing nothing) when the file is missing or unreadable, so an
# empty path can never make the read fall through to stdin.
first_host_entry() {
  if [ ! -r "$1" ]; then
    printf 'error: cannot read hostfile: %s\n' "$1" >&2
    return 1
  fi
  awk 'NF && $1 !~ /^#/ { print; exit }' "$1"
}

# nodename: the full first host line of the hostfile (may carry extra fields).
nodename=$(first_host_entry "$hostfile")
# dist_url: only the first whitespace-separated field of that line; it is
# passed to the per-node launcher script later in this file.
dist_url=$(printf '%s\n' "$nodename" | awk '{ print $1 }')
qianyj's avatar
update  
qianyj committed
8

zhaoying1's avatar
zhaoying1 committed
9
# Launch run-13b-sft-single.sh through mpirun with $np processes.
#   --allow-run-as-root           let mpirun run when invoked as root
#   --hostfile ./hostfile1        host list handed to mpirun
#   -mca plm_rsh_args "-p 2345"   extra arguments for the rsh/ssh launcher
#                                 (presumably the ssh port - confirm)
#   -mca btl ^openib              exclude the openib BTL component
# The trailing "8" and $dist_url are forwarded as the launcher script's
# arguments; the 8 presumably matches the x8 multiplier used for np.
# NOTE(review): np and dist_url are derived from $hostfile (./hostfile) but
# mpirun is pointed at ./hostfile1 - confirm the two files are meant to differ.
# Expansions are quoted so an empty value cannot shift the following options.
mpirun -np "$np" --allow-run-as-root --hostfile ./hostfile1 \
  -mca plm_rsh_args "-p 2345" -mca btl '^openib' \
  run-13b-sft-single.sh 8 "$dist_url"
qianyj's avatar
update  
qianyj committed
10

qianyj's avatar
qianyj committed
11
12
13
14
# Log the wall-clock time at which the launch command returned.
printf 'END TIME: %s\n' "$(date)"