test.sh 669 Bytes
Newer Older
Rick Ho's avatar
Rick Ho committed
1
#!/bin/bash
Rick Ho's avatar
Rick Ho committed
2
# Choose the MASTER_ADDR value that is exported to the launched command.
# A non-empty MASTER_ADDR already present in the environment is kept as is.
if [ -z "$MASTER_ADDR" ]
then
    if [ -z "$SLURM_JOB_ID" ]
    then
        # No SLURM job id available: use the local host.
        export MASTER_ADDR=localhost
    else
        # Inside a SLURM job: take the value printed after "BatchHost=" in
        # the `scontrol show` output for this job.
        # NOTE(review): if scontrol fails or prints no BatchHost line,
        # MASTER_ADDR ends up empty - confirm whether that needs handling.
        MASTER_ADDR=$(scontrol show JobId="$SLURM_JOB_ID" | grep BatchHost | tr '=' ' ' | awk '{print $2}')
        export MASTER_ADDR
    fi
fi
# Export MASTER_PORT for the launched command, defaulting to 12215 when the
# environment does not already provide a non-empty value.
if [ -z "$MASTER_PORT" ]
then
    export MASTER_PORT=12215
fi

Rick Ho's avatar
Rick Ho committed
16
17
18
19
20
# Derive RANK, WORLD_SIZE and localrank from whichever launcher variables are
# present. localrank is used further down to set CUDA_VISIBLE_DEVICES, and
# RANK names the log file.
if [ -n "$OMPI_COMM_WORLD_RANK" ]
then
    # OMPI_COMM_WORLD_* variables are present (presumably set by Open MPI's
    # launcher).
    # NOTE(review): unlike the SLURM branch, RANK is not exported and
    # WORLD_SIZE is not set here - confirm that this is intended.
    RANK=$OMPI_COMM_WORLD_RANK
    localrank=$OMPI_COMM_WORLD_LOCAL_RANK
elif [ -n "$SLURM_PROCID" ]
then
    # SLURM task: forward its process id and task count to the child
    # environment as RANK / WORLD_SIZE.
    export RANK=$SLURM_PROCID
    export WORLD_SIZE=$SLURM_NPROCS
    localrank=$SLURM_LOCALID
else
    # No launcher detected: behave as a single process.
    RANK=0
    localrank=0
    WORLD_SIZE=1
fi

Rick Ho's avatar
Rick Ho committed
31
# Hand the node-local rank to the launched command as CUDA_VISIBLE_DEVICES.
CUDA_VISIBLE_DEVICES=${localrank}
export CUDA_VISIBLE_DEVICES
Rick Ho's avatar
Rick Ho committed
32

Rick Ho's avatar
Rick Ho committed
33
# Run the command given as this script's arguments with stderr merged into
# stdout, showing the output and also saving it to "$RANK.log".
# "$@" is quoted so arguments containing whitespace or glob characters reach
# the command unchanged. pipefail makes the script's exit status reflect a
# failing command instead of always reporting tee's status.
set -o pipefail
exec "$@" 2>&1 | tee "$RANK.log"