1node_op_test.sh 950 Bytes
Newer Older
yuguo's avatar
yuguo committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
#!/bin/bash
# Single-node op test driver: copies the single_client test tree into a scratch
# directory, changes into it, and runs the test steps from there.
#
# Environment:
#   ONEFLOW_SRC_DIR       root of the source checkout (default: current directory)
#   ONEFLOW_TEST_TMP_DIR  scratch directory; deleted and recreated on every run
#                         (default: ./test_tmp_dir)
set -xe

# Exported so the Python processes started by this script inherit them.
# NOTE(review): TF_CPP_MIN_LOG_LEVEL=3 presumably silences TensorFlow's native
# logging -- confirm it is still needed.
export TF_CPP_MIN_LOG_LEVEL=3
# Unbuffered Python stdout/stderr, so test output appears as it is produced.
export PYTHONUNBUFFERED=1

src_dir=${ONEFLOW_SRC_DIR:-"$PWD"}
test_tmp_dir=${ONEFLOW_TEST_TMP_DIR:-"./test_tmp_dir"}

# The working directory changes below and $src_dir is used again afterwards, so
# a relative source root must be pinned to an absolute path first.
# (cd output is discarded because cd prints the target when CDPATH is in play.)
src_dir=$(cd -- "$src_dir" > /dev/null && pwd)

# Start from a clean scratch directory; ':?' aborts rather than expanding to an
# empty path, and '--' keeps a leading '-' from being read as an option.
rm -rf -- "${test_tmp_dir:?}"
mkdir -p -- "$test_tmp_dir"
cp -r -- "$src_dir/python/oneflow/compatible/single_client/test" "$test_tmp_dir"
cd -- "$test_tmp_dir"

# NOTE(review): presumably prints installation diagnostics; under `set -e` a
# non-zero exit here stops the script before any test runs.
python3 -m oneflow --doctor

# GPU count = number of lines nvidia-smi prints for the name query.
# NOTE(review): without `pipefail` only wc's exit status reaches `set -e`, so a
# missing or failing nvidia-smi yields gpu_num=0 instead of aborting -- confirm
# whether that fallback is intended before tightening it.
gpu_num=$(nvidia-smi --query-gpu=name --format=csv,noheader | wc -l)

# Run the op tests through the parallel runner, once per chunk value; the chunk
# value is also exported as the device count for the tests.
for CHUNK in 1
do
    export ONEFLOW_TEST_DEVICE_NUM="${CHUNK}"
    # Script path is quoted so a source root containing spaces or glob
    # characters is passed to python3 as a single argument.
    python3 "$src_dir/ci/test/parallel_run.py" \
        --gpu_num="${gpu_num}" \
        --dir=test/ops \
        --timeout=1 \
        --verbose \
        --chunk="${CHUNK}"
done

# Multi-device pass over test/ops: run unittest discovery with 2 and then 4
# devices. Skipped entirely when ONEFLOW_TEST_ENABLE_EAGER is non-empty.
if [[ -n "$ONEFLOW_TEST_ENABLE_EAGER" ]]; then
    echo "deadlock unsolved, skipping multi-card eager"
else
    for device_count in 2 4; do
        export ONEFLOW_TEST_DEVICE_NUM="$device_count"
        python3 -m unittest discover test/ops --failfast --verbose
    done
fi