"vscode:/vscode.git/clone" did not exist on "c4209d6d21dab00bb02713757e729a2449082b1f"
README.md 2.2 KB
Newer Older
qianyj's avatar
qianyj committed
1
# 介绍
qianyj's avatar
qianyj committed
2

qianyj's avatar
qianyj committed
3
  该测试用例可用于ResNet50等网络的性能测试及精度验证。
qianyj's avatar
qianyj committed
4
5
6
7
8

# 单卡测试 (单精度)

## 运行

qianyj's avatar
qianyj committed
9
    export PYTHONPATH=/path/to/tensorflow/model:$PYTHONPATH    
qianyj's avatar
qianyj committed
10
11
    export HIP_VISIBLE_DEVICES=0
    python3 official/vision/image_classification/resnet/resnet_ctl_imagenet_main.py --data_dir=/path/to/{ImageNet-tensorflow_data_dir} --model_dir=/path/to/{model_save_dir} --batch_size=128 --num_gpus=1  --use_synthetic_data=false
qianyj's avatar
qianyj committed
12
  
qianyj's avatar
qianyj committed
13
# 单卡测试 (混合精度)
qianyj's avatar
qianyj committed
14

qianyj's avatar
qianyj committed
15
## 运行 
qianyj's avatar
qianyj committed
16

qianyj's avatar
qianyj committed
17
    export PYTHONPATH=/path/to/tensorflow/model:$PYTHONPATH
qianyj's avatar
qianyj committed
18
19
    export HIP_VISIBLE_DEVICES=0
    python3 official/vision/image_classification/resnet/resnet_ctl_imagenet_main.py --data_dir=/path/to/{ImageNet-tensorflow_data_dir} --model_dir=/path/to/{model_save_dir} --batch_size=128 --num_gpus=1  --use_synthetic_data=false --dtype=fp16
qianyj's avatar
qianyj committed
20

qianyj's avatar
qianyj committed
21
22
23
# 多卡测试 (单精度)

## 运行
qianyj's avatar
qianyj committed
24
 
qianyj's avatar
qianyj committed
25
    # 以下sed指令只需执行一次(重复执行会重复插入):将configfile中支持多卡运行的代码插入到训练脚本第101行之后
qianyj's avatar
qianyj committed
26
    sed -i '101 r configfile' official/vision/image_classification/resnet/resnet_ctl_imagenet_main.py
qianyj's avatar
qianyj committed
27
    
qianyj's avatar
qianyj committed
28
    export PYTHONPATH=/path/to/tensorflow/model:$PYTHONPATH
qianyj's avatar
qianyj committed
29
    mpirun -np ${num_gpu}  --hostfile hostfile  -mca btl self,tcp  --bind-to none scripts-run/single_process.sh
qianyj's avatar
qianyj committed
30
31
32
33

# 多卡测试 (混合精度)

## 运行
qianyj's avatar
qianyj committed
34
   
qianyj's avatar
qianyj committed
35
    # 以下sed指令只需执行一次(重复执行会重复插入):将configfile中支持多卡运行的代码插入到训练脚本第101行之后
qianyj's avatar
qianyj committed
36
    sed -i '101 r configfile' official/vision/image_classification/resnet/resnet_ctl_imagenet_main.py
qianyj's avatar
qianyj committed
37
38
39
    
    # 先修改scripts-run/single_process.sh,在其中的训练命令里设置--dtype=fp16
    export PYTHONPATH=/path/to/tensorflow/model:$PYTHONPATH
qianyj's avatar
qianyj committed
40
    mpirun -np ${num_gpu}  --hostfile hostfile  -mca btl self,tcp  --bind-to none scripts-run/single_process.sh
qianyj's avatar
qianyj committed
41

qianyj's avatar
qianyj committed
42
# 测试说明
qianyj's avatar
qianyj committed
43

qianyj's avatar
qianyj committed
44
45
46
   多卡测试时需要修改部分代码,具体可参考 <https://tensorflow.google.cn/guide/migrate/multi_worker_cpu_gpu_training?hl=en>
   
   hostfile格式参考:
qianyj's avatar
qianyj committed
47
     
qianyj's avatar
qianyj committed
48
49
50
51
     node1 slots=4
     node2 slots=4

   nodefile格式参考(节点名称及顺序需与hostfile保持一致,用于构造TF_CONFIG):
qianyj's avatar
qianyj committed
52
     
qianyj's avatar
qianyj committed
53
54
55
56
     node1
     node2
  
   上述多卡测试方法默认每个节点使用4张卡(对应hostfile中的slots=4)。
qianyj's avatar
qianyj committed
57
58
59

# 参考
[https://github.com/tensorflow/models/tree/v2.7.0](https://github.com/tensorflow/models/tree/v2.7.0/official/vision/image_classification/resnet)
qianyj's avatar
qianyj committed
60