run_bytemlperf.sh 3.26 KB
Newer Older
sunzhq2's avatar
init  
sunzhq2 committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
#!/bin/bash
#
# Environment setup for the benchmark tasks started through launch.py below:
# puts the DTK directories on PYTHONPATH and the rocBLAS install directory on
# LD_LIBRARY_PATH.
#
# Search paths are extended with "${VAR:+:${VAR}}", which appends the previous
# value only when it is non-empty. That keeps whatever was already configured
# and avoids a trailing ':' (an empty entry, which the dynamic linker treats
# as the current working directory).

# System-wide DTK directory.
export PYTHONPATH="/opt/dtk/lib${PYTHONPATH:+:${PYTHONPATH}}"

# Load the DTK 24.04.3 environment script. A missing file is reported but is
# not fatal, matching the previous behaviour of carrying on after a failed
# `source`.
DTK_ENV_SCRIPT=/home/workspace/dtk-24.04.3/env.sh
if [[ -r "${DTK_ENV_SCRIPT}" ]]; then
  # shellcheck source=/dev/null
  source "${DTK_ENV_SCRIPT}"
else
  printf 'warning: cannot read %s; continuing without it\n' \
    "${DTK_ENV_SCRIPT}" >&2
fi

# Workspace DTK directory goes first so it takes precedence; the entries added
# above (and by env.sh) are kept after it. The original line referenced the
# misspelled $PYTHONPAT, which silently dropped all of them.
export PYTHONPATH="/home/workspace/dtk-24.04.3/lib${PYTHONPATH:+:${PYTHONPATH}}"

# rocBLAS shared libraries installed under /home/workspace.
export LD_LIBRARY_PATH="/home/workspace/rocblas-install/lib/${LD_LIBRARY_PATH:+:${LD_LIBRARY_PATH}}"


#######################################
# Run one benchmark task through launch.py and keep a copy of its output.
# Combined stdout/stderr is shown on the terminal and written to
# ./log/<task>.log. CUDA_VISIBLE_DEVICES is set to 0 for the run
# (presumably pinning it to the first device - confirm for DCU).
# Arguments: $1 - task name passed to --task, also used as the log file name
# Outputs:   the task's combined output on stdout
# Returns:   launch.py's exit status (not tee's); 2 if no task name is given;
#            mkdir's status if ./log cannot be created
#######################################
run_task() {
  local task=${1:-}
  if [[ -z "${task}" ]]; then
    printf 'run_task: missing task name\n' >&2
    return 2
  fi

  # tee cannot create the log file when the directory is missing.
  mkdir -p ./log || return

  CUDA_VISIBLE_DEVICES=0 python launch.py --hardware_type DCU --task "${task}" 2>&1 \
    | tee "./log/${task}.log"
  # Report the benchmark's own status; the pipeline alone would report tee's.
  return "${PIPESTATUS[0]}"
}

# Uncomment a line to enable that task. The script's exit status is that of
# the last task run.

# run_task resnet50-torch-fp32
# run_task resnet50-torch-fp16

# run_task resnet50-onnxruntime-fp32
# run_task resnet50-onnxruntime-fp16

# run_task bert-torch-fp32
# run_task bert-torch-fp16
# run_task bert-tf-fp32
# run_task bert-tf-fp16
# run_task bert-onnxruntime-fp32
# run_task bert-onnxruntime-fp16

# run_task widedeep-tf-fp32
# run_task widedeep-tf-fp16

# run_task videobert-onnx-fp32
# run_task videobert-onnx-fp16

# run_task conformer-encoder-onnx-fp32

# run_task roformer-tf-fp32

# run_task vae-encoder-onnx-fp32
# run_task vae-decoder-onnx-fp32
# run_task unet-onnx-fp32
# run_task clip-onnx-fp32

run_task yolov5-onnx-fp32

# run_task roberta-torch-fp32

# run_task deberta-torch-fp32
# run_task swin-large-torch-fp32