train.sh 775 Bytes
Newer Older
chenych's avatar
chenych committed
1
2
3
#!/bin/bash
# Training launcher: exports the runtime environment, then starts the
# distributed training run. This first step only announces the export phase.
printf '%s\n' "Export params ..."

chenych's avatar
chenych committed
4
# Device IDs used for training; edit this list to match the cards (and how
# many of them) you want to train on.
HIP_VISIBLE_DEVICES=0,1,2,3
export HIP_VISIBLE_DEVICES
chenych's avatar
chenych committed
5
6
7
8
9
# Runtime switches handed to the training processes through the environment.
# NOTE(review): presumably consumed by the HSA runtime and the MIOpen-backed
# batch-norm path respectively -- confirm against the platform documentation.
export HSA_FORCE_FINE_GRAIN_PCIE=1 USE_MIOPEN_BATCHNORM=1

printf '%s\n' "Training start ..."
# coco_path is the path to the training dataset; the data must be in COCO format
chenych's avatar
update  
chenych committed
10
11
12
13
14
15
16
# Earlier invocations, kept for reference:
# python -m torch.distributed.launch --nproc_per_node=4 --use_env main.py --coco_path /path/to/coco
# python -m torch.distributed.launch --nproc_per_node=4 --use_env main.py --coco_path /home/datasets/COCO2017 --epochs 300 > log_detr_2_4_dcu.20231205

# Launch main.py through torch.distributed.launch with 4 processes per node,
# passing the COCO2017 dataset path, the checkpoint given to --resume, a
# learning rate of 1e-6 and 5 epochs.
# NOTE(review): --nproc_per_node presumably has to match the number of device
# IDs listed in HIP_VISIBLE_DEVICES -- keep the two in sync when editing.
# Only stdout is redirected to the log file; stderr still goes to the terminal.
# If the launcher fails, report it on stderr and exit with its status, so the
# script never goes on to claim the training finished successfully.
python -m torch.distributed.launch --nproc_per_node=4 --use_env main.py \
    --coco_path /home/datasets/COCO2017 \
    --resume ./pretrained_model/detr-r50-e632da11.pth \
    --lr 1e-6 \
    --epochs 5 > log_detr_2_4_dcu.20231205 || {
    status=$?
    echo "Training failed with exit status ${status}; see log_detr_2_4_dcu.20231205" >&2
    exit "${status}"
}
chenych's avatar
chenych committed
17
18

# Closing status message, printed once the steps above have run.
printf '%s\n' "Training finished."