train.sh 647 Bytes
Newer Older
Rayyyyy's avatar
Rayyyyy committed
1
#!/bin/bash
Rayyyyy's avatar
Rayyyyy committed
2
# GPU IDs made visible to this run; edit the list to match the card IDs
# (and the number of cards) you want to train on.
HIP_VISIBLE_DEVICES=0,1,2,3
export HIP_VISIBLE_DEVICES
Rayyyyy's avatar
Rayyyyy committed
3
4
5
# Runtime switches exported to the training processes, both set to 1.
# NOTE(review): these look like ROCm / MIOpen tuning flags; confirm their exact
# effect against the installed ROCm and PyTorch builds.
export \
  HSA_FORCE_FINE_GRAIN_PCIE=1 \
  USE_MIOPEN_BATCHNORM=1

Rayyyyy's avatar
Rayyyyy committed
6
7
8
9
10
11
12
13
echo "Training start ..."

# Launch one worker process per GPU listed in HIP_VISIBLE_DEVICES
# (comma-separated), so the worker count always follows the device list instead
# of having to be edited in two places. Falls back to 4 workers when the
# variable is unset or empty.
gpu_list="${HIP_VISIBLE_DEVICES:-}"
nproc_per_node=4
if [[ -n "${gpu_list}" ]]; then
  # IFS is changed only for this single `read` invocation.
  IFS=',' read -r -a gpu_ids <<< "${gpu_list}"
  if (( ${#gpu_ids[@]} > 0 )); then
    nproc_per_node="${#gpu_ids[@]}"
  fi
fi

## train multi
# python -m torch.distributed.launch --nproc_per_node="${nproc_per_node}" --master_port=4321 realesrgan/train.py -opt options/train_realesrnet_x4plus.yml --launcher pytorch --auto_resume
## train single
# python realesrgan/train.py -opt options/train_realesrnet_x4plus.yml --auto_resume

## finetune
# This is the last command, so the script's exit status is the launcher's.
python -m torch.distributed.launch \
  --nproc_per_node="${nproc_per_node}" \
  --master_port=4321 \
  realesrgan/train.py \
  -opt options/finetune_realesrgan_x4plus.yml \
  --launcher pytorch \
  --auto_resume