#!/bin/bash
#
# train.sh - launch multi-process training of training_stsbenchmark.py
# through torchrun.
#
# Usage: bash train.sh
#
# Edit HIP_VISIBLE_DEVICES below to choose which cards are used. The number of
# worker processes started per node is derived from that list, so the two can
# never disagree.

set -euo pipefail

echo "Export params ..."

# Comma-separated IDs of the cards to train on; change this to the card IDs
# (and therefore the number of cards) you want to use.
export HIP_VISIBLE_DEVICES=0,1,2,3
# Exported unchanged into the training processes' environment.
# NOTE(review): these look like ROCm / MIOpen runtime switches - confirm their
# exact effect against the vendor documentation before changing them.
export HSA_FORCE_FINE_GRAIN_PCIE=1
export USE_MIOPEN_BATCHNORM=1

# Start one worker per listed device instead of hard-coding the count.
IFS=',' read -r -a device_ids <<< "${HIP_VISIBLE_DEVICES}"
nproc_per_node=${#device_ids[@]}
if (( nproc_per_node == 0 )); then
  echo "HIP_VISIBLE_DEVICES lists no devices" >&2
  exit 1
fi

echo "Training start ..."

torchrun --nproc_per_node="${nproc_per_node}" training_stsbenchmark.py \
  --train_batch_size 64 \
  --num_epochs 5