"applications/Chat/examples/ray/mmmt_prompt.py" did not exist on "41fb7236aa32c307e83b0b9cc50ce2a6da279343"
run.sh 460 Bytes
Newer Older
1
# distplan in ["colossalai", "zero1", "zero2", "torch_ddp", "torch_zero"]
2
3
4
5
6
7
8
9
10
# Distributed training plan, forwarded to train_gpt_demo.py via --distplan.
# Each setting below keeps its original default but may be overridden from the
# caller's environment, e.g. `GPUNUM=8 bash run.sh`.
export DISTPAN="${DISTPAN:-colossalai}"

# The following options are only valid when DISTPAN="colossalai".
export TPDEGREE="${TPDEGREE:-2}"
export GPUNUM="${GPUNUM:-4}"
export PLACEMENT="${PLACEMENT:-cpu}"
export USE_SHARD_INIT="${USE_SHARD_INIT:-False}"

# Without pipefail the pipeline below reports tee's exit status, so a failed
# torchrun would still make this script exit 0. The option is probed in a
# subshell first so that a shell lacking pipefail keeps running the script
# instead of aborting on the unknown option.
if (set -o pipefail) 2>/dev/null; then
  set -o pipefail
fi

# Launch one worker per GPU on this node; stdout and stderr are merged, shown
# on the terminal and also written to run.log.
env OMP_NUM_THREADS=16 torchrun --standalone --nproc_per_node="${GPUNUM}" \
  train_gpt_demo.py \
  --tp_degree="${TPDEGREE}" \
  --placement "${PLACEMENT}" \
  --shardinit "${USE_SHARD_INIT}" \
  --distplan "${DISTPAN}" 2>&1 | tee run.log