start_torch_fp8.sh 223 Bytes
Newer Older
chenych's avatar
chenych committed
1
2
3
4
5
6
7
8
#!/bin/bash
#
# Launch generate.py through torchrun with a fixed NCCL configuration.
#
# Usage:
#   CKPT_PATH=/real/path/to/checkpoint ./start_torch_fp8.sh
#
# Environment:
#   CKPT_PATH  Value handed to generate.py as --ckpt-path. Defaults to the
#              placeholder below, which has to be replaced (or overridden)
#              with a real checkpoint location before the launch can work.
#
# NCCL_ALGO, NCCL_PROTO, MP and CONFIG are always (re)set and exported by this
# script, so values inherited from the caller's environment are overwritten.

# Stop on the first failing command, on use of an unset variable, or on a
# failure inside a pipeline.
set -euo pipefail

# NCCL tuning knobs, pinned to the Ring algorithm and the Simple protocol.
# NOTE(review): the reason for pinning these is not visible here -- confirm
# it is still required on the target hardware.
export NCCL_ALGO=Ring
export NCCL_PROTO=Simple

# Number of worker processes torchrun starts on this node.
# NOTE(review): presumably has to match the "MP8" suffix of the checkpoint
# name -- confirm before changing.
export MP=8

# Config file forwarded to generate.py; a relative path is resolved against
# the current working directory.
export CONFIG=config.json

# Checkpoint location; overridable from the environment (see header).
CKPT_PATH="${CKPT_PATH:-/path/of/DeepSeek-V4-Flash-FP8-MP8}"

# Expansions are quoted so values containing spaces or glob characters reach
# torchrun / generate.py as single arguments.
torchrun --nproc-per-node "${MP}" generate.py \
  --ckpt-path "${CKPT_PATH}" \
  --config "${CONFIG}" \
  --interactive