# start_sglang.sh
# Committed by chenych.
# Launch this node's share of a 4-node SGLang server for
# meituan-longcat/LongCat-Flash-Chat.
#
# Usage:
#   start_sglang.sh <node-rank>
#
# Arguments:
#   <node-rank>  Non-negative integer below the node count (0..3); forwarded
#                to --node-rank. Each node must be started with its own rank.
#
# Environment:
#   DIST_INIT_ADDR  Optional host:port forwarded to --dist-init-addr. When
#                   unset, the placeholder x.x.x.x:20000 is used, which has to
#                   be replaced with a real address before the launch can work.
#
# Exit status:
#   2 when <node-rank> is missing or invalid; otherwise the status of the
#   python3 launcher.

# Runtime environment for the launcher (AMD HSA/HIP and NCCL settings).
export HSA_FORCE_FINE_GRAIN_PCIE=1
# Expose device indices 0-7 to the process.
export HIP_VISIBLE_DEVICES=0,1,2,3,4,5,6,7
# NOTE(review): presumably pins NCCL to port 1 of the mlx5_0 adapter — confirm
# against the cluster's actual InfiniBand device naming.
export NCCL_IB_HCA=mlx5_0:1

NNODES=4
NODE_RANK=${1:-}

# Reject a missing or non-numeric rank up front; otherwise the empty value
# would make --node-rank swallow the next flag and fail with an unrelated
# argument-parsing error inside the Python launcher.
case "$NODE_RANK" in
    '' | *[!0-9]*)
        printf 'Usage: %s <node-rank>  (integer in 0..%s)\n' \
            "${0##*/}" "$((NNODES - 1))" >&2
        exit 2
        ;;
esac

if [ "$NODE_RANK" -ge "$NNODES" ]; then
    printf '%s: node rank %s is out of range (expected 0..%s)\n' \
        "${0##*/}" "$NODE_RANK" "$((NNODES - 1))" >&2
    exit 2
fi

# --tp 32 over --nnodes 4 corresponds to 8 devices per node, matching the
# eight indices listed in HIP_VISIBLE_DEVICES above.
# NOTE(review): --host 127.0.0.2 is a loopback address, so the HTTP endpoint
# is presumably reachable only from the local machine — confirm this is
# intended.
python3 -m sglang.launch_server \
    --model meituan-longcat/LongCat-Flash-Chat \
    --trust-remote-code \
    --dtype bfloat16 \
    --enable-ep-moe \
    --tp 32 \
    --nnodes "$NNODES" \
    --node-rank "$NODE_RANK" \
    --host 127.0.0.2 \
    --port 8001 \
    --dist-init-addr "${DIST_INIT_ADDR:-x.x.x.x:20000}"