Unverified commit 19b5917c, authored by Alec, committed by GitHub
Browse files

fix: assign unique ports per vLLM worker to avoid ZMQ bind conflicts (#5224)


Signed-off-by: alec-flowers <aflowers@nvidia.com>
parent 15a2e8de
@@ -251,8 +251,9 @@ else
 VLLM_ARGS+=("--is-decode-worker")
 fi
 VLLM_ARGS+=("${EXTRA_ARGS[@]}")
+VLLM_ARGS+=("--request-plane" "nats")
-exec env PYTHONHASHSEED=0 CUDA_VISIBLE_DEVICES=$GPU_DEVICES python3 -m dynamo.vllm \
+exec env PYTHONHASHSEED=0 CUDA_VISIBLE_DEVICES=$GPU_DEVICES DYN_VLLM_KV_EVENT_PORT=$((20080 + i)) VLLM_NIXL_SIDE_CHANNEL_PORT=$((20096 + i)) python3 -m dynamo.vllm \
 "${VLLM_ARGS[@]}"
 fi
 } &
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment