Unverified Commit d93d2d74 authored by YiSheng5's avatar YiSheng5 Committed by GitHub
Browse files

[XPU] Make pp group initialized for pipeline-parallelism (#11648)


Signed-off-by: yisheng <yi.sheng@intel.com>
parent d0169e1b
...@@ -11,6 +11,7 @@ import torch.distributed ...@@ -11,6 +11,7 @@ import torch.distributed
from vllm.config import VllmConfig from vllm.config import VllmConfig
from vllm.distributed import (ensure_model_parallel_initialized, from vllm.distributed import (ensure_model_parallel_initialized,
init_distributed_environment) init_distributed_environment)
from vllm.distributed.parallel_state import get_pp_group
from vllm.logger import init_logger from vllm.logger import init_logger
from vllm.model_executor import set_random_seed from vllm.model_executor import set_random_seed
from vllm.platforms import current_platform from vllm.platforms import current_platform
...@@ -176,3 +177,8 @@ class XPUWorker(LoraNotSupportedWorkerBase, Worker): ...@@ -176,3 +177,8 @@ class XPUWorker(LoraNotSupportedWorkerBase, Worker):
parallel_config.pipeline_parallel_size) parallel_config.pipeline_parallel_size)
# global all_reduce needed for overall oneccl warm up # global all_reduce needed for overall oneccl warm up
torch.distributed.all_reduce(torch.zeros(1).xpu()) torch.distributed.all_reduce(torch.zeros(1).xpu())
if parallel_config.pipeline_parallel_size > 1:
# Add pp group init to avoid
# p2p communication as the first call
get_pp_group().all_reduce(torch.zeros(1).xpu())
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment