Unverified Commit a564e001 authored by fzyzcjy's avatar fzyzcjy Committed by GitHub
Browse files

Fix DeepEP error in Qwen 3 MoE models (#6673)

parent 2103b806
...@@ -93,17 +93,20 @@ class DeepEPBuffer: ...@@ -93,17 +93,20 @@ class DeepEPBuffer:
), ),
num_rdma_bytes, num_rdma_bytes,
) )
if deepep_mode == DeepEPMode.normal:
num_qps_per_rank = DeepEPConfig.get_instance().num_sms // 2
elif deepep_mode in [DeepEPMode.low_latency, DeepEPMode.auto]:
num_qps_per_rank = num_experts // group.size()
else:
raise NotImplementedError
cls._buffer = Buffer( cls._buffer = Buffer(
group, group,
num_nvl_bytes, num_nvl_bytes,
num_rdma_bytes, num_rdma_bytes,
low_latency_mode=deepep_mode.enable_low_latency(), low_latency_mode=deepep_mode.enable_low_latency(),
num_qps_per_rank=( num_qps_per_rank=num_qps_per_rank,
max(
num_experts // group.size(),
DeepEPConfig.get_instance().num_sms // 2,
)
),
) )
return cls._buffer return cls._buffer
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment