"...sox/git@developer.sourcefind.cn:OpenDAS/torchaudio.git" did not exist on "dde08ba1be29ee62016083b0bf39454136d48362"
Unverified Commit 4039c626 authored by AlphaBaby's avatar AlphaBaby Committed by GitHub
Browse files

fix deepep assert when PD disaggregation == null (#8274)


Co-authored-by: default avatarfujianhao.fjh <fujianhao.fjh@antgroup.com>
parent db71c38f
...@@ -164,10 +164,19 @@ class DeepEPBuffer: ...@@ -164,10 +164,19 @@ class DeepEPBuffer:
num_rdma_bytes, num_rdma_bytes,
) )
# We should calculate num_qps_per_rank consistently with DeepEP's test script logic:
if deepep_mode == DeepEPMode.NORMAL: if deepep_mode == DeepEPMode.NORMAL:
num_qps_per_rank = DeepEPConfig.get_instance().num_sms // 2 # refer: https://github.com/deepseek-ai/DeepEP/blob/main/tests/test_internode.py#L235
elif deepep_mode in [DeepEPMode.LOW_LATENCY, DeepEPMode.AUTO]: num_qps_per_rank = DeepEPConfig.get_instance().num_sms
elif deepep_mode == DeepEPMode.LOW_LATENCY:
# refer: https://github.com/deepseek-ai/DeepEP/blob/main/tests/test_low_latency.py#L176
num_qps_per_rank = num_experts // group.size() num_qps_per_rank = num_experts // group.size()
elif deepep_mode == DeepEPMode.AUTO:
# low-latency and normal mode all need run
# refer: https://github.com/deepseek-ai/DeepEP/blob/main/tests/test_internode.py#L235
num_qps_per_rank = max(
DeepEPConfig.get_instance().num_sms, num_experts // group.size()
)
else: else:
raise NotImplementedError raise NotImplementedError
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment