Unverified Commit 81fd2b0e authored by Zhengyi Lai's avatar Zhengyi Lai Committed by GitHub
Browse files

fix(deepep): resolve benchmark failure on 4×IB-card setup by aligning tuning...

fix(deepep): resolve benchmark failure on 4×IB-card setup by aligning tuning config with DeepEP commit bdd119f8 (#11965)
parent 007b849b
...@@ -381,8 +381,8 @@ def test_main( ...@@ -381,8 +381,8 @@ def test_main(
# Tune combine performance # Tune combine performance
best_time, best_results = 1e10, None best_time, best_results = 1e10, None
for nvl_chunk_size in range(1, 5, 1): for nvl_chunk_size in range(1, 8, 1):
for rdma_chunk_size in range(8, 33, 4): for rdma_chunk_size in range(12 if num_nodes == 2 else 8, 33, 4):
config_kwargs = { config_kwargs = {
"num_sms": num_sms, "num_sms": num_sms,
"num_max_nvl_chunked_send_tokens": nvl_chunk_size, "num_max_nvl_chunked_send_tokens": nvl_chunk_size,
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment