Commit 99a0704a (unverified), authored by Mike Qiu, committed by GitHub
Browse files

bailingMoE: Fix Key error of deepep_mode (#11465)


Signed-off-by: Michael Qiu <qiudayu.qdy@antgroup.com>
Co-authored-by: Mike_Qiu <qiudayu.qdy@antgroup.com>
parent ec1cd90a
......@@ -54,7 +54,7 @@ from sglang.srt.layers.linear import (
RowParallelLinear,
)
from sglang.srt.layers.logits_processor import LogitsProcessor
-from sglang.srt.layers.moe import get_moe_a2a_backend
+from sglang.srt.layers.moe import get_deepep_mode, get_moe_a2a_backend
from sglang.srt.layers.moe.ep_moe.layer import get_moe_impl_class
from sglang.srt.layers.moe.fused_moe_triton.layer import FusedMoE
from sglang.srt.layers.moe.token_dispatcher import DeepEPDispatcher
......@@ -293,7 +293,7 @@ class BailingMoESparseMoeBlock(nn.Module):
num_local_experts=config.num_experts // self.tp_size,
hidden_size=config.hidden_size,
params_dtype=config.torch_dtype,
-deepep_mode=DeepEPMode[global_server_args_dict["deepep_mode"]],
+deepep_mode=get_deepep_mode(),
async_finish=True, # TODO
return_recv_hook=True,
)
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment