Commit 22fe7878 (unverified), authored by JieXin Liang, committed by GitHub
Browse files

[sgl-kernel] update deepgemm (#6942)

parent c4ffbeca
......@@ -1719,7 +1719,10 @@ class DeepseekV2ForCausalLM(nn.Module):
logger,
"Only Deepseek V3/R1 on NV-platform can use shared experts fusion optimization. Shared experts fusion optimization is disabled.",
)
-elif (global_server_args_dict["enable_deepep_moe"] or global_server_args_dict["enable_ep_moe"]):
+elif (
+global_server_args_dict["enable_deepep_moe"]
+or global_server_args_dict["enable_ep_moe"]
+):
self.num_fused_shared_experts = 0
global_server_args_dict["disable_shared_experts_fusion"] = True
log_info_on_rank0(
......
......@@ -53,7 +53,7 @@ FetchContent_Populate(repo-cutlass)
FetchContent_Declare(
repo-deepgemm
GIT_REPOSITORY https://github.com/deepseek-ai/DeepGEMM
-GIT_TAG d75b218b7b8f4a5dd5406ac87905039ead3ae42f
+GIT_TAG 8dfa3298274bfe6b242f6f8a3e6f3eff2707dd9f
GIT_SHALLOW OFF
)
FetchContent_Populate(repo-deepgemm)
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment