Unverified commit 7218f839, authored by Pleaplusone and committed by GitHub
Browse files

[ROCm][BugFix] Fix shared expert loading error when disable...


[ROCm][BugFix] Fix shared expert loading error when disable `VLLM_ROCM_USE_AITER_FUSION_SHARED_EXPERTS` (#28633)
Signed-off-by: ganyi <ygan@amd.com>
parent 20e4497b
...@@ -287,7 +287,10 @@ class DeepseekV2MoE(nn.Module): ...@@ -287,7 +287,10 @@ class DeepseekV2MoE(nn.Module):
) )
self.is_rocm_aiter_moe_enabled = rocm_aiter_ops.is_fused_moe_enabled() self.is_rocm_aiter_moe_enabled = rocm_aiter_ops.is_fused_moe_enabled()
if config.n_shared_experts is None or self.is_rocm_aiter_moe_enabled: self.is_fusion_moe_shared_experts_enabled = (
rocm_aiter_ops.is_fusion_moe_shared_experts_enabled()
)
if config.n_shared_experts is None or self.is_fusion_moe_shared_experts_enabled:
self.shared_experts = None self.shared_experts = None
else: else:
intermediate_size = config.moe_intermediate_size * config.n_shared_experts intermediate_size = config.moe_intermediate_size * config.n_shared_experts
...@@ -327,7 +330,7 @@ class DeepseekV2MoE(nn.Module): ...@@ -327,7 +330,7 @@ class DeepseekV2MoE(nn.Module):
num_redundant_experts=self.n_redundant_experts, num_redundant_experts=self.n_redundant_experts,
is_sequence_parallel=self.is_sequence_parallel, is_sequence_parallel=self.is_sequence_parallel,
n_shared_experts=config.n_shared_experts n_shared_experts=config.n_shared_experts
if rocm_aiter_ops.is_fusion_moe_shared_experts_enabled() if self.is_fusion_moe_shared_experts_enabled
else None, else None,
) )
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment