"vscode:/vscode.git/clone" did not exist on "b9a7f32674a28069a8d08a8bd544193b834977be"
Unverified commit b57d87c2, authored by fzyzcjy, committed by GitHub
Browse files

Fix shared experts fusion + weight requant (#7177)

parent 98538822
......@@ -1960,14 +1960,15 @@ class DeepseekV2ForCausalLM(nn.Module):
 )
 if layer_id in moe_layers:
-shared_experts = layer.mlp.shared_experts
-for module in [
-shared_experts.gate_up_proj,
-shared_experts.down_proj,
-]:
-requant_weight_ue8m0_inplace(
-module.weight, module.weight_scale_inv, weight_block_size
-)
+shared_experts = getattr(layer.mlp, "shared_experts", None)
+if shared_experts is not None:
+for module in [
+shared_experts.gate_up_proj,
+shared_experts.down_proj,
+]:
+requant_weight_ue8m0_inplace(
+module.weight, module.weight_scale_inv, weight_block_size
+)
 experts = layer.mlp.experts
 if isinstance(experts, DeepEPMoE):
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment