Unverified commit 0ca3e568, authored by fzyzcjy, committed by GitHub
Browse files

Tiny fix missing expert location dispatch info (#6620)

parent 5c7aa009
...@@ -360,6 +360,9 @@ class DeepseekV2MoE(nn.Module): ...@@ -360,6 +360,9 @@ class DeepseekV2MoE(nn.Module):
correction_bias=self.correction_bias, correction_bias=self.correction_bias,
routed_scaling_factor=self.routed_scaling_factor, routed_scaling_factor=self.routed_scaling_factor,
num_token_non_padded=forward_batch.num_token_non_padded, num_token_non_padded=forward_batch.num_token_non_padded,
expert_location_dispatch_info=ExpertLocationDispatchInfo.init_new(
layer_id=self.layer_id,
),
) )
else: else:
topk_idx = torch.full( topk_idx = torch.full(
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment