Unverified commit ec7d9e67, authored by danisereb and committed by GitHub
Browse files

Fix call to moe_mk in modelopt MoE modules (required for LoRA) (#34575)


Signed-off-by: Daniel Serebrenik <daserebrenik@nvidia.com>
parent 3bb4e431
...@@ -977,11 +977,11 @@ class ModelOptFp8MoEMethod(FusedMoEMethodBase): ...@@ -977,11 +977,11 @@ class ModelOptFp8MoEMethod(FusedMoEMethodBase):
assert self.moe_mk is not None assert self.moe_mk is not None
return self.moe_mk( return self.moe_mk(
x, hidden_states=x,
layer.w13_weight, w1=layer.w13_weight,
layer.w2_weight, w2=layer.w2_weight,
topk_weights, topk_weights=topk_weights,
topk_ids, topk_ids=topk_ids,
activation=layer.activation, activation=layer.activation,
global_num_experts=layer.global_num_experts, global_num_experts=layer.global_num_experts,
expert_map=layer.expert_map, expert_map=layer.expert_map,
...@@ -1549,11 +1549,11 @@ class ModelOptNvFp4FusedMoE(FusedMoEMethodBase): ...@@ -1549,11 +1549,11 @@ class ModelOptNvFp4FusedMoE(FusedMoEMethodBase):
else: else:
assert self.moe_mk is not None assert self.moe_mk is not None
return self.moe_mk( return self.moe_mk(
x, hidden_states=x,
layer.w13_weight, w1=layer.w13_weight,
layer.w2_weight, w2=layer.w2_weight,
topk_weights, topk_weights=topk_weights,
topk_ids, topk_ids=topk_ids,
activation=layer.activation, activation=layer.activation,
global_num_experts=layer.global_num_experts, global_num_experts=layer.global_num_experts,
expert_map=layer.expert_map, expert_map=layer.expert_map,
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment