Commit e3f08c77 (unverified), authored by Elfie Guo, committed by GitHub
Browse files

Update cutlass_moe.py (#8545)

parent a9fd8033
......@@ -209,7 +209,7 @@ def cutlass_fused_experts_fp8(
)
result = torch.empty((m, k), device=device, dtype=out_dtype)
-apply_shuffle_mul_sum(c2, result, c_map, topk_weights)
+apply_shuffle_mul_sum(c2, result, c_map, topk_weights.to(out_dtype))
return result
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment