Unverified commit 4d16c88b, authored by Elfie Guo and committed by GitHub
Browse files

Update cutlass_moe.py (#8535)

parent 7a4309cc
@@ -209,7 +209,8 @@ def cutlass_fused_experts_fp8(
     )
     result = torch.empty((m, k), device=device, dtype=out_dtype)
-    return apply_shuffle_mul_sum(c2, result, c_map, topk_weights)
+    apply_shuffle_mul_sum(c2, result, c_map, topk_weights)
+    return result
 
 FLOAT4_E2M1_MAX = 6.0
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment