Unverified commit 6b2fa3a7, authored by Robert Shaw, committed by GitHub
Browse files

[MoE] Move FlashInfer CuteDSL experts into fused_moe/experts/ (#37759)


Signed-off-by: Robert Shaw <robertgshaw2@gmail.com>
parent eeee5b26
......@@ -17,7 +17,7 @@ from flashinfer import fp4_quantize
from torch.nn import functional as F
from vllm.model_executor.layers.activation import SiluAndMul
-from vllm.model_executor.layers.fused_moe.flashinfer_cutedsl_moe import (
+from vllm.model_executor.layers.fused_moe.experts.flashinfer_cutedsl_moe import (
flashinfer_cutedsl_moe_masked,
)
from vllm.utils.flashinfer import (
......
......@@ -86,7 +86,7 @@ def backend_to_kernel_cls(
return [FlashInferExperts]
elif backend == NvFp4MoeBackend.FLASHINFER_CUTEDSL:
-from vllm.model_executor.layers.fused_moe.flashinfer_cutedsl_moe import (
+from vllm.model_executor.layers.fused_moe.experts.flashinfer_cutedsl_moe import ( # noqa: E501
FlashInferCuteDSLExperts,
)
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment