"docs/source/api/schedulers/ddpm.mdx" did not exist on "5a38033de4824c8d5d9b2856776df45592a8e825"
Unverified commit e3e75a78, authored by Cheng Wan, committed by GitHub
Browse files

Fix the deprecation warning for enable_flashinfer_mxfp4_moe (#9214)

parent d4db9b02
......@@ -290,6 +290,7 @@ class ServerArgs:
enable_flashinfer_cutlass_moe: bool = False
enable_flashinfer_trtllm_moe: bool = False
enable_triton_kernel_moe: bool = False
enable_flashinfer_mxfp4_moe: bool = False
def __post_init__(self):
# Check deprecated arguments
......@@ -321,6 +322,11 @@ class ServerArgs:
print_deprecated_warning(
"NOTE: --enable-flashinfer-trtllm-moe is deprecated. Please set `--moe-runner-backend` to 'flashinfer_trtllm' instead."
)
if self.enable_flashinfer_mxfp4_moe:
self.moe_runner_backend = "flashinfer_mxfp4"
print_deprecated_warning(
"NOTE: --enable-flashinfer-mxfp4-moe is deprecated. Please set `--moe-runner-backend` to 'flashinfer_mxfp4' instead."
)
# Set missing default values
if self.tokenizer_path is None:
......@@ -1851,11 +1857,6 @@ class ServerArgs:
action="store_true",
help="Enable returning hidden states with responses.",
)
parser.add_argument(
"--enable-flashinfer-mxfp4-moe",
action="store_true",
help="Enable FlashInfer MXFP4 MoE backend for modelopt_fp4 quant on Blackwell.",
)
parser.add_argument(
"--scheduler-recv-interval",
type=int,
......@@ -2001,6 +2002,11 @@ class ServerArgs:
action="store_true",
help="(Deprecated) Use triton moe grouped gemm kernel.",
)
parser.add_argument(
"--enable-flashinfer-mxfp4-moe",
action="store_true",
help="(Deprecated) Enable FlashInfer MXFP4 MoE backend for modelopt_fp4 quant on Blackwell.",
)
@classmethod
def from_cli_args(cls, args: argparse.Namespace):
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment