Unverified commit ebda73dc, authored by Qiaolin Yu, committed by GitHub
Browse files

Use cutlass fp4 gemm by default (#11813)

parent f4f8a1b4
......@@ -79,7 +79,7 @@ CUTEDSL_MOE_SCALAR_INPUT_SCALE = get_bool_env_var(
"SGLANG_CUTEDSL_MOE_SCALAR_INPUT_SCALE", "true"
)
USE_CUTLASS_BACKEND_FOR_FP4_GEMM = get_bool_env_var(
-"SGLANG_USE_CUTLASS_BACKEND_FOR_FP4_GEMM"
+"SGLANG_USE_CUTLASS_BACKEND_FOR_FP4_GEMM", "true"
)
# TODO make it true by default when the DeepEP PR is merged
CUTEDSL_MOE_NVFP4_DISPATCH = get_bool_env_var(
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment