Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
02e8f26c
Unverified
Commit
02e8f26c
authored
Feb 17, 2026
by
Luka Govedič
Committed by
GitHub
Feb 18, 2026
Browse files
[torch.compile] Turn on silu+fp4 quant fusion by default for O1+ (#34718)
Signed-off-by: Luka Govedič <lgovedic@redhat.com>
parent
4a00a511
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing 1 changed file with 10 additions and 5 deletions
+10
-5
vllm/config/vllm.py
vllm/config/vllm.py
+10
-5
No files found.
vllm/config/vllm.py
View file @
02e8f26c
...
...
@@ -95,11 +95,16 @@ def enable_norm_fusion(cfg: "VllmConfig") -> bool:
def enable_act_fusion(cfg: "VllmConfig") -> bool:
    """
    Enable if either SiLU+Mul or quant FP8 custom op is active;
    otherwise Inductor handles fusion.
    Also enable for FP4 models as FP4 quant is always custom so Inductor cannot fuse it.

    Args:
        cfg: Configuration object exposing ``compilation_config`` (queried via
            ``is_custom_op_enabled``) and ``model_config`` (which may be
            ``None``).

    Returns:
        A truthy value when the ``silu_and_mul`` or ``quant_fp8`` custom op is
        enabled, or when a model config is present and reports NVFP4
        quantization; a falsy value otherwise.
    """
    return (
        cfg.compilation_config.is_custom_op_enabled("silu_and_mul")
        or cfg.compilation_config.is_custom_op_enabled("quant_fp8")
        # model_config can be None, so guard before asking about FP4.
        or (cfg.model_config is not None and cfg.model_config.is_nvfp4_quantized())
    )
def
enable_allreduce_rms_fusion
(
cfg
:
"VllmConfig"
)
->
bool
:
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment