Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
8548cf87
Commit
8548cf87
authored
Dec 15, 2025
by
zhuwenwen
Browse files
set VLLM_USE_LIGHTOP_FILL_MOE_ALIGN=0 when using non-quantized dpsk-v3
parent
a1314cac
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
4 additions
and
5 deletions
+4
-5
vllm/model_executor/model_loader/utils.py
vllm/model_executor/model_loader/utils.py
+4
-5
No files found.
vllm/model_executor/model_loader/utils.py
View file @
8548cf87
...
...
@@ -251,8 +251,6 @@ def get_model_architecture(
os
.
environ
[
'VLLM_USE_LIGHTOP_MOE_SUM_MUL_ADD'
]
=
'1'
if
not
envs
.
is_set
(
"VLLM_USE_OPT_CAT"
):
os
.
environ
[
'VLLM_USE_OPT_CAT'
]
=
'1'
if
not
envs
.
is_set
(
"VLLM_USE_LIGHTOP_FILL_MOE_ALIGN"
):
os
.
environ
[
'VLLM_USE_LIGHTOP_FILL_MOE_ALIGN'
]
=
'1'
if
not
envs
.
is_set
(
"VLLM_USE_CAT_MLA"
):
os
.
environ
[
'VLLM_USE_CAT_MLA'
]
=
'1'
if
not
envs
.
is_set
(
"VLLM_REJECT_SAMPLE_OPT"
):
...
...
@@ -266,6 +264,8 @@ def get_model_architecture(
os
.
environ
[
'USE_FUSED_RMS_QUANT'
]
=
'1'
if
not
envs
.
is_set
(
"USE_FUSED_SILU_MUL_QUANT"
):
os
.
environ
[
'USE_FUSED_SILU_MUL_QUANT'
]
=
'1'
if
not
envs
.
is_set
(
"VLLM_USE_LIGHTOP_FILL_MOE_ALIGN"
):
os
.
environ
[
'VLLM_USE_LIGHTOP_FILL_MOE_ALIGN'
]
=
'1'
else
:
if
not
envs
.
is_set
(
"VLLM_USE_PD_SPLIT"
):
os
.
environ
[
'VLLM_USE_PD_SPLIT'
]
=
'1'
...
...
@@ -296,8 +296,6 @@ def get_model_architecture(
os
.
environ
[
'VLLM_USE_LIGHTOP_MOE_SUM_MUL_ADD'
]
=
'1'
if
not
envs
.
is_set
(
"VLLM_USE_OPT_CAT"
):
os
.
environ
[
'VLLM_USE_OPT_CAT'
]
=
'1'
if
not
envs
.
is_set
(
"VLLM_USE_LIGHTOP_FILL_MOE_ALIGN"
):
os
.
environ
[
'VLLM_USE_LIGHTOP_FILL_MOE_ALIGN'
]
=
'1'
if
not
envs
.
is_set
(
"VLLM_USE_CAT_MLA"
):
os
.
environ
[
'VLLM_USE_CAT_MLA'
]
=
'1'
if
not
envs
.
is_set
(
"VLLM_REJECT_SAMPLE_OPT"
):
...
...
@@ -307,11 +305,12 @@ def get_model_architecture(
if
not
envs
.
is_set
(
"VLLM_SCHED_ENABLE_MINIMAL_INJECTION"
):
os
.
environ
[
'VLLM_SCHED_ENABLE_MINIMAL_INJECTION'
]
=
'1'
if
model_config
.
quantization
in
{
"slimquant_w4a8"
,
"slimquant_w4a8_marlin"
,
"slimquant_compressed_tensors_marlin"
,
"compressed-tensors"
}:
if
not
envs
.
is_set
(
"USE_FUSED_RMS_QUANT"
):
os
.
environ
[
'USE_FUSED_RMS_QUANT'
]
=
'1'
if
not
envs
.
is_set
(
"USE_FUSED_SILU_MUL_QUANT"
):
os
.
environ
[
'USE_FUSED_SILU_MUL_QUANT'
]
=
'1'
if
not
envs
.
is_set
(
"VLLM_USE_LIGHTOP_FILL_MOE_ALIGN"
):
os
.
environ
[
'VLLM_USE_LIGHTOP_FILL_MOE_ALIGN'
]
=
'1'
else
:
if
not
envs
.
is_set
(
"VLLM_USE_PD_SPLIT"
):
os
.
environ
[
'VLLM_USE_PD_SPLIT'
]
=
'1'
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment