Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
86d92eb9
Commit
86d92eb9
authored
Oct 23, 2025
by
zhuwenwen
Browse files
update test_moe.py
set USE_FUSED_RMS_QUANT=1 and USE_FUSED_SILU_MUL_QUANT=1
parent
6f1db287
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
7 additions
and
3 deletions
+7
-3
tests/kernels/moe/test_moe.py
tests/kernels/moe/test_moe.py
+3
-3
vllm/model_executor/model_loader/utils.py
vllm/model_executor/model_loader/utils.py
+4
-0
No files found.
tests/kernels/moe/test_moe.py
View file @
86d92eb9
...
...
@@ -114,9 +114,9 @@ def run_moe_test(
return
baseline_output
@
pytest
.
mark
.
parametrize
(
"m"
,
[
1
,
33
,
64
,
222
,
32768
,
40000
])
@
pytest
.
mark
.
parametrize
(
"m"
,
[
1
,
33
,
64
,
32768
,
40000
])
@
pytest
.
mark
.
parametrize
(
"n"
,
[
128
,
1024
,
2048
])
@
pytest
.
mark
.
parametrize
(
"k"
,
[
128
,
51
1
,
1024
])
@
pytest
.
mark
.
parametrize
(
"k"
,
[
128
,
51
2
,
1024
])
@
pytest
.
mark
.
parametrize
(
"e"
,
NUM_EXPERTS
)
@
pytest
.
mark
.
parametrize
(
"topk"
,
TOP_KS
)
@
pytest
.
mark
.
parametrize
(
"ep_size"
,
EP_SIZE
)
...
...
@@ -734,7 +734,7 @@ def test_moe_align_block_size_opcheck():
@
pytest
.
mark
.
parametrize
(
"m"
,
[
1
,
33
,
64
,
222
])
@
pytest
.
mark
.
parametrize
(
"topk"
,
TOP_KS
)
@
pytest
.
mark
.
parametrize
(
"k"
,
[
128
,
51
2
,
1024
])
@
pytest
.
mark
.
parametrize
(
"k"
,
[
128
,
51
1
,
1024
])
@
pytest
.
mark
.
parametrize
(
"dtype"
,
[
torch
.
float32
,
torch
.
float16
,
torch
.
bfloat16
])
@
pytest
.
mark
.
skipif
(
current_platform
.
is_rocm
(),
reason
=
"Skip for rocm"
)
...
...
vllm/model_executor/model_loader/utils.py
View file @
86d92eb9
...
...
@@ -260,6 +260,10 @@ def get_model_architecture(
os
.
environ
[
'VLLM_USE_LIGHTOP'
]
=
'1'
if
not
envs
.
is_set
(
"VLLM_USE_OPT_CAT"
):
os
.
environ
[
'VLLM_USE_OPT_CAT'
]
=
'1'
if
not
envs
.
is_set
(
"USE_FUSED_RMS_QUANT"
):
os
.
environ
[
'USE_FUSED_RMS_QUANT'
]
=
'1'
if
not
envs
.
is_set
(
"USE_FUSED_SILU_MUL_QUANT"
):
os
.
environ
[
'USE_FUSED_SILU_MUL_QUANT'
]
=
'1'
# awq相关配置
try
:
if
os
.
getenv
(
'AWQ_MOE_SZ'
)
==
None
:
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment