Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
048bb597
Unverified
Commit
048bb597
authored
Jan 14, 2026
by
Hongxia Yang
Committed by
GitHub
Jan 13, 2026
Browse files
AMD CI Test - unskip moe_sum test and moe_align_block_size tests (#32039)
Signed-off-by:
Hongxia Yang
<
hongxia.yang@amd.com
>
parent
79336380
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
11 additions
and
4 deletions
+11
-4
tests/kernels/moe/test_moe.py
tests/kernels/moe/test_moe.py
+0
-1
tests/kernels/moe/test_moe_align_block_size.py
tests/kernels/moe/test_moe_align_block_size.py
+0
-3
vllm/platforms/rocm.py
vllm/platforms/rocm.py
+11
-0
No files found.
tests/kernels/moe/test_moe.py
View file @
048bb597
...
@@ -1161,7 +1161,6 @@ def test_batched_moe_align_block_size_opcheck():
...
@@ -1161,7 +1161,6 @@ def test_batched_moe_align_block_size_opcheck():
@
pytest
.
mark
.
parametrize
(
"topk"
,
TOP_KS
)
@
pytest
.
mark
.
parametrize
(
"topk"
,
TOP_KS
)
@
pytest
.
mark
.
parametrize
(
"k"
,
[
128
,
511
,
1024
])
@
pytest
.
mark
.
parametrize
(
"k"
,
[
128
,
511
,
1024
])
@
pytest
.
mark
.
parametrize
(
"dtype"
,
[
torch
.
float32
,
torch
.
bfloat16
])
@
pytest
.
mark
.
parametrize
(
"dtype"
,
[
torch
.
float32
,
torch
.
bfloat16
])
@
pytest
.
mark
.
skipif
(
current_platform
.
is_rocm
(),
reason
=
"Skip for rocm"
)
def
test_moe_sum
(
m
:
int
,
topk
:
int
,
k
:
int
,
dtype
:
torch
.
dtype
):
def
test_moe_sum
(
m
:
int
,
topk
:
int
,
k
:
int
,
dtype
:
torch
.
dtype
):
input
=
torch
.
randn
((
m
,
topk
,
k
),
device
=
"cuda"
,
dtype
=
dtype
)
input
=
torch
.
randn
((
m
,
topk
,
k
),
device
=
"cuda"
,
dtype
=
dtype
)
actual
=
torch
.
empty
((
m
,
k
),
device
=
"cuda"
,
dtype
=
dtype
)
actual
=
torch
.
empty
((
m
,
k
),
device
=
"cuda"
,
dtype
=
dtype
)
...
...
tests/kernels/moe/test_moe_align_block_size.py
View file @
048bb597
...
@@ -12,7 +12,6 @@ from vllm.model_executor.layers.fused_moe.moe_align_block_size import (
...
@@ -12,7 +12,6 @@ from vllm.model_executor.layers.fused_moe.moe_align_block_size import (
batched_moe_align_block_size
,
batched_moe_align_block_size
,
moe_align_block_size
,
moe_align_block_size
,
)
)
from
vllm.platforms
import
current_platform
from
vllm.utils.math_utils
import
round_up
from
vllm.utils.math_utils
import
round_up
from
vllm.utils.torch_utils
import
set_random_seed
from
vllm.utils.torch_utils
import
set_random_seed
...
@@ -185,7 +184,6 @@ def torch_moe_align_block_size(
...
@@ -185,7 +184,6 @@ def torch_moe_align_block_size(
@
pytest
.
mark
.
parametrize
(
"num_experts"
,
NUM_EXPERTS
)
@
pytest
.
mark
.
parametrize
(
"num_experts"
,
NUM_EXPERTS
)
@
pytest
.
mark
.
parametrize
(
"block_size"
,
BLOCK_SIZES
)
@
pytest
.
mark
.
parametrize
(
"block_size"
,
BLOCK_SIZES
)
@
pytest
.
mark
.
parametrize
(
"pad_sorted_ids"
,
[
False
,
True
])
@
pytest
.
mark
.
parametrize
(
"pad_sorted_ids"
,
[
False
,
True
])
@
pytest
.
mark
.
skipif
(
current_platform
.
is_rocm
(),
reason
=
"Skip for rocm"
)
def
test_moe_align_block_size
(
def
test_moe_align_block_size
(
m
:
int
,
topk
:
int
,
num_experts
:
int
,
block_size
:
int
,
pad_sorted_ids
:
bool
m
:
int
,
topk
:
int
,
num_experts
:
int
,
block_size
:
int
,
pad_sorted_ids
:
bool
):
):
...
@@ -245,7 +243,6 @@ def test_moe_align_block_size(
...
@@ -245,7 +243,6 @@ def test_moe_align_block_size(
@
pytest
.
mark
.
parametrize
(
"topk"
,
[
2
,
4
])
@
pytest
.
mark
.
parametrize
(
"topk"
,
[
2
,
4
])
@
pytest
.
mark
.
parametrize
(
"num_experts"
,
[
8
,
64
])
@
pytest
.
mark
.
parametrize
(
"num_experts"
,
[
8
,
64
])
@
pytest
.
mark
.
parametrize
(
"block_size"
,
[
64
])
@
pytest
.
mark
.
parametrize
(
"block_size"
,
[
64
])
@
pytest
.
mark
.
skipif
(
current_platform
.
is_rocm
(),
reason
=
"Skip for rocm"
)
def
test_moe_align_block_size_with_expert_map
(
def
test_moe_align_block_size_with_expert_map
(
m
:
int
,
topk
:
int
,
num_experts
:
int
,
block_size
:
int
m
:
int
,
topk
:
int
,
num_experts
:
int
,
block_size
:
int
):
):
...
...
vllm/platforms/rocm.py
View file @
048bb597
...
@@ -187,6 +187,17 @@ class RocmPlatform(Platform):
...
@@ -187,6 +187,17 @@ class RocmPlatform(Platform):
if
not
on_gfx9
():
if
not
on_gfx9
():
supported_quantization
+=
[
"bitsandbytes"
]
supported_quantization
+=
[
"bitsandbytes"
]
@
classmethod
def
import_kernels
(
cls
)
->
None
:
"""Import ROCm-specific kernels."""
super
().
import_kernels
()
import
contextlib
# Import ROCm-specific extension
with
contextlib
.
suppress
(
ImportError
):
import
vllm._rocm_C
# noqa: F401
@
classmethod
@
classmethod
def
get_attn_backend_cls
(
def
get_attn_backend_cls
(
cls
,
cls
,
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment