Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
42b42824
Unverified
Commit
42b42824
authored
Dec 21, 2025
by
Kevin McKay
Committed by
GitHub
Dec 21, 2025
Browse files
[Misc] Fix grammar errors in comments and messages (#31115)
Signed-off-by:
c0de128
<
kevin.mckay@outlook.com
>
parent
ec58c10c
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
4 additions
and
4 deletions
+4
-4
tests/quantization/test_compressed_tensors.py
tests/quantization/test_compressed_tensors.py
+3
-3
vllm/attention/ops/merge_attn_states.py
vllm/attention/ops/merge_attn_states.py
+1
-1
No files found.
tests/quantization/test_compressed_tensors.py
View file @
42b42824
...
@@ -83,7 +83,7 @@ def test_compressed_tensors_w8a8_static_setup(vllm_runner, model_args):
...
@@ -83,7 +83,7 @@ def test_compressed_tensors_w8a8_static_setup(vllm_runner, model_args):
current_platform
.
is_rocm
()
current_platform
.
is_rocm
()
and
model_path
not
in
ROCM_TRITON_SCALED_MM_SUPPORTED_INT8_MODEL
and
model_path
not
in
ROCM_TRITON_SCALED_MM_SUPPORTED_INT8_MODEL
):
):
pytest
.
skip
(
f
"Skip model
{
model_path
}
as it is not support on ROCm."
)
pytest
.
skip
(
f
"Skip model
{
model_path
}
as it is not support
ed
on ROCm."
)
with
vllm_runner
(
model_path
,
enforce_eager
=
True
)
as
llm
:
with
vllm_runner
(
model_path
,
enforce_eager
=
True
)
as
llm
:
...
@@ -161,7 +161,7 @@ def test_compressed_tensors_w8a8_logprobs(
...
@@ -161,7 +161,7 @@ def test_compressed_tensors_w8a8_logprobs(
current_platform
.
is_rocm
()
current_platform
.
is_rocm
()
and
model_path
not
in
ROCM_TRITON_SCALED_MM_SUPPORTED_INT8_MODEL
and
model_path
not
in
ROCM_TRITON_SCALED_MM_SUPPORTED_INT8_MODEL
):
):
pytest
.
skip
(
f
"Skip model
{
model_path
}
as it is not support on ROCm."
)
pytest
.
skip
(
f
"Skip model
{
model_path
}
as it is not support
ed
on ROCm."
)
if
use_aiter
:
if
use_aiter
:
if
model_path
not
in
ROCM_AITER_SUPPORTED_INT8_MODEL
:
if
model_path
not
in
ROCM_AITER_SUPPORTED_INT8_MODEL
:
...
@@ -231,7 +231,7 @@ def test_compressed_tensors_w8a8_dynamic_per_token(
...
@@ -231,7 +231,7 @@ def test_compressed_tensors_w8a8_dynamic_per_token(
current_platform
.
is_rocm
()
current_platform
.
is_rocm
()
and
model_path
not
in
ROCM_TRITON_SCALED_MM_SUPPORTED_INT8_MODEL
and
model_path
not
in
ROCM_TRITON_SCALED_MM_SUPPORTED_INT8_MODEL
):
):
pytest
.
skip
(
f
"Skip model
{
model_path
}
as it is not support on ROCm."
)
pytest
.
skip
(
f
"Skip model
{
model_path
}
as it is not support
ed
on ROCm."
)
if
use_aiter
:
if
use_aiter
:
if
model_path
not
in
ROCM_AITER_SUPPORTED_INT8_MODEL
:
if
model_path
not
in
ROCM_AITER_SUPPORTED_INT8_MODEL
:
...
...
vllm/attention/ops/merge_attn_states.py
View file @
42b42824
...
@@ -15,7 +15,7 @@ def merge_attn_states(
...
@@ -15,7 +15,7 @@ def merge_attn_states(
output_lse
:
torch
.
Tensor
|
None
=
None
,
output_lse
:
torch
.
Tensor
|
None
=
None
,
)
->
None
:
)
->
None
:
# NOTE(DefTruth): Currently, custom merge_attn_states CUDA kernel
# NOTE(DefTruth): Currently, custom merge_attn_states CUDA kernel
#
i
s not support
for
FP8 dtype, fallback to use Triton kernel.
#
doe
s not support FP8 dtype, fallback to use Triton kernel.
def
supported_dtypes
(
o
:
torch
.
Tensor
)
->
bool
:
def
supported_dtypes
(
o
:
torch
.
Tensor
)
->
bool
:
return
o
.
dtype
in
[
torch
.
float32
,
torch
.
half
,
torch
.
bfloat16
]
return
o
.
dtype
in
[
torch
.
float32
,
torch
.
half
,
torch
.
bfloat16
]
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment