Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
15a0b9e5
Unverified
Commit
15a0b9e5
authored
Feb 07, 2026
by
lukec
Committed by
GitHub
Feb 06, 2026
Browse files
Fix spelling errors (#33978)
parent
c490d8cc
Changes
5
Show whitespace changes
Inline
Side-by-side
Showing
5 changed files
with
10 additions
and
10 deletions
+10
-10
tests/kernels/moe/test_cutedsl_moe.py
tests/kernels/moe/test_cutedsl_moe.py
+1
-1
tests/kernels/moe/test_moe_align_block_size.py
tests/kernels/moe/test_moe_align_block_size.py
+1
-1
tests/reasoning/test_hunyuan_reasoning_parser.py
tests/reasoning/test_hunyuan_reasoning_parser.py
+3
-3
vllm/model_executor/layers/fused_moe/oracle/fp8.py
vllm/model_executor/layers/fused_moe/oracle/fp8.py
+1
-1
vllm/v1/attention/ops/flashmla.py
vllm/v1/attention/ops/flashmla.py
+4
-4
No files found.
tests/kernels/moe/test_cutedsl_moe.py
View file @
15a0b9e5
...
@@ -139,7 +139,7 @@ def prepare_inputs(
...
@@ -139,7 +139,7 @@ def prepare_inputs(
masked_m
.
append
(
mask
.
sum
())
masked_m
.
append
(
mask
.
sum
())
masked_m
=
torch
.
tensor
(
masked_m
,
dtype
=
torch
.
int32
)
masked_m
=
torch
.
tensor
(
masked_m
,
dtype
=
torch
.
int32
)
# Intialize the hidden_states_3d with ones instead of empty to avoid nan
# In
i
tialize the hidden_states_3d with ones instead of empty to avoid nan
# issue.
# issue.
hidden_states_3d
=
torch
.
ones
(
hidden_states_3d
=
torch
.
ones
(
(
num_experts
,
max
(
masked_m
),
hidden_states
.
shape
[
1
]),
dtype
=
hidden_states
.
dtype
(
num_experts
,
max
(
masked_m
),
hidden_states
.
shape
[
1
]),
dtype
=
hidden_states
.
dtype
...
...
tests/kernels/moe/test_moe_align_block_size.py
View file @
15a0b9e5
...
@@ -334,7 +334,7 @@ def test_batched_moe_align_block_size(
...
@@ -334,7 +334,7 @@ def test_batched_moe_align_block_size(
ref_expert_ids
=
torch
.
empty
((
Msum
//
block_size
,),
dtype
=
torch
.
int32
)
ref_expert_ids
=
torch
.
empty
((
Msum
//
block_size
,),
dtype
=
torch
.
int32
)
ref_num_tokens_post_pad
=
torch
.
empty
((
1
,),
dtype
=
torch
.
int32
)
ref_num_tokens_post_pad
=
torch
.
empty
((
1
,),
dtype
=
torch
.
int32
)
# Intialize
# In
i
tialize
sentinel
=
E
*
max_tokens_per_batch
sentinel
=
E
*
max_tokens_per_batch
ref_sorted_ids
.
fill_
(
sentinel
)
ref_sorted_ids
.
fill_
(
sentinel
)
ref_expert_ids
.
fill_
(
-
1
)
ref_expert_ids
.
fill_
(
-
1
)
...
...
tests/reasoning/test_hunyuan_reasoning_parser.py
View file @
15a0b9e5
...
@@ -12,7 +12,7 @@ START_REASONING = "<think>\n"
...
@@ -12,7 +12,7 @@ START_REASONING = "<think>\n"
START_RESPONSE
=
"
\n
</think>
\n
<answer>
\n
"
START_RESPONSE
=
"
\n
</think>
\n
<answer>
\n
"
END_RESPONSE
=
"
\n
</answer>"
END_RESPONSE
=
"
\n
</answer>"
NO_REASONING_QUICK_TH
R
OUGHT
=
{
NO_REASONING_QUICK_THOUGHT
=
{
"output"
:
f
"
{
START_REASONING
}{
START_RESPONSE
}
This is the rest
{
END_RESPONSE
}
"
,
# noqa: E501
"output"
:
f
"
{
START_REASONING
}{
START_RESPONSE
}
This is the rest
{
END_RESPONSE
}
"
,
# noqa: E501
"reasoning"
:
None
,
"reasoning"
:
None
,
"content"
:
"This is the rest"
,
"content"
:
"This is the rest"
,
...
@@ -81,7 +81,7 @@ TEST_CASES = [
...
@@ -81,7 +81,7 @@ TEST_CASES = [
NO_REASONING
,
NO_REASONING
,
id
=
"no_reasoning"
,
id
=
"no_reasoning"
,
),
),
pytest
.
param
(
False
,
NO_REASONING_QUICK_TH
R
OUGHT
,
id
=
"no_reasoning_quick"
),
pytest
.
param
(
False
,
NO_REASONING_QUICK_THOUGHT
,
id
=
"no_reasoning_quick"
),
pytest
.
param
(
pytest
.
param
(
False
,
False
,
MULTIPLE_LINES
,
MULTIPLE_LINES
,
...
@@ -117,7 +117,7 @@ TEST_CASES = [
...
@@ -117,7 +117,7 @@ TEST_CASES = [
NO_REASONING
,
NO_REASONING
,
id
=
"no_reasoning_streaming"
,
id
=
"no_reasoning_streaming"
,
),
),
pytest
.
param
(
True
,
NO_REASONING_QUICK_TH
R
OUGHT
,
id
=
"no_reasoning_quick_stream"
),
pytest
.
param
(
True
,
NO_REASONING_QUICK_THOUGHT
,
id
=
"no_reasoning_quick_stream"
),
pytest
.
param
(
pytest
.
param
(
True
,
True
,
MULTIPLE_LINES
,
MULTIPLE_LINES
,
...
...
vllm/model_executor/layers/fused_moe/oracle/fp8.py
View file @
15a0b9e5
...
@@ -333,7 +333,7 @@ def select_fp8_moe_backend(
...
@@ -333,7 +333,7 @@ def select_fp8_moe_backend(
# TODO(rob): per discussion with TPU team, we need a way to register
# TODO(rob): per discussion with TPU team, we need a way to register
# MoE backends by OOT plugins, rather than having an explicit list
# MoE backends by OOT plugins, rather than having an explicit list
# of AVAILBLE_BACKENDS. Enabling returning `Fp8MoeBackend.NONE` is
# of AVAIL
A
BLE_BACKENDS. Enabling returning `Fp8MoeBackend.NONE` is
# a temporary measure until these register APIs are complete.
# a temporary measure until these register APIs are complete.
if
current_platform
.
is_cuda
()
or
current_platform
.
is_rocm
():
if
current_platform
.
is_cuda
()
or
current_platform
.
is_rocm
():
raise
NotImplementedError
(
raise
NotImplementedError
(
...
...
vllm/v1/attention/ops/flashmla.py
View file @
15a0b9e5
...
@@ -52,8 +52,8 @@ def is_flashmla_dense_supported() -> tuple[bool, str | None]:
...
@@ -52,8 +52,8 @@ def is_flashmla_dense_supported() -> tuple[bool, str | None]:
"""
"""
Return: is_supported_flag, unsupported_reason (optional).
Return: is_supported_flag, unsupported_reason (optional).
"""
"""
is_availble
,
maybe_reason
=
_is_flashmla_available
()
is_avail
a
ble
,
maybe_reason
=
_is_flashmla_available
()
if
not
is_availble
:
if
not
is_avail
a
ble
:
return
False
,
maybe_reason
return
False
,
maybe_reason
if
not
current_platform
.
is_device_capability_family
(
90
):
if
not
current_platform
.
is_device_capability_family
(
90
):
return
False
,
"FlashMLA Dense is only supported on Hopper devices."
return
False
,
"FlashMLA Dense is only supported on Hopper devices."
...
@@ -64,8 +64,8 @@ def is_flashmla_sparse_supported() -> tuple[bool, str | None]:
...
@@ -64,8 +64,8 @@ def is_flashmla_sparse_supported() -> tuple[bool, str | None]:
"""
"""
Return: is_supported_flag, unsupported_reason (optional).
Return: is_supported_flag, unsupported_reason (optional).
"""
"""
is_availble
,
maybe_reason
=
_is_flashmla_available
()
is_avail
a
ble
,
maybe_reason
=
_is_flashmla_available
()
if
not
is_availble
:
if
not
is_avail
a
ble
:
return
False
,
maybe_reason
return
False
,
maybe_reason
if
not
(
if
not
(
current_platform
.
is_device_capability_family
(
90
)
current_platform
.
is_device_capability_family
(
90
)
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment