Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
4979eb79
Unverified
Commit
4979eb79
authored
Sep 15, 2025
by
Didier Durand
Committed by
GitHub
Sep 15, 2025
Browse files
[Doc]: fix typos in various files (#24821)
Signed-off-by:
Didier Durand
<
durand.didier@gmail.com
>
parent
a8c0f599
Changes
7
Show whitespace changes
Inline
Side-by-side
Showing
7 changed files
with
7 additions
and
7 deletions
+7
-7
.buildkite/nightly-benchmarks/nightly-descriptions.md
.buildkite/nightly-benchmarks/nightly-descriptions.md
+1
-1
vllm/model_executor/layers/quantization/moe_wna16.py
vllm/model_executor/layers/quantization/moe_wna16.py
+1
-1
vllm/model_executor/layers/quantization/utils/marlin_utils_test.py
...l_executor/layers/quantization/utils/marlin_utils_test.py
+1
-1
vllm/model_executor/layers/sampler.py
vllm/model_executor/layers/sampler.py
+1
-1
vllm/model_executor/models/glm4_1v.py
vllm/model_executor/models/glm4_1v.py
+1
-1
vllm/model_executor/models/interns1.py
vllm/model_executor/models/interns1.py
+1
-1
vllm/model_executor/models/ultravox.py
vllm/model_executor/models/ultravox.py
+1
-1
No files found.
.buildkite/nightly-benchmarks/nightly-descriptions.md
View file @
4979eb79
...
...
@@ -8,7 +8,7 @@ This benchmark aims to:
Latest results:
[
results link
](
https://blog.vllm.ai/2024/09/05/perf-update.html
)
, scroll to the end.
Latest reproduction gui
l
de:
[
github issue link
](
https://github.com/vllm-project/vllm/issues/8176
)
Latest reproduction guide:
[
github issue link
](
https://github.com/vllm-project/vllm/issues/8176
)
## Setup
...
...
vllm/model_executor/layers/quantization/moe_wna16.py
View file @
4979eb79
...
...
@@ -190,7 +190,7 @@ class MoeWNA16Method(FusedMoEMethodBase):
group_size
=
self
.
quant_config
.
group_size
group_size_div_factor
=
1
# make intermediate_size and hidden_size divi
a
ble by group_size
# make intermediate_size and hidden_size divi
si
ble by group_size
# we reduce the group size to ensure that
# and we would repeat the loaded_weight later
while
intermediate_size_per_partition
%
group_size
or
\
...
...
vllm/model_executor/layers/quantization/utils/marlin_utils_test.py
View file @
4979eb79
...
...
@@ -19,7 +19,7 @@ class MarlinWorkspace:
def
__init__
(
self
,
out_features
,
min_thread_n
,
max_parallel
):
assert
(
out_features
%
min_thread_n
==
0
),
(
"out_features = {} is
u
ndivisible by min_thread_n = {}"
.
format
(
"out_features = {} is
i
ndivisible by min_thread_n = {}"
.
format
(
out_features
,
min_thread_n
))
max_workspace_size
=
((
out_features
//
min_thread_n
)
*
max_parallel
)
...
...
vllm/model_executor/layers/sampler.py
View file @
4979eb79
...
...
@@ -649,7 +649,7 @@ def _sample_with_torch(
else
:
sampled_token_ids_tensor
=
None
# Counterint
i
utively, having two loops here is actually faster.
# Counterintu
i
tively, having two loops here is actually faster.
# The first loop can run without waiting on GPU<->CPU sync.
for
sampling_type
in
SamplingType
:
sample_indices
=
categorized_sample_indices
[
sampling_type
]
...
...
vllm/model_executor/models/glm4_1v.py
View file @
4979eb79
...
...
@@ -1524,7 +1524,7 @@ class Glm4vForConditionalGeneration(nn.Module, SupportsMultiModal,
return
None
# The result multimodal_embeddings is tuple of tensors, with each
# tensor correspo
e
nding to a multimodal data item (image or video).
# tensor corresponding to a multimodal data item (image or video).
multimodal_embeddings
:
tuple
[
torch
.
Tensor
,
...]
=
()
# NOTE: It is important to iterate over the keys in this dictionary
...
...
vllm/model_executor/models/interns1.py
View file @
4979eb79
...
...
@@ -738,7 +738,7 @@ class InternS1ForConditionalGeneration(nn.Module, SupportsMultiModal,
return
[]
# The result multimodal_embeddings is tuple of tensors, with each
# tensor correspo
e
nding to a multimodal data item (image or video).
# tensor corresponding to a multimodal data item (image or video).
multimodal_embeddings
:
tuple
[
torch
.
Tensor
,
...]
=
()
# NOTE: It is important to iterate over the keys in this dictionary
...
...
vllm/model_executor/models/ultravox.py
View file @
4979eb79
...
...
@@ -662,7 +662,7 @@ def pad_and_concat_to_dim3(
max_len
=
max
(
f
.
shape
[
-
1
]
for
f
in
features
)
# Ensure all features have dim=3
features
=
[
f
.
view
(
-
1
,
*
f
.
shape
[
-
2
:])
for
f
in
features
]
# Pad and oncatenate:
# Pad and
c
oncatenate:
# [[B1, 80, M1], [B2, 80, M2]] -> [B1+B2, 80, max(M1, M2)]
features
=
[
F
.
pad
(
f
,
(
0
,
max_len
-
f
.
shape
[
-
1
]))
for
f
in
features
]
return
torch
.
cat
(
features
)
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment