Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
cc7f22a8
Commit
cc7f22a8
authored
Jun 11, 2025
by
zhuwenwen
Browse files
Merge tag 'v0.9.1' into v0.9.1-ori
parents
b9ea0c09
b6553be1
Changes
1000
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
36 additions
and
3 deletions
+36
-3
tests/distributed/test_expert_parallel.py
tests/distributed/test_expert_parallel.py
+1
-0
tests/distributed/test_multi_node_assignment.py
tests/distributed/test_multi_node_assignment.py
+1
-0
tests/distributed/test_pipeline_parallel.py
tests/distributed/test_pipeline_parallel.py
+2
-0
tests/distributed/test_pipeline_partition.py
tests/distributed/test_pipeline_partition.py
+1
-0
tests/distributed/test_pp_cudagraph.py
tests/distributed/test_pp_cudagraph.py
+1
-0
tests/distributed/test_pynccl.py
tests/distributed/test_pynccl.py
+1
-0
tests/distributed/test_same_node.py
tests/distributed/test_same_node.py
+1
-0
tests/distributed/test_sequence_parallel.py
tests/distributed/test_sequence_parallel.py
+1
-0
tests/distributed/test_shm_broadcast.py
tests/distributed/test_shm_broadcast.py
+1
-0
tests/distributed/test_torchrun_example.py
tests/distributed/test_torchrun_example.py
+1
-0
tests/distributed/test_utils.py
tests/distributed/test_utils.py
+1
-0
tests/encoder_decoder/test_e2e_correctness.py
tests/encoder_decoder/test_e2e_correctness.py
+1
-0
tests/engine/conftest.py
tests/engine/conftest.py
+1
-0
tests/engine/test_arg_utils.py
tests/engine/test_arg_utils.py
+16
-3
tests/engine/test_computed_prefix_blocks.py
tests/engine/test_computed_prefix_blocks.py
+1
-0
tests/engine/test_executor.py
tests/engine/test_executor.py
+1
-0
tests/engine/test_multi_step_output_processor.py
tests/engine/test_multi_step_output_processor.py
+1
-0
tests/engine/test_multiproc_workers.py
tests/engine/test_multiproc_workers.py
+1
-0
tests/engine/test_options.py
tests/engine/test_options.py
+1
-0
tests/engine/test_short_mm_context.py
tests/engine/test_short_mm_context.py
+1
-0
No files found.
Too many changes to show.
To preserve performance only
1000 of 1000+
files are displayed.
Plain diff
Email patch
tests/distributed/test_expert_parallel.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
from
dataclasses
import
dataclass
from
dataclasses
import
dataclass
from
typing
import
Literal
,
NamedTuple
,
Optional
from
typing
import
Literal
,
NamedTuple
,
Optional
...
...
tests/distributed/test_multi_node_assignment.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
"""Make sure ray assigns GPU workers to the correct node.
"""Make sure ray assigns GPU workers to the correct node.
Run:
Run:
...
...
tests/distributed/test_pipeline_parallel.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
"""
"""
WARNING: This test runs in both single-node (4 GPUs) and multi-node
WARNING: This test runs in both single-node (4 GPUs) and multi-node
(2 node with 2 GPUs each) modes. If the test only uses 2 GPUs, it is
(2 node with 2 GPUs each) modes. If the test only uses 2 GPUs, it is
...
@@ -227,6 +228,7 @@ MULTIMODAL_MODELS = {
...
@@ -227,6 +228,7 @@ MULTIMODAL_MODELS = {
"llava-hf/llava-onevision-qwen2-0.5b-ov-hf"
:
PPTestSettings
.
fast
(),
"llava-hf/llava-onevision-qwen2-0.5b-ov-hf"
:
PPTestSettings
.
fast
(),
"openbmb/MiniCPM-Llama3-V-2_5"
:
PPTestSettings
.
fast
(),
"openbmb/MiniCPM-Llama3-V-2_5"
:
PPTestSettings
.
fast
(),
"allenai/Molmo-7B-D-0924"
:
PPTestSettings
.
fast
(),
"allenai/Molmo-7B-D-0924"
:
PPTestSettings
.
fast
(),
"AIDC-AI/Ovis2-1B"
:
PPTestSettings
.
fast
(),
"microsoft/Phi-3.5-vision-instruct"
:
PPTestSettings
.
fast
(),
"microsoft/Phi-3.5-vision-instruct"
:
PPTestSettings
.
fast
(),
"mistralai/Pixtral-12B-2409"
:
PPTestSettings
.
fast
(
load_format
=
"dummy"
),
"mistralai/Pixtral-12B-2409"
:
PPTestSettings
.
fast
(
load_format
=
"dummy"
),
"Qwen/Qwen-VL-Chat"
:
PPTestSettings
.
fast
(),
"Qwen/Qwen-VL-Chat"
:
PPTestSettings
.
fast
(),
...
...
tests/distributed/test_pipeline_partition.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
import
os
import
os
...
...
tests/distributed/test_pp_cudagraph.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
from
__future__
import
annotations
from
__future__
import
annotations
from
typing
import
TYPE_CHECKING
from
typing
import
TYPE_CHECKING
...
...
tests/distributed/test_pynccl.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
import
multiprocessing
import
multiprocessing
import
os
import
os
...
...
tests/distributed/test_same_node.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
import
os
import
os
...
...
tests/distributed/test_sequence_parallel.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
"""
"""
WARNING: This test runs in both single-node (4 GPUs) and multi-node
WARNING: This test runs in both single-node (4 GPUs) and multi-node
(2 node with 2 GPUs each) modes. If the test only uses 2 GPUs, it is
(2 node with 2 GPUs each) modes. If the test only uses 2 GPUs, it is
...
...
tests/distributed/test_shm_broadcast.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
import
multiprocessing
import
multiprocessing
import
random
import
random
...
...
tests/distributed/test_torchrun_example.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
# unit test for `examples/offline_inference/torchrun_example.py`
# unit test for `examples/offline_inference/torchrun_example.py`
import
os
import
os
...
...
tests/distributed/test_utils.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
import
socket
import
socket
...
...
tests/encoder_decoder/test_e2e_correctness.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
"""E2E tests to verify the correctness of the encoder-decoder framework
"""E2E tests to verify the correctness of the encoder-decoder framework
Run `pytest tests/encoder_decoder/test_e2e_correctness.py`.
Run `pytest tests/encoder_decoder/test_e2e_correctness.py`.
...
...
tests/engine/conftest.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
import
pytest
import
pytest
...
...
tests/engine/test_arg_utils.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
import
json
import
json
from
argparse
import
ArgumentError
,
ArgumentTypeError
from
argparse
import
ArgumentError
,
ArgumentTypeError
from
contextlib
import
nullcontext
from
contextlib
import
nullcontext
from
dataclasses
import
dataclass
,
field
from
dataclasses
import
dataclass
,
field
from
typing
import
Literal
,
Optional
from
typing
import
Annotated
,
Literal
,
Optional
import
pytest
import
pytest
from
vllm.config
import
CompilationConfig
,
config
from
vllm.config
import
CompilationConfig
,
config
from
vllm.engine.arg_utils
import
(
EngineArgs
,
contains_type
,
get_kwargs
,
from
vllm.engine.arg_utils
import
(
EngineArgs
,
contains_type
,
get_kwargs
,
get_type
,
is_not_builtin
,
is_type
,
get_type
,
get_type_hints
,
is_not_builtin
,
literal_to_kwargs
,
nullable_kvs
,
is_type
,
literal_to_kwargs
,
nullable_kvs
,
optional_type
,
parse_type
)
optional_type
,
parse_type
)
from
vllm.utils
import
FlexibleArgumentParser
from
vllm.utils
import
FlexibleArgumentParser
...
@@ -159,6 +160,18 @@ def test_is_not_builtin(type_hint, expected):
...
@@ -159,6 +160,18 @@ def test_is_not_builtin(type_hint, expected):
assert
is_not_builtin
(
type_hint
)
==
expected
assert
is_not_builtin
(
type_hint
)
==
expected
@
pytest
.
mark
.
parametrize
(
(
"type_hint"
,
"expected"
),
[
(
Annotated
[
int
,
"annotation"
],
{
int
}),
(
Optional
[
int
],
{
int
,
type
(
None
)}),
(
Annotated
[
Optional
[
int
],
"annotation"
],
{
int
,
type
(
None
)}),
(
Optional
[
Annotated
[
int
,
"annotation"
]],
{
int
,
type
(
None
)}),
],
ids
=
[
"Annotated"
,
"Optional"
,
"Annotated_Optional"
,
"Optional_Annotated"
])
def
test_get_type_hints
(
type_hint
,
expected
):
assert
get_type_hints
(
type_hint
)
==
expected
def
test_get_kwargs
():
def
test_get_kwargs
():
kwargs
=
get_kwargs
(
DummyConfig
)
kwargs
=
get_kwargs
(
DummyConfig
)
print
(
kwargs
)
print
(
kwargs
)
...
...
tests/engine/test_computed_prefix_blocks.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
import
pytest
import
pytest
...
...
tests/engine/test_executor.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
import
asyncio
import
asyncio
import
os
import
os
...
...
tests/engine/test_multi_step_output_processor.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
import
random
import
random
from
unittest.mock
import
MagicMock
from
unittest.mock
import
MagicMock
...
...
tests/engine/test_multiproc_workers.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
import
asyncio
import
asyncio
from
concurrent.futures
import
ThreadPoolExecutor
from
concurrent.futures
import
ThreadPoolExecutor
...
...
tests/engine/test_options.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
from
contextlib
import
nullcontext
from
contextlib
import
nullcontext
import
pytest
import
pytest
...
...
tests/engine/test_short_mm_context.py
View file @
cc7f22a8
# SPDX-License-Identifier: Apache-2.0
# SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project
import
pytest
import
pytest
...
...
Prev
1
…
12
13
14
15
16
17
18
19
20
…
50
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment