Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
c42dc402
Unverified
Commit
c42dc402
Authored Mar 02, 2026 by Boyuan Feng
Committed by GitHub on Mar 02, 2026
Browse files
clean unused cudagraph_batch_sizes (#35552)
Signed-off-by: Boyuan Feng <boyuan@meta.com>
parent
fa6a6be5
Changes
1
Show whitespace changes
Inline
Side-by-side
Showing 1 changed file with 0 additions and 13 deletions
+0
-13
vllm/v1/worker/gpu_model_runner.py
vllm/v1/worker/gpu_model_runner.py
+0
-13
No files found.
vllm/v1/worker/gpu_model_runner.py
View file @
c42dc402
...
@@ -597,15 +597,6 @@ class GPUModelRunner(
...
@@ -597,15 +597,6 @@ class GPUModelRunner(
self
.
async_output_copy_stream
=
torch
.
cuda
.
Stream
()
self
.
async_output_copy_stream
=
torch
.
cuda
.
Stream
()
self
.
prepare_inputs_event
=
torch
.
Event
()
self
.
prepare_inputs_event
=
torch
.
Event
()
# self.cudagraph_batch_sizes sorts in ascending order.
if
(
self
.
compilation_config
.
cudagraph_capture_sizes
and
self
.
compilation_config
.
cudagraph_mode
!=
CUDAGraphMode
.
NONE
):
self
.
cudagraph_batch_sizes
=
sorted
(
self
.
compilation_config
.
cudagraph_capture_sizes
)
# Cache the device properties.
# Cache the device properties.
self
.
_init_device_properties
()
self
.
_init_device_properties
()
...
@@ -5705,10 +5696,6 @@ class GPUModelRunner(
...
@@ -5705,10 +5696,6 @@ class GPUModelRunner(
self
.
compilation_config
.
adjust_cudagraph_sizes_for_spec_decode
(
self
.
compilation_config
.
adjust_cudagraph_sizes_for_spec_decode
(
self
.
uniform_decode_query_len
,
self
.
parallel_config
.
tensor_parallel_size
self
.
uniform_decode_query_len
,
self
.
parallel_config
.
tensor_parallel_size
)
)
capture_sizes
=
self
.
compilation_config
.
cudagraph_capture_sizes
self
.
cudagraph_batch_sizes
=
(
capture_sizes
if
capture_sizes
is
not
None
else
[]
)
# Trigger cudagraph dispatching keys initialization after
# Trigger cudagraph dispatching keys initialization after
# resolved cudagraph mode.
# resolved cudagraph mode.
...
...
Write
Preview
Markdown is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please register or sign in to comment.