Unverified Commit c42dc402 authored by Boyuan Feng, committed by GitHub
Browse files

clean unused cudagraph_batch_sizes (#35552)


Signed-off-by: Boyuan Feng <boyuan@meta.com>
parent fa6a6be5
...@@ -597,15 +597,6 @@ class GPUModelRunner( ...@@ -597,15 +597,6 @@ class GPUModelRunner(
self.async_output_copy_stream = torch.cuda.Stream() self.async_output_copy_stream = torch.cuda.Stream()
self.prepare_inputs_event = torch.Event() self.prepare_inputs_event = torch.Event()
# self.cudagraph_batch_sizes sorts in ascending order.
if (
self.compilation_config.cudagraph_capture_sizes
and self.compilation_config.cudagraph_mode != CUDAGraphMode.NONE
):
self.cudagraph_batch_sizes = sorted(
self.compilation_config.cudagraph_capture_sizes
)
# Cache the device properties. # Cache the device properties.
self._init_device_properties() self._init_device_properties()
...@@ -5705,10 +5696,6 @@ class GPUModelRunner( ...@@ -5705,10 +5696,6 @@ class GPUModelRunner(
self.compilation_config.adjust_cudagraph_sizes_for_spec_decode( self.compilation_config.adjust_cudagraph_sizes_for_spec_decode(
self.uniform_decode_query_len, self.parallel_config.tensor_parallel_size self.uniform_decode_query_len, self.parallel_config.tensor_parallel_size
) )
capture_sizes = self.compilation_config.cudagraph_capture_sizes
self.cudagraph_batch_sizes = (
capture_sizes if capture_sizes is not None else []
)
# Trigger cudagraph dispatching keys initialization after # Trigger cudagraph dispatching keys initialization after
# resolved cudagraph mode. # resolved cudagraph mode.
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment