[UX] Bump version in CG memory profiling log message (#40465)

Signed-off-by: Matthew Bonanni <mbonanni@redhat.com>

[UX] Bump version in CG memory profiling log message (#40465)
Signed-off-by: Matthew Bonanni <mbonanni@redhat.com>
ab5666eb · Matthew Bonanni · GitHub · f819265a · ab5666eb
Unverified commit ab5666eb, authored Apr 21, 2026 by Matthew Bonanni; committed by GitHub on Apr 21, 2026
Hide whitespace changes
Inline Side-by-side

Showing 1 changed file with 2 additions and 2 deletions

vllm/v1/worker/gpu_worker.py vllm/v1/worker/gpu_worker.py +2 -2

No files found.
--- a/vllm/v1/worker/gpu_worker.py
+++ b/vllm/v1/worker/gpu_worker.py
@@ -456,7 +456,7 @@ class Worker(WorkerBase):
                logger.info(
                    "CUDA graph memory profiling is enabled "
                    "(VLLM_MEMORY_PROFILER_ESTIMATE_CUDAGRAPHS=1). "
-                    "This will become the default in v0.19. "
+                    "This will become the default in v0.21. "
                    "The current --gpu-memory-utilization=%.4f is equivalent "
                    "to --gpu-memory-utilization=%.4f without CUDA graph "
                    "memory profiling. To maintain the same effective KV "
@@ -472,7 +472,7 @@ class Worker(WorkerBase):
                    1.0,
                )
                logger.info(
-                    "In v0.19, CUDA graph memory profiling will be enabled "
+                    "In v0.21, CUDA graph memory profiling will be enabled "
                    "by default (VLLM_MEMORY_PROFILER_ESTIMATE_CUDAGRAPHS=1), "
                    "which more accurately accounts for CUDA graph memory "
                    "during KV cache allocation. To try it now, set "