Commit 67a746e8 (unverified) authored by Wentao Ye, committed by GitHub
Browse files

[Log] Optimize duplicate startup log (#33944)


Signed-off-by: yewentao256 <zhyanwentao@126.com>
parent 7bec4351
...@@ -263,11 +263,12 @@ class CompilerManager: ...@@ -263,11 +263,12 @@ class CompilerManager:
now = time.time() now = time.time()
elapsed = now - compilation_start_time elapsed = now - compilation_start_time
compilation_config.compilation_time += elapsed compilation_config.compilation_time += elapsed
logger.info( logger.info_once(
"Directly load the compiled graph(s) for compile range %s " "Directly load the compiled graph(s) for compile range %s "
"from the cache, took %.3f s", "from the cache, took %.3f s",
str(compile_range), str(compile_range),
elapsed, elapsed,
scope="local",
) )
return compiled_graph return compiled_graph
......
...@@ -91,14 +91,16 @@ def is_deep_gemm_e8m0_used() -> bool: ...@@ -91,14 +91,16 @@ def is_deep_gemm_e8m0_used() -> bool:
_lazy_init() _lazy_init()
if _fp8_gemm_nt_impl is None: if _fp8_gemm_nt_impl is None:
logger.info_once("DeepGEMM E8M0 disabled: _fp8_gemm_nt_impl not found") logger.info_once(
"DeepGEMM E8M0 disabled: _fp8_gemm_nt_impl not found", scope="local"
)
return False return False
if envs.VLLM_USE_DEEP_GEMM_E8M0: if envs.VLLM_USE_DEEP_GEMM_E8M0:
logger.info_once("DeepGEMM E8M0 enabled on current platform.") logger.info_once("DeepGEMM E8M0 enabled on current platform.", scope="local")
return True return True
logger.info_once("DeepGEMM E8M0 disabled on current configuration.") logger.info_once("DeepGEMM E8M0 disabled on current configuration.", scope="local")
return False return False
......
...@@ -119,9 +119,6 @@ class Worker(WorkerBase): ...@@ -119,9 +119,6 @@ class Worker(WorkerBase):
self.use_v2_model_runner = envs.VLLM_USE_V2_MODEL_RUNNER self.use_v2_model_runner = envs.VLLM_USE_V2_MODEL_RUNNER
if self.use_v2_model_runner:
logger.info_once("Using V2 Model Runner", scope="global")
def sleep(self, level: int = 1) -> None: def sleep(self, level: int = 1) -> None:
from vllm.device_allocator.cumem import CuMemAllocator from vllm.device_allocator.cumem import CuMemAllocator
...@@ -240,6 +237,9 @@ class Worker(WorkerBase): ...@@ -240,6 +237,9 @@ class Worker(WorkerBase):
current_platform.dist_backend, current_platform.dist_backend,
) )
if self.use_v2_model_runner:
logger.info_once("Using V2 Model Runner", scope="local")
# Set random seed. # Set random seed.
set_random_seed(self.model_config.seed) set_random_seed(self.model_config.seed)
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment