Unverified commit 67a746e8, authored by Wentao Ye, committed by GitHub
Browse files

[Log] Optimize duplicate startup log (#33944)


Signed-off-by: yewentao256 <zhyanwentao@126.com>
parent 7bec4351
......@@ -263,11 +263,12 @@ class CompilerManager:
now = time.time()
elapsed = now - compilation_start_time
compilation_config.compilation_time += elapsed
logger.info(
logger.info_once(
"Directly load the compiled graph(s) for compile range %s "
"from the cache, took %.3f s",
str(compile_range),
elapsed,
scope="local",
)
return compiled_graph
......
......@@ -91,14 +91,16 @@ def is_deep_gemm_e8m0_used() -> bool:
_lazy_init()
if _fp8_gemm_nt_impl is None:
logger.info_once("DeepGEMM E8M0 disabled: _fp8_gemm_nt_impl not found")
logger.info_once(
"DeepGEMM E8M0 disabled: _fp8_gemm_nt_impl not found", scope="local"
)
return False
if envs.VLLM_USE_DEEP_GEMM_E8M0:
logger.info_once("DeepGEMM E8M0 enabled on current platform.")
logger.info_once("DeepGEMM E8M0 enabled on current platform.", scope="local")
return True
logger.info_once("DeepGEMM E8M0 disabled on current configuration.")
logger.info_once("DeepGEMM E8M0 disabled on current configuration.", scope="local")
return False
......
......@@ -119,9 +119,6 @@ class Worker(WorkerBase):
self.use_v2_model_runner = envs.VLLM_USE_V2_MODEL_RUNNER
if self.use_v2_model_runner:
logger.info_once("Using V2 Model Runner", scope="global")
def sleep(self, level: int = 1) -> None:
from vllm.device_allocator.cumem import CuMemAllocator
......@@ -240,6 +237,9 @@ class Worker(WorkerBase):
current_platform.dist_backend,
)
if self.use_v2_model_runner:
logger.info_once("Using V2 Model Runner", scope="local")
# Set random seed.
set_random_seed(self.model_config.seed)
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment