Commit 98b8b3ab (unverified), authored by Ning Xie, committed by GitHub
Browse files

[log] enable max_log_len trim only when needed (#31482)


Signed-off-by: Andy Xie <andy.xning@gmail.com>
parent 346e5645
# SPDX-License-Identifier: Apache-2.0 # SPDX-License-Identifier: Apache-2.0
# SPDX-FileCopyrightText: Copyright contributors to the vLLM project # SPDX-FileCopyrightText: Copyright contributors to the vLLM project
import logging
from collections.abc import Sequence from collections.abc import Sequence
import torch import torch
...@@ -26,23 +27,24 @@ class RequestLogger: ...@@ -26,23 +27,24 @@ class RequestLogger:
params: SamplingParams | PoolingParams | BeamSearchParams | None, params: SamplingParams | PoolingParams | BeamSearchParams | None,
lora_request: LoRARequest | None, lora_request: LoRARequest | None,
) -> None: ) -> None:
max_log_len = self.max_log_len if logger.isEnabledFor(logging.DEBUG):
if max_log_len is not None: max_log_len = self.max_log_len
if prompt is not None: if max_log_len is not None:
prompt = prompt[:max_log_len] if prompt is not None:
prompt = prompt[:max_log_len]
if prompt_token_ids is not None: if prompt_token_ids is not None:
prompt_token_ids = prompt_token_ids[:max_log_len] prompt_token_ids = prompt_token_ids[:max_log_len]
logger.debug( logger.debug(
"Request %s details: prompt: %r, " "Request %s details: prompt: %r, "
"prompt_token_ids: %s, " "prompt_token_ids: %s, "
"prompt_embeds shape: %s.", "prompt_embeds shape: %s.",
request_id, request_id,
prompt, prompt,
prompt_token_ids, prompt_token_ids,
prompt_embeds.shape if prompt_embeds is not None else None, prompt_embeds.shape if prompt_embeds is not None else None,
) )
logger.info( logger.info(
"Received request %s: params: %s, lora_request: %s.", "Received request %s: params: %s, lora_request: %s.",
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment