Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
792a74b9
Unverified
Commit
792a74b9
authored
Mar 03, 2026
by
Cyrus Leung
Committed by
GitHub
Mar 02, 2026
Browse files
[Doc] Improve UX of `--enable-log-requests` (#35723)
Signed-off-by:
DarkLight1337
<
tlleungac@connect.ust.hk
>
parent
4034c3d3
Changes
5
Show whitespace changes
Inline
Side-by-side
Showing
5 changed files
with
21 additions
and
11 deletions
+21
-11
benchmarks/auto_tune/auto_tune.sh
benchmarks/auto_tune/auto_tune.sh
+0
-1
benchmarks/multi_turn/README.md
benchmarks/multi_turn/README.md
+1
-1
vllm/engine/arg_utils.py
vllm/engine/arg_utils.py
+4
-8
vllm/entrypoints/logger.py
vllm/entrypoints/logger.py
+14
-0
vllm/entrypoints/openai/cli_args.py
vllm/entrypoints/openai/cli_args.py
+2
-1
No files found.
benchmarks/auto_tune/auto_tune.sh
View file @
792a74b9
...
@@ -85,7 +85,6 @@ start_server() {
...
@@ -85,7 +85,6 @@ start_server() {
# Each argument and its value are separate elements.
# Each argument and its value are separate elements.
local
common_args_array
=(
local
common_args_array
=(
"
$MODEL
"
"
$MODEL
"
"--disable-log-requests"
"--port"
"8004"
"--port"
"8004"
"--host"
"
$HOSTNAME
"
"--host"
"
$HOSTNAME
"
"--gpu-memory-utilization"
"
$gpu_memory_utilization
"
"--gpu-memory-utilization"
"
$gpu_memory_utilization
"
...
...
benchmarks/multi_turn/README.md
View file @
792a74b9
...
@@ -7,7 +7,7 @@ First start serving your model
...
@@ -7,7 +7,7 @@ First start serving your model
```
bash
```
bash
export
MODEL_PATH
=
/models/meta-llama/Meta-Llama-3.1-8B-Instruct/
export
MODEL_PATH
=
/models/meta-llama/Meta-Llama-3.1-8B-Instruct/
vllm serve
$MODEL_PATH
--served-model-name
Llama
--disable-log-requests
vllm serve
$MODEL_PATH
--served-model-name
Llama
```
```
The variable
`MODEL_PATH`
should be a path to the model files (e.g. downloaded from huggingface).
The variable
`MODEL_PATH`
should be a path to the model files (e.g. downloaded from huggingface).
...
...
vllm/engine/arg_utils.py
View file @
792a74b9
...
@@ -2187,14 +2187,10 @@ class AsyncEngineArgs(EngineArgs):
...
@@ -2187,14 +2187,10 @@ class AsyncEngineArgs(EngineArgs):
"--enable-log-requests"
,
"--enable-log-requests"
,
action
=
argparse
.
BooleanOptionalAction
,
action
=
argparse
.
BooleanOptionalAction
,
default
=
AsyncEngineArgs
.
enable_log_requests
,
default
=
AsyncEngineArgs
.
enable_log_requests
,
help
=
"Enable logging requests."
,
help
=
"Enable logging request information, dependent on log level:
\n
"
)
"- INFO: Request ID, parameters and LoRA request.
\n
"
parser
.
add_argument
(
"- DEBUG: Prompt inputs (e.g., text, token IDs).
\n
"
"--disable-log-requests"
,
"You can set the minimum log level via `VLLM_LOGGING_LEVEL`."
,
action
=
argparse
.
BooleanOptionalAction
,
default
=
not
AsyncEngineArgs
.
enable_log_requests
,
help
=
"[DEPRECATED] Disable logging requests."
,
deprecated
=
True
,
)
)
current_platform
.
pre_register_and_update
(
parser
)
current_platform
.
pre_register_and_update
(
parser
)
return
parser
return
parser
...
...
vllm/entrypoints/logger.py
View file @
792a74b9
...
@@ -18,6 +18,20 @@ class RequestLogger:
...
@@ -18,6 +18,20 @@ class RequestLogger:
def
__init__
(
self
,
*
,
max_log_len
:
int
|
None
)
->
None
:
def
__init__
(
self
,
*
,
max_log_len
:
int
|
None
)
->
None
:
self
.
max_log_len
=
max_log_len
self
.
max_log_len
=
max_log_len
if
not
logger
.
isEnabledFor
(
logging
.
INFO
):
logger
.
warning_once
(
"`--enable-log-requests` is set but "
"the minimum log level is higher than INFO. "
"No request information will be logged."
)
elif
not
logger
.
isEnabledFor
(
logging
.
DEBUG
):
logger
.
info_once
(
"`--enable-log-requests` is set but "
"the minimum log level is higher than DEBUG. "
"Only limited information will be logged to minimize overhead. "
"To view more details, set `VLLM_LOGGING_LEVEL=DEBUG`."
)
def
log_inputs
(
def
log_inputs
(
self
,
self
,
request_id
:
str
,
request_id
:
str
,
...
...
vllm/entrypoints/openai/cli_args.py
View file @
792a74b9
...
@@ -143,7 +143,8 @@ class BaseFrontendArgs:
...
@@ -143,7 +143,8 @@ class BaseFrontendArgs:
templates and other tokenizer configuration."""
templates and other tokenizer configuration."""
enable_log_outputs
:
bool
=
False
enable_log_outputs
:
bool
=
False
"""If set to True, log model outputs (generations).
"""If set to True, log model outputs (generations).
Requires --enable-log-requests."""
Requires `--enable-log-requests`. As with `--enable-log-requests`,
information is only logged at INFO level at maximum."""
enable_log_deltas
:
bool
=
True
enable_log_deltas
:
bool
=
True
"""If set to False, output deltas will not be logged. Relevant only if
"""If set to False, output deltas will not be logged. Relevant only if
--enable-log-outputs is set.
--enable-log-outputs is set.
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment