[Misc] improve logits processors logging message (#7435)

97a6be95 · Andrew Wang · GitHub · 9ba85bc1 · 97a6be95 · 97a6be95
Unverified commit 97a6be95, authored Aug 12, 2024 by Andrew Wang; committed by GitHub on Aug 13, 2024
Showing 2 changed files with 1 addition and 2 deletions

tests/entrypoints/openai/test_serving_chat.py +0 -1

vllm/entrypoints/openai/logits_processors.py +1 -1

No files found.
--- a/tests/entrypoints/openai/test_serving_chat.py
+++ b/tests/entrypoints/openai/test_serving_chat.py
@@ -73,7 +73,6 @@ def test_serving_chat_should_set_correct_max_tokens():
    with suppress(Exception):
        asyncio.run(serving_chat.create_chat_completion(req))
-    # AsyncLLMEngine.generate(inputs, sampling_params, ...)
    assert mock_engine.generate.call_args.args[1].max_tokens == 93
    req.max_tokens = 10

--- a/vllm/entrypoints/openai/logits_processors.py
+++ b/vllm/entrypoints/openai/logits_processors.py
@@ -71,7 +71,7 @@ def get_logits_processors(
        # Check if token_id is within the vocab size
        for token_id, bias in clamped_logit_bias.items():
            if token_id < 0 or token_id >= tokenizer.vocab_size:
-                raise ValueError("token_id in logit_bias contains "
+                raise ValueError(f"token_id {token_id} in logit_bias contains "
                                 "out-of-vocab token id")
        logits_processors.append(