Unverified Commit 97a6be95 authored by Andrew Wang's avatar Andrew Wang Committed by GitHub
Browse files

[Misc] improve logits processors logging message (#7435)

parent 9ba85bc1
...@@ -73,7 +73,6 @@ def test_serving_chat_should_set_correct_max_tokens(): ...@@ -73,7 +73,6 @@ def test_serving_chat_should_set_correct_max_tokens():
with suppress(Exception): with suppress(Exception):
asyncio.run(serving_chat.create_chat_completion(req)) asyncio.run(serving_chat.create_chat_completion(req))
# AsyncLLMEngine.generate(inputs, sampling_params, ...)
assert mock_engine.generate.call_args.args[1].max_tokens == 93 assert mock_engine.generate.call_args.args[1].max_tokens == 93
req.max_tokens = 10 req.max_tokens = 10
......
...@@ -71,7 +71,7 @@ def get_logits_processors( ...@@ -71,7 +71,7 @@ def get_logits_processors(
# Check if token_id is within the vocab size # Check if token_id is within the vocab size
for token_id, bias in clamped_logit_bias.items(): for token_id, bias in clamped_logit_bias.items():
if token_id < 0 or token_id >= tokenizer.vocab_size: if token_id < 0 or token_id >= tokenizer.vocab_size:
raise ValueError("token_id in logit_bias contains " raise ValueError(f"token_id {token_id} in logit_bias contains "
"out-of-vocab token id") "out-of-vocab token id")
logits_processors.append( logits_processors.append(
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment