Unverified commit 93be7e86, authored by ishandhanani and committed by GitHub
Browse files

fix: respect `--ignore-eos` in PD case for benchmarking (#12597)

parent 60b0754c
@@ -774,9 +774,9 @@ class DecodeTransferQueue:
             decode_req.req.time_stats.wait_queue_entry_time = time.perf_counter()
             # special handling for corner cases
-            should_finish = (
-                decode_req.req.sampling_params.max_new_tokens == 1
-                or decode_req.req.output_ids[-1] in decode_req.req.eos_token_ids
-            )
+            should_finish = decode_req.req.sampling_params.max_new_tokens == 1 or (
+                not decode_req.req.sampling_params.ignore_eos
+                and decode_req.req.output_ids[-1] in decode_req.req.eos_token_ids
+            )
             if should_finish:
                 # finish immediately
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment