Unverified commit 2f0d3ba7, authored by Woosuk Kwon and committed by GitHub
Browse files

[Model Runner V2] Minor simplification for finish_requests (#33048)


Signed-off-by: Woosuk Kwon <woosuk@inferact.ai>
parent edf927bc
...@@ -416,13 +416,12 @@ class GPUModelRunner(LoRAModelRunnerMixin): ...@@ -416,13 +416,12 @@ class GPUModelRunner(LoRAModelRunnerMixin):
torch.cuda.synchronize() torch.cuda.synchronize()
def finish_requests(self, scheduler_output: SchedulerOutput) -> None: def finish_requests(self, scheduler_output: SchedulerOutput) -> None:
if scheduler_output.preempted_req_ids is not None: finished_req_ids = scheduler_output.finished_req_ids
for req_id in scheduler_output.preempted_req_ids: if scheduler_output.preempted_req_ids:
self.req_states.remove_request(req_id) finished_req_ids = finished_req_ids.union(
if self.supports_mm_inputs: scheduler_output.preempted_req_ids
self.encoder_runner.remove_request(req_id) )
self.prompt_logprobs_worker.remove_request(req_id) for req_id in finished_req_ids:
for req_id in scheduler_output.finished_req_ids:
self.req_states.remove_request(req_id) self.req_states.remove_request(req_id)
if self.supports_mm_inputs: if self.supports_mm_inputs:
self.encoder_runner.remove_request(req_id) self.encoder_runner.remove_request(req_id)
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment