"tests/vscode:/vscode.git/clone" did not exist on "7bdc16197f7fe7890fc2b91d020744a82a024984"
Unverified Commit dd83e7e9 authored by ybyang's avatar ybyang Committed by GitHub
Browse files

[Bug fix] Need to record start time in PD mode (#5425)

parent 0769b14b
...@@ -959,14 +959,12 @@ class Scheduler( ...@@ -959,14 +959,12 @@ class Scheduler(
self._add_request_to_queue(req) self._add_request_to_queue(req)
def _add_request_to_queue(self, req: Req): def _add_request_to_queue(self, req: Req):
req.queue_time_start = time.time()
if self.disaggregation_mode == DisaggregationMode.PREFILL: if self.disaggregation_mode == DisaggregationMode.PREFILL:
self.disagg_prefill_pending_queue.add(req) self.disagg_prefill_pending_queue.add(req)
elif self.disaggregation_mode == DisaggregationMode.DECODE: elif self.disaggregation_mode == DisaggregationMode.DECODE:
self.disagg_decode_prealloc_queue.add(req) self.disagg_decode_prealloc_queue.add(req)
else: else:
req.queue_time_start = time.time()
self.waiting_queue.append(req) self.waiting_queue.append(req)
def _extend_requests_to_queue(self, reqs: List[Req], is_retracted: bool = False): def _extend_requests_to_queue(self, reqs: List[Req], is_retracted: bool = False):
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment