Commit e5fc1b17 authored by zhuwenwen
Browse files

Merge branch 'v0.11.0-dev_scheduler' into 'v0.11.0-dev'

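修复 schedule_default、schedule_split_pd 因 KV cache 耗尽导致服务挂掉的问题 (Fix the service crash in schedule_default and schedule_split_pd caused by KV cache exhaustion.)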

See merge request dcutoolkit/deeplearing/vllm!266
parents 4e8af7e8 c833e64e
...@@ -344,7 +344,9 @@ class Scheduler(SchedulerInterface): ...@@ -344,7 +344,9 @@ class Scheduler(SchedulerInterface):
break break
request = self.waiting.peek_request() request = self.waiting.peek_request()
if request.is_finished():
self.waiting.pop_request()
continue
# KVTransfer: skip request if still waiting for remote kvs. # KVTransfer: skip request if still waiting for remote kvs.
if request.status == RequestStatus.WAITING_FOR_REMOTE_KVS: if request.status == RequestStatus.WAITING_FOR_REMOTE_KVS:
is_ready = self._update_waiting_for_remote_kv(request) is_ready = self._update_waiting_for_remote_kv(request)
...@@ -672,7 +674,9 @@ class Scheduler(SchedulerInterface): ...@@ -672,7 +674,9 @@ class Scheduler(SchedulerInterface):
break break
request = self.waiting.peek_request() request = self.waiting.peek_request()
if request.is_finished():
self.waiting.pop_request()
continue
# KVTransfer: skip request if still waiting for remote kvs. # KVTransfer: skip request if still waiting for remote kvs.
if request.status == RequestStatus.WAITING_FOR_REMOTE_KVS: if request.status == RequestStatus.WAITING_FOR_REMOTE_KVS:
is_ready = self._update_waiting_for_remote_kv(request) is_ready = self._update_waiting_for_remote_kv(request)
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment