Commit 4e8af7e8 authored by zhuwenwen
Browse files

根据不同场景,更新默认调度和分离调度的选择

parent acf9f945
@@ -1084,10 +1084,15 @@ class Scheduler(SchedulerInterface):
         return scheduler_output
     def schedule(self) -> SchedulerOutput:
-        if (self.full_cuda_graph and self.use_mla and self.num_spec_tokens > 0) or envs.VLLM_USE_PD_SPLIT:
+        if envs.VLLM_USE_PD_SPLIT:
             return self.schedule_split_pd()
         else:
-            return self.schedule_default()
+            if self.connector is not None:
+                return self.schedule_default()
+            if self.full_cuda_graph and self.use_mla and self.num_spec_tokens > 0 :
+                return self.schedule_split_pd()
+            else:
+                return self.schedule_default()
     def _update_after_schedule(
         self,
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment