Unverified commit 74670964, authored by Rui Qiao and committed by GitHub
Browse files

[Misc] Fix typos in scheduler.py (#7285)


Signed-off-by: Rui Qiao <ruisearch42@gmail.com>
parent e53dfd3e
......@@ -678,7 +678,7 @@ class Scheduler:
all tokens.
Returns:
SchedulerSwappedInOutputs.
SchedulerPrefillOutputs.
"""
ignored_seq_groups: List[SequenceGroup] = []
seq_groups: List[SequenceGroup] = []
......@@ -851,7 +851,7 @@ class Scheduler:
preempted=preempted,
)
def _schedule_chunked_prefill(self):
def _schedule_chunked_prefill(self) -> SchedulerOutputs:
"""Schedule queued requests.
Chunked prefill allows to chunk prefill requests, batch them together
......@@ -862,7 +862,7 @@ class Scheduler:
The policy can sustain the high GPU utilization because it can put
prefill and decodes requests to the same batch, while it improves
inter token latency because decodes requests don't need to blocked
inter token latency because decodes requests don't need to be blocked
by prefill requests.
"""
budget = SchedulingBudget(
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment