"vscode:/vscode.git/clone" did not exist on "29d1ffc5b4c763ef76aff9e3f617fa60dd292418"
Unverified commit a1d82466, authored by Ifta khairul Alam Adil and committed by GitHub
Browse files

[Docs] Remove outdated async_scheduling limitation with speculative decoding (#32775)


Signed-off-by: Ifta Khairul Alam Adil <ikaadil007@gmail.com>
Signed-off-by: Ifta khairul Alam Adil <25082512+ikaadil@users.noreply.github.com>
parent 24a163ed
......@@ -133,9 +133,6 @@ class SchedulerConfig:
async_scheduling: bool = Field(default=None)
"""If set to False, disable async scheduling. Async scheduling helps to
avoid gaps in GPU utilization, leading to better latency and throughput.
It is currently not supported with some features such as
speculative decoding and pipeline parallelism, and will be automatically
disabled in those cases.
"""
stream_interval: int = Field(default=1, ge=1)
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment