Unverified commit a873045c, authored by weireweire, committed by GitHub
Browse files

fix: use dict sampling params in prefill warmup (#7797)


Co-authored-by: Weiliangl User <weiliangl@login-node.hosted.internal>
parent 91a8c6af
...@@ -29,13 +29,12 @@ async def _warmup_prefill_engine(engine: sgl.Engine, server_args) -> None: ...@@ -29,13 +29,12 @@ async def _warmup_prefill_engine(engine: sgl.Engine, server_args) -> None:
logging.info("Start of prefill disaggregation warmup ...") logging.info("Start of prefill disaggregation warmup ...")
try: try:
from sglang.srt.disaggregation.utils import FAKE_BOOTSTRAP_HOST from sglang.srt.disaggregation.utils import FAKE_BOOTSTRAP_HOST
from sglang.srt.sampling.sampling_params import SamplingParams
sampling_params = SamplingParams( sampling_params = {
temperature=0.0, "temperature": 0.0,
max_new_tokens=8, "max_new_tokens": 8,
ignore_eos=True, "ignore_eos": True,
) }
async def _do_warmup(): async def _do_warmup():
results = await engine.async_generate( results = await engine.async_generate(
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment