Unverified Commit b89d37cb authored by Baron Liu's avatar Baron Liu Committed by GitHub
Browse files

[bugfix] Add 'disaggregation_mode' parameter to warmup function when compile...

[bugfix] Add 'disaggregation_mode' parameter to warmup function when compile deep_gemm manually (#8618)
parent 5deab128
......@@ -17,6 +17,7 @@ import time
import requests
from sglang.srt.disaggregation.utils import FAKE_BOOTSTRAP_HOST
from sglang.srt.entrypoints.http_server import launch_server
from sglang.srt.managers.io_struct import GenerateReqInput
from sglang.srt.managers.tokenizer_manager import TokenizerManager
......@@ -52,7 +53,9 @@ class CompileArgs:
@warmup("compile-deep-gemm")
async def warm_up_compile(tokenizer_manager: TokenizerManager):
async def warm_up_compile(
disaggregation_mode: str, tokenizer_manager: TokenizerManager
):
print("\nGenerate warm up request for compiling DeepGEMM...\n")
generate_req_input = GenerateReqInput(
input_ids=[0, 1, 2, 3],
......@@ -62,6 +65,10 @@ async def warm_up_compile(tokenizer_manager: TokenizerManager):
"ignore_eos": True,
},
)
if disaggregation_mode != "null":
generate_req_input.bootstrap_room = 0
generate_req_input.bootstrap_host = FAKE_BOOTSTRAP_HOST
await tokenizer_manager.generate_request(generate_req_input, None).__anext__()
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment