Unverified commit 5f98e91e, authored by Richard Huo and committed by GitHub
Browse files

test: fix KV Router and KVBM tests in CI (#3848)

parent 4e496691
...@@ -223,8 +223,10 @@ class LLMServerManager: ...@@ -223,8 +223,10 @@ class LLMServerManager:
) )
print(f"Decoder process started with PID: {self.process_decoder.pid}") print(f"Decoder process started with PID: {self.process_decoder.pid}")
# Give decoder time to start up # The prefiller and decoder cannot download the model simultaneously,
time.sleep(5) # because the Hugging Face rust library (invoked by fetch_llm) needs to hold an exclusive lock on the model files.
print("Sleeping for 60 seconds to allow the decoder to download the model. ")
time.sleep(60)
# Launch prefiller # Launch prefiller
self.process_prefiller = subprocess.Popen( self.process_prefiller = subprocess.Popen(
......
...@@ -71,7 +71,7 @@ sglang_configs = { ...@@ -71,7 +71,7 @@ sglang_configs = {
request_payloads=[ request_payloads=[
chat_payload_default( chat_payload_default(
expected_log=[ expected_log=[
r"ZMQ listener .* received batch with \d+ events \(seq=\d+\)", r"ZMQ listener .* received batch with \d+ events \(seq=\d+(?:, [^)]*)?\)",
r"Event processor for worker_id \d+ processing event: Stored\(", r"Event processor for worker_id \d+ processing event: Stored\(",
r"Selected worker: worker_id=\d+ dp_rank=.*?, logit: ", r"Selected worker: worker_id=\d+ dp_rank=.*?, logit: ",
] ]
......
...@@ -51,7 +51,7 @@ vllm_configs = { ...@@ -51,7 +51,7 @@ vllm_configs = {
request_payloads=[ request_payloads=[
chat_payload_default( chat_payload_default(
expected_log=[ expected_log=[
r"ZMQ listener .* received batch with \d+ events \(seq=\d+\)", r"ZMQ listener .* received batch with \d+ events \(seq=\d+(?:, [^)]*)?\)",
r"Event processor for worker_id \d+ processing event: Stored\(", r"Event processor for worker_id \d+ processing event: Stored\(",
r"Selected worker: worker_id=\d+ dp_rank=.*?, logit: ", r"Selected worker: worker_id=\d+ dp_rank=.*?, logit: ",
] ]
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment