Unverified commit 7282ab74, authored by Yineng Zhang and committed by GitHub
Browse files

fix: update bench_speculative (#5649)

parent b0feda09
......@@ -993,6 +993,8 @@ async def benchmark(
async with semaphore:
return await request_func(request_func_input=request_func_input, pbar=pbar)
+if not hasattr(args, "warmup_requests"):
+args.warmup_requests = 1
# Warmup
print(f"Starting warmup with {args.warmup_requests} sequences...")
......
......@@ -85,7 +85,7 @@ def send_one_batch(base_url, num_prompts, batch_size):
request_rate=float("inf"),
max_concurrency=batch_size,
disable_tqdm=False,
-lora_name=None,
+lora_names=None,
extra_request_body={},
profile=None,
)
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment