Unverified commit 7282ab74, authored by Yineng Zhang, committed by GitHub
Browse files

fix: update bench_speculative (#5649)

parent b0feda09
...@@ -993,6 +993,8 @@ async def benchmark( ...@@ -993,6 +993,8 @@ async def benchmark(
async with semaphore: async with semaphore:
return await request_func(request_func_input=request_func_input, pbar=pbar) return await request_func(request_func_input=request_func_input, pbar=pbar)
if not hasattr(args, "warmup_requests"):
args.warmup_requests = 1
# Warmup # Warmup
print(f"Starting warmup with {args.warmup_requests} sequences...") print(f"Starting warmup with {args.warmup_requests} sequences...")
......
...@@ -85,7 +85,7 @@ def send_one_batch(base_url, num_prompts, batch_size): ...@@ -85,7 +85,7 @@ def send_one_batch(base_url, num_prompts, batch_size):
request_rate=float("inf"), request_rate=float("inf"),
max_concurrency=batch_size, max_concurrency=batch_size,
disable_tqdm=False, disable_tqdm=False,
lora_name=None, lora_names=None,
extra_request_body={}, extra_request_body={},
profile=None, profile=None,
) )
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment