Unverified Commit 844a8f42 authored by Wenxuan Tan's avatar Wenxuan Tan Committed by GitHub
Browse files

Fix LoRA bench (#6719)

parent 791b3bfa
......@@ -162,13 +162,13 @@ async def benchmark(
raise ValueError(f"Unknown backend: {backend}")
print("Starting initial single prompt test run...")
test_prompt, test_prompt_len, test_output_len = input_requests[0]
test_request = input_requests[0]
test_input = RequestFuncInput(
model=model_id,
prompt=test_prompt,
prompt=test_request.prompt,
api_url=api_url,
prompt_len=test_prompt_len,
output_len=test_output_len,
prompt_len=test_request.prompt_len,
output_len=test_request.output_len,
lora_name="dummy", # the lora_name argument will not be used
image_data=None,
extra_request_body=extra_request_body,
......@@ -187,13 +187,12 @@ async def benchmark(
benchmark_start_time = time.perf_counter()
tasks: List[asyncio.Task] = []
async for request in get_request(input_requests, request_rate):
prompt, prompt_len, output_len = request
request_func_input = RequestFuncInput(
model=model_id,
prompt=prompt,
prompt=request.prompt,
api_url=api_url,
prompt_len=prompt_len,
output_len=output_len,
prompt_len=request.prompt_len,
output_len=request.output_len,
lora_name="dummy",
image_data=None,
extra_request_body=extra_request_body,
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment