Unverified commit 8bd696fa, authored by Huy Do, committed by GitHub
Browse files

[Bugfix] Incorrect another MM data format in vllm bench throughput (#26462)


Signed-off-by: Huy Do <huydhn@gmail.com>
parent bb6d8c21
...@@ -59,16 +59,16 @@ def run_vllm( ...@@ -59,16 +59,16 @@ def run_vllm(
prompts: list[Union[TextPrompt, TokensPrompt]] = [] prompts: list[Union[TextPrompt, TokensPrompt]] = []
sampling_params: list[SamplingParams] = [] sampling_params: list[SamplingParams] = []
for request in requests: for request in requests:
prompts.append( prompt = (
TokensPrompt( TokensPrompt(prompt_token_ids=request.prompt["prompt_token_ids"])
prompt_token_ids=request.prompt["prompt_token_ids"],
multi_modal_data=request.multi_modal_data,
)
if "prompt_token_ids" in request.prompt if "prompt_token_ids" in request.prompt
else TextPrompt( else TextPrompt(prompt=request.prompt)
prompt=request.prompt, multi_modal_data=request.multi_modal_data
)
) )
if request.multi_modal_data:
assert isinstance(request.multi_modal_data, dict)
prompt["multi_modal_data"] = request.multi_modal_data
prompts.append(prompt)
sampling_params.append( sampling_params.append(
SamplingParams( SamplingParams(
n=n, n=n,
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment