[Bugfix] Fix LLM priority normalization for single-string prompts (#40011)

Signed-off-by: daiyu1111 <2356690121@qq.com>

[Bugfix] Fix LLM priority normalization for single-string prompts (#40011)
Signed-off-by: daiyu1111 <2356690121@qq.com>
a302a8fd · daiyu1111 · GitHub · 4e8c3f1c · a302a8fd · a302a8fd
Unverified commit a302a8fd, authored Apr 16, 2026 by daiyu1111; committed by GitHub on Apr 16, 2026.
Show whitespace changes
Inline Side-by-side

Showing 2 changed files with 7 additions and 1 deletion

tests/entrypoints/llm/test_generate.py +6 -0

vllm/entrypoints/llm.py +1 -1

No files found.
--- a/tests/entrypoints/llm/test_generate.py
+++ b/tests/entrypoints/llm/test_generate.py
@@ -91,6 +91,12 @@ def test_multiple_priority(llm: LLM):
        outputs = llm.generate(PROMPTS, sampling_params=None, priority=[])
+def test_single_prompt_priority(llm: LLM):
+    # Single string prompts should be normalized to one request.
+    outputs = llm.generate(PROMPTS[0], sampling_params=None, priority=[0])
+    assert len(outputs) == 1
 def test_max_model_len():
    max_model_len = 20
    llm = LLM(

--- a/vllm/entrypoints/llm.py
+++ b/vllm/entrypoints/llm.py
@@ -1575,7 +1575,7 @@ class LLM:
        seq_prompts = prompt_to_seq(prompts)
        seq_params = self._params_to_seq(params, len(seq_prompts))
        seq_lora_requests = self._lora_request_to_seq(lora_request, len(seq_prompts))
-        seq_priority = self._priority_to_seq(priority, len(prompts))
+        seq_priority = self._priority_to_seq(priority, len(seq_prompts))
        return self._render_and_add_requests(
            prompts=(