Unverified commit c428e8d8, authored by baonudesifeizhai, committed by GitHub
Browse files

Fix io processor pooling #28273 (#28484)


Signed-off-by: baonudesifeizhai <baonudesifeizhai@gmail.com>
parent 5e973209
...@@ -4,7 +4,7 @@ ...@@ -4,7 +4,7 @@
import asyncio import asyncio
import json import json
import time import time
from collections.abc import AsyncGenerator from collections.abc import AsyncGenerator, Sequence
from typing import Final, cast from typing import Final, cast
import jinja2 import jinja2
...@@ -122,6 +122,10 @@ class OpenAIServingPooling(OpenAIServing): ...@@ -122,6 +122,10 @@ class OpenAIServingPooling(OpenAIServing):
engine_prompts = await self.io_processor.pre_process_async( engine_prompts = await self.io_processor.pre_process_async(
prompt=validated_prompt, request_id=request_id prompt=validated_prompt, request_id=request_id
) )
if not isinstance(engine_prompts, Sequence) or isinstance(
engine_prompts, (str, bytes, bytearray)
):
engine_prompts = [engine_prompts]
elif isinstance(request, PoolingChatRequest): elif isinstance(request, PoolingChatRequest):
error_check_ret = self._validate_chat_template( error_check_ret = self._validate_chat_template(
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment