Unverified commit 4ba48b79, authored by Biswa Panda, committed by GitHub
Browse files

feat: add model field to multimodal protocol for LoRA identity (#6382)

parent 46d9f448
...@@ -155,6 +155,7 @@ class MultimodalPDWorkerHandler(BaseWorkerHandler): ...@@ -155,6 +155,7 @@ class MultimodalPDWorkerHandler(BaseWorkerHandler):
), ),
sampling_params=sampling_params, sampling_params=sampling_params,
request_id=request_id, request_id=request_id,
model=raw_request.get("model"),
multimodal_inputs=multimodal_groups, multimodal_inputs=multimodal_groups,
) )
......
...@@ -175,6 +175,8 @@ class MultiModalGroup(BaseModel): ...@@ -175,6 +175,8 @@ class MultiModalGroup(BaseModel):
class vLLMMultimodalRequest(vLLMGenerateRequest): class vLLMMultimodalRequest(vLLMGenerateRequest):
model_config = ConfigDict(arbitrary_types_allowed=True) model_config = ConfigDict(arbitrary_types_allowed=True)
# LoRA adapter name (matches the name used in load_lora)
model: Optional[str] = None
# Decode-only worker can have None for multimodal_inputs # Decode-only worker can have None for multimodal_inputs
multimodal_inputs: Optional[List[MultiModalGroup]] = Field(default_factory=list) multimodal_inputs: Optional[List[MultiModalGroup]] = Field(default_factory=list)
# Add these fields for Qwen VL (mRoPE) decode-only worker # Add these fields for Qwen VL (mRoPE) decode-only worker
......
...@@ -143,6 +143,7 @@ class Processor(ProcessMixIn): ...@@ -143,6 +143,7 @@ class Processor(ProcessMixIn):
engine_prompt=engine_prompt, engine_prompt=engine_prompt,
sampling_params=sampling_params, sampling_params=sampling_params,
request_id=request_id, request_id=request_id,
model=raw_request.model,
multimodal_input=multimodal_input, multimodal_input=multimodal_input,
) )
......
...@@ -156,6 +156,8 @@ class MultiModalInput(BaseModel): ...@@ -156,6 +156,8 @@ class MultiModalInput(BaseModel):
class vLLMMultimodalRequest(vLLMGenerateRequest): class vLLMMultimodalRequest(vLLMGenerateRequest):
model_config = ConfigDict(arbitrary_types_allowed=True) model_config = ConfigDict(arbitrary_types_allowed=True)
# LoRA adapter name (matches the name used in load_lora)
model: Optional[str] = None
multimodal_input: Optional[MultiModalInput] = Field(default_factory=MultiModalInput) multimodal_input: Optional[MultiModalInput] = Field(default_factory=MultiModalInput)
image_grid_thw: Optional[List[Any]] = None image_grid_thw: Optional[List[Any]] = None
embeddings_shape: Optional[ embeddings_shape: Optional[
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment