Unverified commit 36bf2131, authored by Nathan Price, committed by GitHub
Browse files

[Bugfix] Add missing dynamic_arg_dims for Qwen3-ASR torch.compile (#35869)


Signed-off-by: Nathan Price <nathan@abridge.com>
Signed-off-by: Isotr0py <mozf@mail2.sysu.edu.cn>
Co-authored-by: Isotr0py <mozf@mail2.sysu.edu.cn>
parent 6f0dd938
......@@ -22,7 +22,6 @@ from collections.abc import AsyncGenerator, Mapping
import numpy as np
import torch
from vllm.compilation.decorators import support_torch_compile
from vllm.config import ModelConfig, SpeechToTextConfig, VllmConfig
from vllm.inputs.data import PromptType, TokensPrompt
from vllm.logger import init_logger
......@@ -177,7 +176,6 @@ class Qwen3ASRRealtimeMultiModalProcessor(Qwen3ASRMultiModalProcessor):
info=Qwen3ASRProcessingInfo,
dummy_inputs=Qwen3ASRDummyInputsBuilder,
)
@support_torch_compile
class Qwen3ASRRealtimeGeneration(Qwen3ASRForConditionalGeneration, SupportsRealtime):
realtime_max_tokens = 64
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment