# audio.py 634 Bytes
# (repository-viewer header text; not part of the module's code)
1
from vllm.inputs.registry import InputContext
2
from vllm.multimodal.base import MultiModalKwargs, MultiModalPlugin
3
4
5
6
7
8
9
10


class AudioPlugin(MultiModalPlugin):
    """Plugin for audio data.

    The plugin identifies itself with the ``"audio"`` data key. It does not
    supply a default input mapper or a default maximum token count: both
    ``_default_*`` hooks below raise ``NotImplementedError`` unconditionally.
    """

    def get_data_key(self) -> str:
        """Return the data key for this plugin, the string ``"audio"``."""
        return "audio"

    def _default_input_mapper(self, ctx: InputContext, data: object,
                              **mm_processor_kwargs) -> MultiModalKwargs:
        """Reject default mapping of audio data.

        All arguments are accepted only to satisfy the signature; none of
        them is inspected.

        Raises:
            NotImplementedError: Always, because there is no default audio
                input mapper.
        """
        # NOTE(review): presumably callers are expected to provide their own
        # audio mapper instead of relying on this default -- confirm against
        # the MultiModalPlugin base class.
        raise NotImplementedError("There is no default audio input mapper")

    def _default_max_multimodal_tokens(self, ctx: InputContext) -> int:
        """Reject computing a default maximum multimodal token count.

        ``ctx`` is not inspected.

        Raises:
            NotImplementedError: Always, because there is no default maximum
                number of multimodal tokens for audio.
        """
        raise NotImplementedError(
            "There is no default maximum multimodal tokens")