Unverified commit 731a6940, authored by Benji Beck, committed by GitHub
Browse files

Migrate whisper inputs to TensorSchema (#23505)


Signed-off-by: Benji Beck <benjibeck@meta.com>
parent e9b92dcd
...@@ -4,7 +4,7 @@ ...@@ -4,7 +4,7 @@
import math import math
from collections.abc import Iterable, Mapping, Sequence from collections.abc import Iterable, Mapping, Sequence
from contextlib import nullcontext from contextlib import nullcontext
from typing import Literal, Optional, TypedDict, Union, cast from typing import Annotated, Literal, Optional, Union, cast
import numpy as np import numpy as np
import torch import torch
...@@ -40,6 +40,7 @@ from vllm.multimodal.processing import (BaseProcessingInfo, ...@@ -40,6 +40,7 @@ from vllm.multimodal.processing import (BaseProcessingInfo,
PromptReplacement, PromptUpdate) PromptReplacement, PromptUpdate)
from vllm.multimodal.profiling import BaseDummyInputsBuilder from vllm.multimodal.profiling import BaseDummyInputsBuilder
from vllm.transformers_utils.processor import cached_get_processor from vllm.transformers_utils.processor import cached_get_processor
from vllm.utils.tensor_schema import TensorSchema, TensorShape
from .interfaces import (MultiModalEmbeddings, SupportsMultiModal, from .interfaces import (MultiModalEmbeddings, SupportsMultiModal,
SupportsTranscription, SupportsV0Only) SupportsTranscription, SupportsV0Only)
...@@ -111,9 +112,16 @@ ISO639_1_SUPPORTED_LANGS = { ...@@ -111,9 +112,16 @@ ISO639_1_SUPPORTED_LANGS = {
} }
class WhisperAudioInputs(TypedDict): class WhisperAudioInputs(TensorSchema):
input_features: NestedTensors """
"""Shape: `(batch_size, 128, M)`""" Dimensions:
- b: Batch size
- nmb: Number of mel bins
- t: Time frames (M)
"""
input_features: Annotated[Optional[NestedTensors],
TensorShape("b", "nmb", "t")]
class WhisperPositionalEmbedding(nn.Embedding): class WhisperPositionalEmbedding(nn.Embedding):
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment