audio.py 1.16 KB
Newer Older
1
2
# SPDX-License-Identifier: Apache-2.0

3
from dataclasses import dataclass
4
from pathlib import Path
5
from typing import Literal
6
7
from urllib.parse import urljoin

8
import numpy.typing as npt
9

10
11
12
13
14
15
16
17
from vllm.utils import PlaceholderModule

from .base import VLLM_S3_BUCKET_URL, get_vllm_public_assets

try:
    import librosa
except ImportError:
    librosa = PlaceholderModule("librosa")  # type: ignore[assignment]
18
19
20

ASSET_DIR = "multimodal_asset"

21
22
AudioAssetName = Literal["winning_call", "mary_had_lamb"]

23
24
25

@dataclass(frozen=True)
class AudioAsset:
26
27
28
29
30
    name: AudioAssetName

    @property
    def filename(self) -> str:
        return f"{self.name}.ogg"
31
32

    @property
33
    def audio_and_sample_rate(self) -> tuple[npt.NDArray, float]:
34
        audio_path = get_vllm_public_assets(filename=self.filename,
35
                                            s3_prefix=ASSET_DIR)
36
        return librosa.load(audio_path, sr=None)
37

38
    def get_local_path(self) -> Path:
39
        return get_vllm_public_assets(filename=self.filename,
40
41
                                      s3_prefix=ASSET_DIR)

42
43
    @property
    def url(self) -> str:
44
        return urljoin(VLLM_S3_BUCKET_URL, f"{ASSET_DIR}/{self.name}.ogg")