Unverified Commit d7543862 authored by Cyrus Leung's avatar Cyrus Leung Committed by GitHub
Browse files

[Misc] Rename assets for testing (#17575)


Signed-off-by: default avatarDarkLight1337 <tlleungac@connect.ust.hk>
parent c777df79
...@@ -4,7 +4,7 @@ import pytest ...@@ -4,7 +4,7 @@ import pytest
from vllm.multimodal import MULTIMODAL_REGISTRY from vllm.multimodal import MULTIMODAL_REGISTRY
from ....conftest import _ImageAssets from ....conftest import ImageTestAssets
from ...utils import build_model_context from ...utils import build_model_context
...@@ -22,7 +22,7 @@ from ...utils import build_model_context ...@@ -22,7 +22,7 @@ from ...utils import build_model_context
@pytest.mark.parametrize("num_imgs", [1, 2]) @pytest.mark.parametrize("num_imgs", [1, 2])
@pytest.mark.parametrize("kwargs_on_init", [True, False]) @pytest.mark.parametrize("kwargs_on_init", [True, False])
def test_processor_override( def test_processor_override(
image_assets: _ImageAssets, image_assets: ImageTestAssets,
model_id: str, model_id: str,
mm_processor_kwargs: dict[str, int], mm_processor_kwargs: dict[str, int],
expected_toks_per_img: int, expected_toks_per_img: int,
......
...@@ -4,7 +4,7 @@ import pytest ...@@ -4,7 +4,7 @@ import pytest
from vllm.multimodal import MULTIMODAL_REGISTRY from vllm.multimodal import MULTIMODAL_REGISTRY
from ....conftest import _ImageAssets from ....conftest import ImageTestAssets
from ...utils import build_model_context from ...utils import build_model_context
...@@ -22,7 +22,7 @@ from ...utils import build_model_context ...@@ -22,7 +22,7 @@ from ...utils import build_model_context
@pytest.mark.parametrize("num_imgs", [1, 2]) @pytest.mark.parametrize("num_imgs", [1, 2])
@pytest.mark.parametrize("kwargs_on_init", [True, False]) @pytest.mark.parametrize("kwargs_on_init", [True, False])
def test_processor_override( def test_processor_override(
image_assets: _ImageAssets, image_assets: ImageTestAssets,
model_id: str, model_id: str,
mm_processor_kwargs: dict[str, int], mm_processor_kwargs: dict[str, int],
expected_toks_per_img: int, expected_toks_per_img: int,
......
...@@ -4,7 +4,7 @@ import pytest ...@@ -4,7 +4,7 @@ import pytest
from vllm.multimodal import MULTIMODAL_REGISTRY from vllm.multimodal import MULTIMODAL_REGISTRY
from ....conftest import _ImageAssets from ....conftest import ImageTestAssets
from ...utils import build_model_context from ...utils import build_model_context
...@@ -19,7 +19,7 @@ from ...utils import build_model_context ...@@ -19,7 +19,7 @@ from ...utils import build_model_context
@pytest.mark.parametrize("num_imgs", [1, 2]) @pytest.mark.parametrize("num_imgs", [1, 2])
@pytest.mark.parametrize("kwargs_on_init", [True, False]) @pytest.mark.parametrize("kwargs_on_init", [True, False])
def test_processor_override( def test_processor_override(
image_assets: _ImageAssets, image_assets: ImageTestAssets,
model_id: str, model_id: str,
mm_processor_kwargs: dict[str, object], mm_processor_kwargs: dict[str, object],
expected_toks_per_img: int, expected_toks_per_img: int,
......
...@@ -5,7 +5,7 @@ from transformers import SmolVLMConfig ...@@ -5,7 +5,7 @@ from transformers import SmolVLMConfig
from vllm.multimodal import MULTIMODAL_REGISTRY from vllm.multimodal import MULTIMODAL_REGISTRY
from ....conftest import _ImageAssets from ....conftest import ImageTestAssets
from ...utils import build_model_context from ...utils import build_model_context
...@@ -21,7 +21,7 @@ from ...utils import build_model_context ...@@ -21,7 +21,7 @@ from ...utils import build_model_context
@pytest.mark.parametrize("num_imgs", [1, 2]) @pytest.mark.parametrize("num_imgs", [1, 2])
@pytest.mark.parametrize("kwargs_on_init", [True, False]) @pytest.mark.parametrize("kwargs_on_init", [True, False])
def test_processor_override( def test_processor_override(
image_assets: _ImageAssets, image_assets: ImageTestAssets,
model_id: str, model_id: str,
mm_processor_kwargs: dict[str, object], mm_processor_kwargs: dict[str, object],
expected_toks_per_img: int, expected_toks_per_img: int,
......
...@@ -7,7 +7,7 @@ import torch ...@@ -7,7 +7,7 @@ import torch
from vllm.multimodal.image import rescale_image_size from vllm.multimodal.image import rescale_image_size
from ...conftest import IMAGE_ASSETS, VllmRunner, _ImageAssets from ...conftest import IMAGE_ASSETS, ImageTestAssets, VllmRunner
from ..utils import check_logprobs_close from ..utils import check_logprobs_close
HF_IMAGE_PROMPTS = IMAGE_ASSETS.prompts({ HF_IMAGE_PROMPTS = IMAGE_ASSETS.prompts({
...@@ -20,7 +20,7 @@ HF_IMAGE_PROMPTS = IMAGE_ASSETS.prompts({ ...@@ -20,7 +20,7 @@ HF_IMAGE_PROMPTS = IMAGE_ASSETS.prompts({
def run_awq_test( def run_awq_test(
vllm_runner: type[VllmRunner], vllm_runner: type[VllmRunner],
image_assets: _ImageAssets, image_assets: ImageTestAssets,
source_model: str, source_model: str,
quant_model: str, quant_model: str,
*, *,
......
...@@ -18,19 +18,25 @@ except ImportError: ...@@ -18,19 +18,25 @@ except ImportError:
ASSET_DIR = "multimodal_asset" ASSET_DIR = "multimodal_asset"
AudioAssetName = Literal["winning_call", "mary_had_lamb"]
@dataclass(frozen=True) @dataclass(frozen=True)
class AudioAsset: class AudioAsset:
name: Literal["winning_call", "mary_had_lamb"] name: AudioAssetName
@property
def filename(self) -> str:
return f"{self.name}.ogg"
@property @property
def audio_and_sample_rate(self) -> tuple[npt.NDArray, float]: def audio_and_sample_rate(self) -> tuple[npt.NDArray, float]:
audio_path = get_vllm_public_assets(filename=f"{self.name}.ogg", audio_path = get_vllm_public_assets(filename=self.filename,
s3_prefix=ASSET_DIR) s3_prefix=ASSET_DIR)
return librosa.load(audio_path, sr=None) return librosa.load(audio_path, sr=None)
def get_local_path(self) -> Path: def get_local_path(self) -> Path:
return get_vllm_public_assets(filename=f"{self.name}.ogg", return get_vllm_public_assets(filename=self.filename,
s3_prefix=ASSET_DIR) s3_prefix=ASSET_DIR)
@property @property
......
...@@ -10,10 +10,12 @@ from .base import get_vllm_public_assets ...@@ -10,10 +10,12 @@ from .base import get_vllm_public_assets
VLM_IMAGES_DIR = "vision_model_images" VLM_IMAGES_DIR = "vision_model_images"
ImageAssetName = Literal["stop_sign", "cherry_blossom"]
@dataclass(frozen=True) @dataclass(frozen=True)
class ImageAsset: class ImageAsset:
name: Literal["stop_sign", "cherry_blossom"] name: ImageAssetName
@property @property
def pil_image(self) -> Image.Image: def pil_image(self) -> Image.Image:
......
...@@ -2,7 +2,7 @@ ...@@ -2,7 +2,7 @@
from dataclasses import dataclass from dataclasses import dataclass
from functools import lru_cache from functools import lru_cache
from typing import Literal, Optional from typing import ClassVar, Literal, Optional
import cv2 import cv2
import numpy as np import numpy as np
...@@ -76,20 +76,31 @@ def video_to_pil_images_list(path: str, ...@@ -76,20 +76,31 @@ def video_to_pil_images_list(path: str,
] ]
VideoAssetName = Literal["baby_reading"]
@dataclass(frozen=True) @dataclass(frozen=True)
class VideoAsset: class VideoAsset:
name: Literal["sample_demo_1"] name: VideoAssetName
num_frames: int = -1 num_frames: int = -1
_NAME_TO_FILE: ClassVar[dict[VideoAssetName, str]] = {
"baby_reading": "sample_demo_1.mp4",
}
@property
def filename(self) -> str:
return self._NAME_TO_FILE[self.name]
@property @property
def pil_images(self) -> list[Image.Image]: def pil_images(self) -> list[Image.Image]:
video_path = download_video_asset(self.name + ".mp4") video_path = download_video_asset(self.filename)
ret = video_to_pil_images_list(video_path, self.num_frames) ret = video_to_pil_images_list(video_path, self.num_frames)
return ret return ret
@property @property
def np_ndarrays(self) -> npt.NDArray: def np_ndarrays(self) -> npt.NDArray:
video_path = download_video_asset(self.name + ".mp4") video_path = download_video_asset(self.filename)
ret = video_to_ndarrays(video_path, self.num_frames) ret = video_to_ndarrays(video_path, self.num_frames)
return ret return ret
...@@ -99,5 +110,5 @@ class VideoAsset: ...@@ -99,5 +110,5 @@ class VideoAsset:
See also: examples/offline_inference/qwen2_5_omni/only_thinker.py See also: examples/offline_inference/qwen2_5_omni/only_thinker.py
""" """
video_path = download_video_asset(self.name + ".mp4") video_path = download_video_asset(self.filename)
return librosa.load(video_path, sr=sampling_rate)[0] return librosa.load(video_path, sr=sampling_rate)[0]
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment