Unverified Commit 1dafb29f authored by Cyrus Leung's avatar Cyrus Leung Committed by GitHub
Browse files

[Benchmark] Avoid unnecessary video download in MMVU (#35618)


Signed-off-by: default avatarDarkLight1337 <tlleungac@connect.ust.hk>
parent 49b9ae32
...@@ -31,6 +31,7 @@ from tempfile import NamedTemporaryFile ...@@ -31,6 +31,7 @@ from tempfile import NamedTemporaryFile
from typing import Any, cast from typing import Any, cast
import numpy as np import numpy as np
from huggingface_hub import snapshot_download
from PIL import Image from PIL import Image
from typing_extensions import deprecated from typing_extensions import deprecated
...@@ -2680,6 +2681,14 @@ class MMVUDataset(HuggingFaceDataset): ...@@ -2680,6 +2681,14 @@ class MMVUDataset(HuggingFaceDataset):
+ (" ".join(f"{k}.{v}" for k, v in x["choices"].items())), + (" ".join(f"{k}.{v}" for k, v in x["choices"].items())),
} }
def __init__(self, **kwargs) -> None:
super().__init__(**kwargs)
self._remote_path_root = (
f"https://huggingface.co/datasets/{self.hf_name}/resolve/main"
)
self._local_path_root = snapshot_download(self.hf_name, repo_type="dataset")
def sample( def sample(
self, self,
tokenizer: TokenizerLike, tokenizer: TokenizerLike,
...@@ -2702,7 +2711,9 @@ class MMVUDataset(HuggingFaceDataset): ...@@ -2702,7 +2711,9 @@ class MMVUDataset(HuggingFaceDataset):
break break
prompt = parser_fn(item) prompt = parser_fn(item)
mm_content = process_video(item["video"]) mm_content = process_video(
item["video"].replace(self._remote_path_root, self._local_path_root)
)
prompt_len = len(tokenizer.encode(prompt)) prompt_len = len(tokenizer.encode(prompt))
if enable_multimodal_chat: if enable_multimodal_chat:
# Note: when chat is enabled the request prompt_len is no longer # Note: when chat is enabled the request prompt_len is no longer
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment