"vscode:/vscode.git/clone" did not exist on "2389df81555ae4cc9b819393282d24eb1440dfbc"
test_video_gpu_decoder.py 2 KB
Newer Older
1
import math
Prabhat Roy's avatar
Prabhat Roy committed
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
import os

import pytest
import torch
from torchvision.io import _HAS_VIDEO_DECODER, VideoReader

try:
    import av
except ImportError:
    av = None

VIDEO_DIR = os.path.join(os.path.dirname(os.path.abspath(__file__)), "assets", "videos")

test_videos = [
    "RATRACE_wave_f_nm_np1_fr_goo_37.avi",
    "TrumanShow_wave_f_nm_np1_fr_med_26.avi",
    "v_SoccerJuggling_g23_c01.avi",
    "v_SoccerJuggling_g24_c01.avi",
    "R6llTwEh07w.mp4",
    "SOX5yA1l24A.mp4",
    "WUzgd7C1pWA.mp4",
]


@pytest.mark.skipif(_HAS_VIDEO_DECODER is False, reason="Didn't compile with support for gpu decoder")
class TestVideoGPUDecoder:
    @pytest.mark.skipif(av is None, reason="PyAV unavailable")
    def test_frame_reading(self):
        for test_video in test_videos:
            full_path = os.path.join(VIDEO_DIR, test_video)
            decoder = VideoReader(full_path, device="cuda:0")
            with av.open(full_path) as container:
                for av_frame in container.decode(container.streams.video[0]):
35
                    av_frames = torch.tensor(av_frame.to_rgb(src_colorspace="ITU709").to_ndarray())
Prabhat Roy's avatar
Prabhat Roy committed
36
                    vision_frames = next(decoder)["data"]
37
38
                    mean_delta = torch.mean(torch.abs(av_frames.float() - vision_frames.cpu().float()))
                    assert mean_delta < 0.75
Prabhat Roy's avatar
Prabhat Roy committed
39

40
41
42
43
44
45
46
47
48
49
50
51
    @pytest.mark.skipif(av is None, reason="PyAV unavailable")
    def test_metadata(self):
        for test_video in test_videos:
            full_path = os.path.join(VIDEO_DIR, test_video)
            decoder = VideoReader(full_path, device="cuda:0")
            video_metadata = decoder.get_metadata()["video"]
            with av.open(full_path) as container:
                video = container.streams.video[0]
                av_duration = float(video.duration * video.time_base)
                assert math.isclose(video_metadata["duration"], av_duration, rel_tol=1e-2)
                assert math.isclose(video_metadata["fps"], video.base_rate, rel_tol=1e-2)

Prabhat Roy's avatar
Prabhat Roy committed
52
53
54

if __name__ == "__main__":
    pytest.main([__file__])