# test_datasets_samplers.py
import contextlib
import sys
import os
import torch
5
import pytest
6
7

from torchvision import io
8
9
10
11
12
from torchvision.datasets.samplers import (
    DistributedSampler,
    RandomClipSampler,
    UniformClipSampler,
)
13
14
15
from torchvision.datasets.video_utils import VideoClips, unfold
from torchvision import get_video_backend

16
from common_utils import get_tmp_dir, assert_equal
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31


@contextlib.contextmanager
def get_list_of_videos(num_videos=5, sizes=None, fps=None):
    """Write random ``.mp4`` files into a temporary directory and yield their paths.

    Args:
        num_videos: number of video files to create.
        sizes: optional sequence of per-video frame counts, indexed by video
            number. When ``None``, video ``i`` gets ``5 * (i + 1)`` frames.
        fps: optional sequence of per-video frame rates, indexed by video
            number. When ``None``, every video is written at 5 fps.

    Yields:
        A list with one file path per video, in creation order. The paths
        are yielded while the ``get_tmp_dir()`` context is still open, so the
        files are only guaranteed to exist inside the ``with`` body.
    """
    with get_tmp_dir() as tmp_dir:
        names = []
        for i in range(num_videos):
            size = 5 * (i + 1) if sizes is None else sizes[i]
            f = 5 if fps is None else fps[i]

            # Random uint8 frames of shape (size, 300, 400, 3); the content is
            # irrelevant to the samplers, only the frame count matters.
            data = torch.randint(0, 256, (size, 300, 400, 3), dtype=torch.uint8)
            name = os.path.join(tmp_dir, "{}.mp4".format(i))
            names.append(name)
            io.write_video(name, data, fps=f)

        yield names


40
41
@pytest.mark.skipif(not io.video._av_available(), reason="this test requires av")
class TestDatasetsSamplers:
    """Tests for the clip samplers in ``torchvision.datasets.samplers``.

    Every test writes a handful of small random videos with
    ``get_list_of_videos`` and wraps them in ``VideoClips(video_list, 5, 5)``.
    The assertions below rely on a 25-frame video contributing 5 clips and a
    10-frame video contributing 2 clips to the global clip index space.
    """

    def test_random_clip_sampler(self):
        """RandomClipSampler draws exactly 3 clips from each of 3 equal videos."""
        with get_list_of_videos(num_videos=3, sizes=[25, 25, 25]) as video_list:
            video_clips = VideoClips(video_list, 5, 5)
            sampler = RandomClipSampler(video_clips, 3)
            assert len(sampler) == 3 * 3
            indices = torch.tensor(list(iter(sampler)))
            # Each video owns 5 consecutive clip indices, so floor-dividing
            # by 5 maps a clip index to the video it came from.
            videos = torch.div(indices, 5, rounding_mode='floor')
            v_idxs, count = torch.unique(videos, return_counts=True)
            assert_equal(v_idxs, torch.tensor([0, 1, 2]))
            assert_equal(count, torch.tensor([3, 3, 3]))

    def test_random_clip_sampler_unequal(self):
        """RandomClipSampler takes every clip of a video with fewer than 3 clips."""
        with get_list_of_videos(num_videos=3, sizes=[10, 25, 25]) as video_list:
            video_clips = VideoClips(video_list, 5, 5)
            sampler = RandomClipSampler(video_clips, 3)
            # The short first video only has 2 clips; the others are capped at 3.
            assert len(sampler) == 2 + 3 + 3
            indices = list(iter(sampler))
            # Both clips of the first video (global indices 0 and 1) must appear.
            assert 0 in indices
            assert 1 in indices
            # remove elements of the first video, to simplify testing
            indices.remove(0)
            indices.remove(1)
            # Shift so the remaining two videos start at clip index 0 again.
            indices = torch.tensor(indices) - 2
            videos = torch.div(indices, 5, rounding_mode='floor')
            v_idxs, count = torch.unique(videos, return_counts=True)
            assert_equal(v_idxs, torch.tensor([0, 1]))
            assert_equal(count, torch.tensor([3, 3]))

    def test_uniform_clip_sampler(self):
        """UniformClipSampler picks 3 evenly spaced clips from each equal video."""
        with get_list_of_videos(num_videos=3, sizes=[25, 25, 25]) as video_list:
            video_clips = VideoClips(video_list, 5, 5)
            sampler = UniformClipSampler(video_clips, 3)
            assert len(sampler) == 3 * 3
            indices = torch.tensor(list(iter(sampler)))
            videos = torch.div(indices, 5, rounding_mode='floor')
            v_idxs, count = torch.unique(videos, return_counts=True)
            assert_equal(v_idxs, torch.tensor([0, 1, 2]))
            assert_equal(count, torch.tensor([3, 3, 3]))
            # First, middle and last clip of each 5-clip video.
            assert_equal(indices, torch.tensor([0, 2, 4, 5, 7, 9, 10, 12, 14]))

    def test_uniform_clip_sampler_insufficient_clips(self):
        """UniformClipSampler still yields 3 indices for a video with only 2 clips."""
        with get_list_of_videos(num_videos=3, sizes=[10, 25, 25]) as video_list:
            video_clips = VideoClips(video_list, 5, 5)
            sampler = UniformClipSampler(video_clips, 3)
            assert len(sampler) == 3 * 3
            indices = torch.tensor(list(iter(sampler)))
            # The 2-clip first video repeats clip 0 to reach 3 samples: [0, 0, 1].
            assert_equal(indices, torch.tensor([0, 0, 1, 2, 4, 6, 7, 9, 11]))

    def test_distributed_sampler_and_uniform_clip_sampler(self):
        """DistributedSampler shards UniformClipSampler output in groups of 3."""
        with get_list_of_videos(num_videos=3, sizes=[25, 25, 25]) as video_list:
            video_clips = VideoClips(video_list, 5, 5)
            clip_sampler = UniformClipSampler(video_clips, 3)

            distributed_sampler_rank0 = DistributedSampler(
                clip_sampler,
                num_replicas=2,
                rank=0,
                group_size=3,
            )
            indices = torch.tensor(list(iter(distributed_sampler_rank0)))
            assert len(distributed_sampler_rank0) == 6
            # Rank 0 receives the first and third group of 3 clips.
            assert_equal(indices, torch.tensor([0, 2, 4, 10, 12, 14]))

            distributed_sampler_rank1 = DistributedSampler(
                clip_sampler,
                num_replicas=2,
                rank=1,
                group_size=3,
            )
            indices = torch.tensor(list(iter(distributed_sampler_rank1)))
            assert len(distributed_sampler_rank1) == 6
            # Rank 1 receives the second group, then the first group again:
            # 3 groups do not divide evenly over 2 replicas, so the expected
            # output shows the shortfall filled from the start of the sequence.
            assert_equal(indices, torch.tensor([5, 7, 9, 0, 2, 4]))
114

115
116

# Allow running this test module directly as a script.
if __name__ == '__main__':
    pytest.main([__file__])