# kinetics.py
from .video_utils import VideoClips
from .utils import list_dir
from .folder import make_dataset
from .vision import VisionDataset


class KineticsVideo(VisionDataset):
    """Dataset of fixed-length clips cut from ``.avi`` videos grouped by class.

    The class names are the sorted entries that ``list_dir`` reports for the
    dataset root; each name is mapped to its position in that sorted list.
    ``make_dataset`` then builds ``self.samples`` for the ``avi`` extension,
    and ``VideoClips`` indexes clips over the first element of every sample.

    Args:
        root: Dataset root directory, forwarded to ``VisionDataset``.
        frames_per_clip: Forwarded to ``VideoClips`` as its second argument.
        step_between_clips: Forwarded to ``VideoClips`` as its third
            argument. Defaults to 1.
        transform: Optional callable applied to the ``video`` element of a
            clip in ``__getitem__``. ``None`` disables it.

    Attributes set here:
        samples: Result of ``make_dataset``; element ``[0]`` of each entry is
            used as the video path and element ``[1]`` as the label.
        classes: Sorted list of class names.
        video_clips: The ``VideoClips`` index over all sample videos.
        transform: The ``transform`` argument, stored unchanged.
    """

    def __init__(self, root, frames_per_clip, step_between_clips=1, transform=None):
        super(KineticsVideo, self).__init__(root)
        extensions = ('avi',)

        # Read class folders from self.root, the same path make_dataset uses,
        # so class discovery and sample indexing cannot diverge.
        # NOTE(review): assumes VisionDataset stores (possibly normalized)
        # root as self.root -- confirm against the base class.
        classes = sorted(list_dir(self.root))
        class_to_idx = {name: index for index, name in enumerate(classes)}

        self.samples = make_dataset(self.root, class_to_idx, extensions, is_valid_file=None)
        self.classes = classes

        # Only the first element of each sample is handed to VideoClips; the
        # second element is looked up later as the label.
        video_list = [sample[0] for sample in self.samples]
        self.video_clips = VideoClips(video_list, frames_per_clip, step_between_clips)
        self.transform = transform

    def __len__(self):
        """Return the number of clips reported by the ``VideoClips`` index."""
        return self.video_clips.num_clips()

    def __getitem__(self, idx):
        """Return ``(video, audio, label)`` for the clip at position ``idx``.

        ``label`` is taken from the sample whose video the clip belongs to.
        ``transform``, when set, is applied to ``video`` only; ``audio`` is
        returned as delivered by ``VideoClips.get_clip``.
        """
        # info is returned by get_clip but is not part of this dataset's output.
        video, audio, info, video_idx = self.video_clips.get_clip(idx)
        label = self.samples[video_idx][1]

        if self.transform is not None:
            video = self.transform(video)

        return video, audio, label