test_io.py 11 KB
Newer Older
moto's avatar
moto committed
1
2
import os
import math
moto's avatar
moto committed
3
4
import shutil
import tempfile
David Pollack's avatar
David Pollack committed
5
import unittest
moto's avatar
moto committed
6

7
import torch
Soumith Chintala's avatar
Soumith Chintala committed
8
import torchaudio
moto's avatar
moto committed
9

moto's avatar
moto committed
10
11
12
13
14
15
16
17
18
19
20
21
from .common_utils import BACKENDS, BACKENDS_MP3, get_asset_path


def create_temp_assets_dir():
    """
    Copy the test assets into a freshly created temporary directory.

    The tree returned by ``get_asset_path()`` is copied (the originals are
    left in place) into an ``assets`` sub-folder of the new directory.

    Returns a Tuple[str, TemporaryDirectory]: the path of the temporary
    directory and the ``TemporaryDirectory`` object that owns it.
    """
    holder = tempfile.TemporaryDirectory()
    root = holder.name
    destination = os.path.join(root, "assets")
    shutil.copytree(get_asset_path(), destination)
    return root, holder
Vincent QB's avatar
Vincent QB committed
22
23


David Pollack's avatar
David Pollack committed
24
class Test_LoadSave(unittest.TestCase):
25
    test_dirpath, test_dir = create_temp_assets_dir()
26
27
    test_filepath = os.path.join(test_dirpath, "assets",
                                 "steam-train-whistle-daniel_simon.mp3")
Vincent QB's avatar
Vincent QB committed
28
29
    test_filepath_wav = os.path.join(test_dirpath, "assets",
                                     "steam-train-whistle-daniel_simon.wav")
Soumith Chintala's avatar
Soumith Chintala committed
30

David Pollack's avatar
David Pollack committed
31
    def test_1_save(self):
        """Run the save checks against each backend, for mp3 and wav input.

        Every backend runs in its own labelled sub-test so that a failure
        report names the backend and input format that failed.
        """
        for backend in BACKENDS_MP3:
            # these checks are not run against the 'sox_io' backend
            if backend == 'sox_io':
                continue
            with self.subTest(backend=backend, fmt="mp3"):
                torchaudio.set_audio_backend(backend)
                self._test_1_save(self.test_filepath, False)

        for backend in BACKENDS:
            if backend == 'sox_io':
                continue
            with self.subTest(backend=backend, fmt="wav"):
                torchaudio.set_audio_backend(backend)
                self._test_1_save(self.test_filepath_wav, True)
Vincent QB's avatar
Vincent QB committed
45
46

    def _test_1_save(self, test_filepath, normalization):
        """Exercise ``torchaudio.save`` with valid and invalid inputs.

        Args:
            test_filepath: audio file to load the test signal from.
            normalization: value forwarded to the ``normalization`` argument
                of ``torchaudio.load``.

        Only the ``torchaudio.save`` call sits inside each ``assertRaises``
        block; tensor reshaping and path construction happen beforehand so an
        unexpected error raised during setup cannot satisfy the assertion.
        """
        # load signal
        x, sr = torchaudio.load(test_filepath, normalization=normalization)

        # check save
        new_filepath = os.path.join(self.test_dirpath, "test.wav")
        torchaudio.save(new_filepath, x, sr)
        self.assertTrue(os.path.isfile(new_filepath))
        os.unlink(new_filepath)

        # check automatic normalization
        x /= 1 << 31
        torchaudio.save(new_filepath, x, sr)
        self.assertTrue(os.path.isfile(new_filepath))
        os.unlink(new_filepath)

        # test save 1d tensor
        x = x[0, :]  # get mono signal
        x.squeeze_()  # remove channel dim
        torchaudio.save(new_filepath, x, sr)
        self.assertTrue(os.path.isfile(new_filepath))
        os.unlink(new_filepath)

        # don't allow invalid sizes as inputs
        x.unsqueeze_(1)  # L x C not C x L
        with self.assertRaises(ValueError):
            torchaudio.save(new_filepath, x, sr)

        x.squeeze_()
        x.unsqueeze_(1)
        x.unsqueeze_(0)  # 1 x L x 1
        with self.assertRaises(ValueError):
            torchaudio.save(new_filepath, x, sr)

        # don't save to folders that don't exist
        new_filepath = os.path.join(self.test_dirpath, "no-path",
                                    "test.wav")
        with self.assertRaises(OSError):
            torchaudio.save(new_filepath, x, sr)
Soumith Chintala's avatar
Soumith Chintala committed
85

Vincent QB's avatar
Vincent QB committed
86
    def test_1_save_sine(self):
        """Run the sine-wave save check against each backend.

        Each backend runs in its own labelled sub-test so that a failure
        report names the backend that failed.
        """
        for backend in BACKENDS:
            # these checks are not run against the 'sox_io' backend
            if backend == 'sox_io':
                continue
            with self.subTest(backend=backend):
                torchaudio.set_audio_backend(backend)
                self._test_1_save_sine()
Vincent QB's avatar
Vincent QB committed
93
94
95

    def _test_1_save_sine(self):
        """Write a generated tone to ``assets/sinewave.wav`` and check precision.

        The tone is saved once with the default arguments and once with an
        explicit precision of 32; ``torchaudio.info`` is then used to confirm
        the reported precision of each file (16 and 32 respectively).

        ``assets/sinewave.wav`` is left on disk; other tests in this class
        read that same path.
        """
        sample_rate = 16000
        frequency = 440
        amplitude = 0.3

        # save created file
        sinewave_filepath = os.path.join(
            self.test_dirpath, "assets", "sinewave.wav")

        # four seconds worth of samples, shaped 1 x L
        steps = torch.arange(0, 4 * sample_rate).float()
        tone = torch.cos(2 * math.pi * steps * frequency / sample_rate)
        tone = tone.unsqueeze(0)
        # tone is between -1 and 1, so must scale
        tone = (tone * amplitude * (2**31)).long()

        torchaudio.save(sinewave_filepath, tone, sample_rate)
        self.assertTrue(os.path.isfile(sinewave_filepath))

        # test precision
        requested_precision = 32
        scratch_path = os.path.join(self.test_dirpath, "test.wav")
        default_info, _ = torchaudio.info(sinewave_filepath)
        torchaudio.save(scratch_path, tone, sample_rate, requested_precision)
        explicit_info, _ = torchaudio.info(scratch_path)
        self.assertEqual(default_info.precision, 16)
        self.assertEqual(explicit_info.precision, requested_precision)

        os.unlink(scratch_path)

David Pollack's avatar
David Pollack committed
121
    def test_2_load(self):
        """Run the load checks against each backend, for mp3 and wav input.

        Each backend runs in its own labelled sub-test so that a failure
        report names the backend and input format that failed. The second
        argument passed to the helper is the expected number of frames per
        channel for that file.
        """
        for backend in BACKENDS_MP3:
            # these checks are not run against the 'sox_io' backend
            if backend == 'sox_io':
                continue
            with self.subTest(backend=backend, fmt="mp3"):
                torchaudio.set_audio_backend(backend)
                self._test_2_load(self.test_filepath, 278756)

        for backend in BACKENDS:
            if backend == 'sox_io':
                continue
            with self.subTest(backend=backend, fmt="wav"):
                torchaudio.set_audio_backend(backend)
                self._test_2_load(self.test_filepath_wav, 276858)
Vincent QB's avatar
Vincent QB committed
135
136

    def _test_2_load(self, test_filepath, length):
        """Check ``torchaudio.load`` on a two-channel, 44.1 kHz file.

        Args:
            test_filepath: audio file to load.
            length: expected number of frames per channel in the file.

        Covers plain loading, ``offset``, ``num_frames``, ``channels_first``
        and the errors raised for paths that cannot be loaded.
        """
        # check normal loading
        x, sr = torchaudio.load(test_filepath)
        self.assertEqual(sr, 44100)
        self.assertEqual(x.size(), (2, length))

        # check offset (x from the load above is the full signal)
        offset = 15
        x_offset, _ = torchaudio.load(test_filepath, offset=offset)
        self.assertTrue(x[:, offset:].allclose(x_offset))

        # check number of frames
        n = 201
        x, _ = torchaudio.load(test_filepath, num_frames=n)
        # assertEqual, not assertTrue: assertTrue would treat the tuple as the
        # failure message and pass for any non-empty size
        self.assertEqual(x.size(), (2, n))

        # check channels first
        x, _ = torchaudio.load(test_filepath, channels_first=False)
        self.assertEqual(x.size(), (length, 2))

        # check raising errors
        with self.assertRaises(OSError):
            torchaudio.load("file-does-not-exist.mp3")

        # a path beside the temporary directory; loading it must fail
        tdir = os.path.join(
            os.path.dirname(self.test_dirpath), "torchaudio")
        with self.assertRaises(OSError):
            torchaudio.load(tdir)

Vincent QB's avatar
Vincent QB committed
166
    def test_2_load_nonormalization(self):
        """Run the un-normalized load check against each mp3-capable backend.

        Each backend runs in its own labelled sub-test so that a failure
        report names the backend that failed.
        """
        for backend in BACKENDS_MP3:
            # these checks are not run against the 'sox_io' backend
            if backend == 'sox_io':
                continue
            with self.subTest(backend=backend):
                torchaudio.set_audio_backend(backend)
                self._test_2_load_nonormalization(self.test_filepath, 278756)
Vincent QB's avatar
Vincent QB committed
173
174
175
176
177
178
179
180
181
182
183
184

    def _test_2_load_nonormalization(self, test_filepath, length):
        """Check loading with ``normalization=False``.

        Args:
            test_filepath: audio file to load.
            length: not used by this check.
        """
        # without normalization the samples must reach beyond [-1, 1]
        raw, _ = torchaudio.load(test_filepath, normalization=False)
        self.assertTrue(raw.min() <= -1.0)
        self.assertTrue(raw.max() >= 1.0)

        # passing a LongTensor as the output tensor must yield a LongTensor
        out_tensor = torch.LongTensor()
        loaded, _ = torchaudio.load(
            test_filepath, out_tensor, normalization=False)
        self.assertTrue(isinstance(loaded, torch.LongTensor))

David Pollack's avatar
David Pollack committed
185
    def test_3_load_and_save_is_identity(self):
        """Run the load/save round-trip check against each backend.

        Each backend runs in its own labelled sub-test so that a failure
        report names the backend that failed.
        """
        for backend in BACKENDS:
            # these checks are not run against the 'sox_io' backend
            if backend == 'sox_io':
                continue
            with self.subTest(backend=backend):
                torchaudio.set_audio_backend(backend)
                self._test_3_load_and_save_is_identity()
Vincent QB's avatar
Vincent QB committed
192
193

    def _test_3_load_and_save_is_identity(self):
        """Load ``assets/sinewave.wav``, save it, reload it, and compare.

        The reloaded tensor must be close to the original and the sample rate
        must be unchanged. The scratch file is removed afterwards.
        """
        source_path = os.path.join(self.test_dirpath, 'assets', 'sinewave.wav')
        scratch_path = os.path.join(self.test_dirpath, 'test.wav')

        original, original_rate = torchaudio.load(source_path)
        torchaudio.save(scratch_path, original, original_rate)
        reloaded, reloaded_rate = torchaudio.load(scratch_path)

        self.assertTrue(original.allclose(reloaded))
        self.assertEqual(original_rate, reloaded_rate)
        os.unlink(scratch_path)

moto's avatar
moto committed
203
    @unittest.skipIf(
        any(be not in BACKENDS for be in ["sox", "soundfile"]),
        "sox and soundfile are not available")
    def test_3_load_and_save_is_identity_across_backend(self):
        """Round-trip a file through the sox and soundfile backends, both ways.

        Skipped unless both backends are listed in ``BACKENDS``. Each
        direction runs in its own labelled sub-test so that a failure report
        names the backend pair that failed.
        """
        backend_pairs = (("sox", "soundfile"), ("soundfile", "sox"))
        for backend1, backend2 in backend_pairs:
            with self.subTest(backend1=backend1, backend2=backend2):
                self._test_3_load_and_save_is_identity_across_backend(
                    backend1, backend2)

    def _test_3_load_and_save_is_identity_across_backend(self, backend1, backend2):
        """Save with one backend, reload with another, and compare.

        Args:
            backend1: backend selected while loading ``assets/sinewave.wav``
                and saving the scratch copy.
            backend2: backend selected while reloading the scratch copy.
        """
        source_path = os.path.join(self.test_dirpath, 'assets', 'sinewave.wav')
        scratch_path = os.path.join(self.test_dirpath, 'test.wav')

        # load and save under the first backend
        torchaudio.set_audio_backend(backend1)
        first_tensor, first_rate = torchaudio.load(source_path)
        torchaudio.save(scratch_path, first_tensor, first_rate)

        # reload under the second backend
        torchaudio.set_audio_backend(backend2)
        second_tensor, second_rate = torchaudio.load(scratch_path)

        self.assertTrue(first_tensor.allclose(second_tensor))
        self.assertEqual(first_rate, second_rate)
        os.unlink(scratch_path)

David Pollack's avatar
David Pollack committed
225
    def test_4_load_partial(self):
        """Run the partial-load checks against each mp3-capable backend.

        Each backend runs in its own labelled sub-test so that a failure
        report names the backend that failed.
        """
        for backend in BACKENDS_MP3:
            # these checks are not run against the 'sox_io' backend
            if backend == 'sox_io':
                continue
            with self.subTest(backend=backend):
                torchaudio.set_audio_backend(backend)
                self._test_4_load_partial()
Vincent QB's avatar
Vincent QB committed
232
233

    def _test_4_load_partial(self):
        """Check ``torchaudio.load`` with ``num_frames`` and ``offset``.

        Partial loads of the sine wav, a two-channel copy of it, and the
        two-channel mp3 are each compared against the matching slice of the
        fully loaded signal. Also checks a ``num_frames`` larger than the
        remaining file and an ``offset`` past the end of the file.
        """
        num_frames = 101
        offset = 201
        # load entire mono sinewave wav file, load a partial copy and then compare
        input_sine_path = os.path.join(self.test_dirpath, 'assets', 'sinewave.wav')
        x_sine_full, sr_sine = torchaudio.load(input_sine_path)
        x_sine_part, _ = torchaudio.load(input_sine_path, num_frames=num_frames, offset=offset)
        l1_error = x_sine_full[:, offset:(num_frames + offset)].sub(x_sine_part).abs().sum().item()
        # test for the correct number of samples and that the correct portion was loaded
        self.assertEqual(x_sine_part.size(1), num_frames)
        self.assertEqual(l1_error, 0.)

        # create a two channel version of this wavefile
        # repeat(2, 1) duplicates along the channel dimension (C x L layout);
        # repeat(1, 2) would instead double the length of a single channel
        x_2ch_sine = x_sine_full.repeat(2, 1)
        out_2ch_sine_path = os.path.join(self.test_dirpath, 'assets', '2ch_sinewave.wav')
        torchaudio.save(out_2ch_sine_path, x_2ch_sine, sr_sine)
        x_2ch_sine_load, _ = torchaudio.load(out_2ch_sine_path, num_frames=num_frames, offset=offset)
        os.unlink(out_2ch_sine_path)
        self.assertEqual(x_2ch_sine_load.size(), (2, num_frames))
        l1_error = x_2ch_sine_load.sub(x_2ch_sine[:, offset:(offset + num_frames)]).abs().sum().item()
        self.assertEqual(l1_error, 0.)

        # test with two channel mp3
        x_2ch_full, sr_2ch = torchaudio.load(self.test_filepath, normalization=True)
        x_2ch_part, _ = torchaudio.load(self.test_filepath, normalization=True, num_frames=num_frames, offset=offset)
        l1_error = x_2ch_full[:, offset:(offset + num_frames)].sub(x_2ch_part).abs().sum().item()
        self.assertEqual(x_2ch_part.size(1), num_frames)
        self.assertEqual(l1_error, 0.)

        # check behavior if number of samples would exceed file length
        offset_ns = 300
        x_ns, _ = torchaudio.load(input_sine_path, num_frames=100000, offset=offset_ns)
        self.assertEqual(x_ns.size(1), x_sine_full.size(1) - offset_ns)

        # check when offset is beyond the end of the file
        with self.assertRaises(RuntimeError):
            torchaudio.load(input_sine_path, offset=100000)

David Pollack's avatar
David Pollack committed
269
    def test_5_get_info(self):
        """Run the ``torchaudio.info`` check against each backend.

        Each backend runs in its own labelled sub-test so that a failure
        report names the backend that failed.
        """
        for backend in BACKENDS:
            # these checks are not run against the 'sox_io' backend
            if backend == 'sox_io':
                continue
            with self.subTest(backend=backend):
                torchaudio.set_audio_backend(backend)
                self._test_5_get_info()
Vincent QB's avatar
Vincent QB committed
276
277

    def _test_5_get_info(self):
        """Check the metadata ``torchaudio.info`` reports for ``assets/sinewave.wav``.

        Expects 1 channel, 64000 samples, a rate of 16000 on the first
        returned object and ``bits_per_sample`` of 16 on the second.
        """
        wav_path = os.path.join(self.test_dirpath, 'assets', 'sinewave.wav')
        sig, enc = torchaudio.info(wav_path)

        expected_channels = 1
        expected_samples = 64000
        expected_rate = 16000
        expected_precision = 16

        self.assertEqual(sig.channels, expected_channels)
        self.assertEqual(sig.length, expected_samples)
        self.assertEqual(sig.rate, expected_rate)
        self.assertEqual(enc.bits_per_sample, expected_precision)