Fix AudioEffector for mulaw (#3372)

Summary: When encoding audio with mulaw, the resulting data does not have header, and the StreamReader defaults to 16k Hz, which can strech/shrink the resulting waveform. Pull Request resolved: https://github.com/pytorch/audio/pull/3372 Reviewed By: hwangjeff Differential Revision: D46234772 Pulled By: mthrok fbshipit-source-id: 942c89a8cfe29b0b6f57b3e5b6c9dfd3524ca552

Fix AudioEffector for mulaw (#3372)
Summary: When encoding audio with mulaw, the resulting data does not have header, and the StreamReader defaults to 16k Hz, which can strech/shrink the resulting waveform. Pull Request resolved: https://github.com/pytorch/audio/pull/3372 Reviewed By: hwangjeff Differential Revision: D46234772 Pulled By: mthrok fbshipit-source-id: 942c89a8cfe29b0b6f57b3e5b6c9dfd3524ca552
af932cc7 · moto · Facebook GitHub Bot · 1b05ca7e · af932cc7 · af932cc7
Commit af932cc7 authored May 26, 2023 by moto Committed by Facebook GitHub Bot May 26, 2023
Show whitespace changes
Inline Side-by-side

Showing with 9 additions and 2 deletions

test/torchaudio_unittest/io/effector_test.py test/torchaudio_unittest/io/effector_test.py +5 -2

torchaudio/io/_effector.py torchaudio/io/_effector.py +4 -0

No files found.
--- a/test/torchaudio_unittest/io/effector_test.py
+++ b/test/torchaudio_unittest/io/effector_test.py
@@ -30,14 +30,17 @@ class EffectorTest(TorchaudioTestCase):
            ("ogg", "flac"),  # flac only supports s16 and s32
            ("ogg", "opus"),  # opus only supports 48k Hz
            ("ogg", "vorbis"),  # vorbis only supports stereo
+            # ("ogg", "vorbis", 44100),
+            # this fails with small descrepancy; 441024 vs 441000
+            # TODO: investigate
            ("wav", None),
            ("wav", "pcm_u8"),
            ("mp3", None),
+            ("mulaw", None, 44100),  # mulaw is encoded without header
        ]
    )
-    def test_formats(self, format, encoder):
+    def test_formats(self, format, encoder, sample_rate=8000):
        """Formats (some with restrictions) just work without an issue in effector"""
-        sample_rate = 8000

        effector = AudioEffector(format=format, encoder=encoder)
        original = get_sinusoid(n_channels=3, sample_rate=sample_rate, channels_first=False)

--- a/torchaudio/io/_effector.py
+++ b/torchaudio/io/_effector.py
@@ -267,6 +267,10 @@ class AudioEffector:
            muxer = self.format
            encoder = self.encoder
            option = {}
+            # Some formats are headerless, so need to provide these infomation.
+            if self.format == "mulaw":
+                option = {"sample_rate": f"{sample_rate}", "channels": f"{num_channels}"}
+
        else:  # PCM
            muxer = _get_muxer(waveform.dtype)
            encoder = None