Fixes #1314 (#1316)

457148ea · Vincent QB · GitHub · 49860425 · 457148ea · 457148ea
Unverified Commit 457148ea authored Feb 26, 2021 by Vincent QB Committed by GitHub Feb 26, 2021
Showing with 26 additions and 8 deletions

docs/source/functional.rst docs/source/functional.rst +10 -0

docs/source/transforms.rst docs/source/transforms.rst +7 -0

torchaudio/functional/functional.py torchaudio/functional/functional.py +9 -8

No files found.
--- a/docs/source/functional.rst
+++ b/docs/source/functional.rst
@@ -208,3 +208,13 @@ vad
 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
 .. autofunction:: compute_kaldi_pitch
+:hidden:`spectral_centroid`
+~~~~~~~~~~~~~~~~~~~~~~~~~~~~
+.. autofunction:: spectral_centroid
+:hidden:`apply_codec`
+~~~~~~~~~~~~~~~~~~~~~~~~~~~~
+.. autofunction:: apply_codec
--- a/docs/source/transforms.rst
+++ b/docs/source/transforms.rst
@@ -136,6 +136,13 @@ Transforms are common audio transforms. They can be chained together using :clas
  .. automethod:: forward
+:hidden:`SpectralCentroid`
+~~~~~~~~~~~~~~~~~~~~~~~~~~~~~
+.. autoclass:: SpectralCentroid
+  .. automethod:: forward
 :hidden:`Vad`
 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~

--- a/torchaudio/functional/functional.py
+++ b/torchaudio/functional/functional.py
@@ -1011,24 +1011,25 @@ def apply_codec(
    bits_per_sample: Optional[int] = None,
 ) -> Tensor:
    r"""
-    Applies codecs as a form of augmentation
+    Apply codecs as a form of augmentation.
    Args:
-        waveform (Tensor): Audio data. Must be 2 dimensional. See also ```channels_first```
+        waveform (Tensor): Audio data. Must be 2 dimensional. See also ``channels_first``.
-        sample_rate (int): Sample rate of the audio waveform
+        sample_rate (int): Sample rate of the audio waveform.
-        format (str): file format
+        format (str): File format.
        channels_first (bool):
            When True, both the input and output Tensor have dimension ``[channel, time]``.
            Otherwise, they have dimension ``[time, channel]``.
        compression (float): Used for formats other than WAV.
-            For mor details see :py:func:`torchaudio.backend.sox_io_backend.save`
+            For more details see :py:func:`torchaudio.backend.sox_io_backend.save`.
        encoding (str, optional): Changes the encoding for the supported formats.
-            For more details see :py:func:`torchaudio.backend.sox_io_backend.save`
+            For more details see :py:func:`torchaudio.backend.sox_io_backend.save`.
        bits_per_sample (int, optional): Changes the bit depth for the supported formats.
-            For more details see :py:func:`torchaudio.backend.sox_io_backend.save`
+            For more details see :py:func:`torchaudio.backend.sox_io_backend.save`.
    Returns:
        torch.Tensor: Resulting Tensor.
-        If ``channels_first=True``, it has ``[channel, time]`` else ``[time, channel]``
+        If ``channels_first=True``, it has ``[channel, time]`` else ``[time, channel]``.
    """
    bytes = io.BytesIO()
    torchaudio.backend.sox_io_backend.save(bytes,