Fix vocoder interface (#1895)

57c8b97e · moto · c4fc8f90 · 57c8b97e · 57c8b97e
Commit 57c8b97e authored Oct 18, 2021 by moto
Hide whitespace changes
Inline Side-by-side

Showing 2 changed files with 4 additions and 3 deletions

torchaudio/pipelines/_tts/impl.py +2 -2

torchaudio/pipelines/_tts/interface.py +2 -1

No files found.
--- a/torchaudio/pipelines/_tts/impl.py
+++ b/torchaudio/pipelines/_tts/impl.py
@@ -83,7 +83,7 @@ class _WaveRNNVocoder(torch.nn.Module, Tacotron2TTSBundle.Vocoder):
    def sample_rate(self):
        return self._sample_rate

-    def forward(self, mel_spec, lengths):
+    def forward(self, mel_spec, lengths=None):
        mel_spec = torch.exp(mel_spec)
        mel_spec = 20 * torch.log10(torch.clamp(mel_spec, min=1e-5))
        if self._min_level_db is not None:
@@ -120,7 +120,7 @@ class _GriffinLimVocoder(torch.nn.Module, Tacotron2TTSBundle.Vocoder):
    def sample_rate(self):
        return self._sample_rate

-    def forward(self, mel_spec, lengths):
+    def forward(self, mel_spec, lengths=None):
        mel_spec = torch.exp(mel_spec)
        mel_spec = mel_spec.clone().detach().requires_grad_(True)
        spec = self._inv_mel(mel_spec)

--- a/torchaudio/pipelines/_tts/interface.py
+++ b/torchaudio/pipelines/_tts/interface.py
@@ -47,7 +47,7 @@ class _Vocoder(ABC):
        """

    @abstractmethod
-    def __call__(self, specgrams: Tensor, lengths: Optional[Tensor]) -> Tuple[Tensor, Optional[Tensor]]:
+    def __call__(self, specgrams: Tensor, lengths: Optional[Tensor] = None) -> Tuple[Tensor, Optional[Tensor]]:
        """Generate waveform from the given input, such as spectrogram

        See :func:`torchaudio.pipelines.Tacotron2TTSBundle.get_vocoder` for the usage.
@@ -58,6 +58,7 @@ class _Vocoder(ABC):
                The expected shape depends on the implementation.
            lengths (Tensor, or None, optional):
                The valid length of each sample in the batch. Shape: `(batch, )`.
+                (Default: `None`)

        Returns:
            (Tensor, Optional[Tensor]):