From 657c5442e5339581e5c09168f5212112a342d97a Mon Sep 17 00:00:00 2001
From: Edresson Casanova
Date: Thu, 28 Apr 2022 15:40:16 -0300
Subject: [PATCH] Remove audio padding before mel spec extraction

---
 TTS/vocoder/datasets/gan_dataset.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/TTS/vocoder/datasets/gan_dataset.py b/TTS/vocoder/datasets/gan_dataset.py
index 08fdb0a3..a782067e 100644
--- a/TTS/vocoder/datasets/gan_dataset.py
+++ b/TTS/vocoder/datasets/gan_dataset.py
@@ -115,8 +115,8 @@ class GANDataset(Dataset):
                 audio, mel = self.cache[idx]
             else:
                 audio = self.ap.load_wav(wavpath)
-                audio, _ = self._pad_short_samples(audio)
                 mel = self.ap.melspectrogram(audio)
+                audio, mel = self._pad_short_samples(audio, mel)
         else:

             # load precomputed features