From 62054da8f147280dd5eddd1daa803807783a7588 Mon Sep 17 00:00:00 2001 From: Eren G Date: Mon, 30 Jul 2018 13:51:25 +0200 Subject: [PATCH] load audio change --- datasets/LJSpeech.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/datasets/LJSpeech.py b/datasets/LJSpeech.py index 69aff0e0..377855dc 100644 --- a/datasets/LJSpeech.py +++ b/datasets/LJSpeech.py @@ -30,7 +30,7 @@ class MyDataset(Dataset): def load_wav(self, filename): try: - audio = librosa.core.load(filename, sr=self.sample_rate) + audio = librosa.core.load(filename, sr=self.sample_rate)[0] return audio except RuntimeError as e: print(" !! Cannot read file : {}".format(filename)) @@ -65,7 +65,7 @@ class MyDataset(Dataset): text = self.frames[idx][1] text = np.asarray(text_to_sequence( text, [self.cleaners]), dtype=np.int32) - wav = np.asarray(self.load_wav(wav_name)[0], dtype=np.float32) + wav = np.asarray(self.load_wav(wav_name), dtype=np.float32) sample = {'text': text, 'wav': wav, 'item_idx': self.frames[idx][0]} return sample