data loader fix

2018-03-22 14:06:33 -07:00 · 2018-03-22 14:06:33 -07:00 · b1beb1f876
parent 33937f54d0
commit b1beb1f876
1 changed file with 7 additions and 7 deletions
--- a/datasets/LJSpeech.py
+++ b/datasets/LJSpeech.py
@@ -98,6 +98,12 @@ class LJSpeechDataset(Dataset):
            mel = [self.ap.melspectrogram(w).astype('float32') for w in wav]
            mel_lengths = [m.shape[1] for m in mel]
            # compute 'stop token' targets
            stop_targets = [np.array([0.]*mel_len) for mel_len in mel_lengths]
            # PAD stop targets
            stop_targets = prepare_stop_target(stop_targets, self.outputs_per_step)
            # PAD sequences with largest length of the batch
            text = prepare_data(text).astype(np.int32)
            wav = prepare_data(wav)
@@ -121,12 +127,6 @@ class LJSpeechDataset(Dataset):
            # update mel lengths
            mel_lengths = [l+pad_len for l in mel_lengths]
            # compute 'stop token' targets
            stop_targets = [np.array([0.]*mel_len) for mel_len in mel_lengths]
            # PAD stop targets
            stop_targets = prepare_stop_target(stop_targets, self.outputs_per_step)
            # B x T x D
            linear = linear.transpose(0, 2, 1)
            mel = mel.transpose(0, 2, 1)