diff --git a/TTS/tts/models/vits.py b/TTS/tts/models/vits.py index 7500da61..f91115be 100644 --- a/TTS/tts/models/vits.py +++ b/TTS/tts/models/vits.py @@ -130,6 +130,7 @@ def wav_to_spec(y, n_fft, hop_length, win_length, center=False): pad_mode="reflect", normalized=False, onesided=True, + return_complex=False, ) spec = torch.sqrt(spec.pow(2).sum(-1) + 1e-6) @@ -197,6 +198,7 @@ def wav_to_mel(y, n_fft, num_mels, sample_rate, hop_length, win_length, fmin, fm pad_mode="reflect", normalized=False, onesided=True, + return_complex=False, ) spec = torch.sqrt(spec.pow(2).sum(-1) + 1e-6)