diff --git a/TTS/bin/synthesize.py b/TTS/bin/synthesize.py index 40852bdf..bd8a73f2 100644 --- a/TTS/bin/synthesize.py +++ b/TTS/bin/synthesize.py @@ -37,6 +37,9 @@ def tts(model, vocoder_model, text, CONFIG, use_cuda, ap, use_gl, speaker_fileid if CONFIG.model == "Tacotron" and not use_gl: mel_postnet_spec = ap.out_linear_to_mel(mel_postnet_spec.T).T if not use_gl: + beta = np.linspace(1e-6, 0.01, 50) + vocoder_model.compute_noise_level(beta) + device_type = "cuda" if use_cuda else "cpu" waveform = vocoder_model.inference(torch.FloatTensor(mel_postnet_spec.T).to(device_type).unsqueeze(0)) if use_cuda and not use_gl: