From f673f8f74dd343889b6b81658e09fb61e33700ea Mon Sep 17 00:00:00 2001 From: Thorsten Mueller Date: Sat, 19 Dec 2020 22:51:22 +0100 Subject: [PATCH] Added support for npy output from tune-wavegrad --- TTS/bin/synthesize.py | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/TTS/bin/synthesize.py b/TTS/bin/synthesize.py index bd8a73f2..12ff4d30 100644 --- a/TTS/bin/synthesize.py +++ b/TTS/bin/synthesize.py @@ -37,8 +37,13 @@ def tts(model, vocoder_model, text, CONFIG, use_cuda, ap, use_gl, speaker_fileid if CONFIG.model == "Tacotron" and not use_gl: mel_postnet_spec = ap.out_linear_to_mel(mel_postnet_spec.T).T if not use_gl: + # Default linear noise schedule; use it when no schedule has been computed with tune_wavegrad beta = np.linspace(1e-6, 0.01, 50) vocoder_model.compute_noise_level(beta) + + # Alternative: load the noise schedule from the npy file written by tune_wavegrad + # beta = np.load("output-tune-wavegrad.npy", allow_pickle=True).item() + # vocoder_model.compute_noise_level(beta['beta']) device_type = "cuda" if use_cuda else "cpu" waveform = vocoder_model.inference(torch.FloatTensor(mel_postnet_spec.T).to(device_type).unsqueeze(0))