fix synthesize.py

2020-02-19 18:24:02 +01:00 · 2020-02-19 18:24:02 +01:00 · e540a54959
parent f8ebf6abcd
commit e540a54959
1 changed file with 7 additions and 5 deletions
--- a/synthesize.py
+++ b/synthesize.py
@@ -25,14 +25,16 @@ def tts(model,
    t_1 = time.time()
    use_vocoder_model = vocoder_model is not None
    waveform, alignment, _, postnet_output, stop_tokens = synthesis(
-        model, text, C, use_cuda, ap, speaker_id, False,
-        C.enable_eos_bos_chars)
+        model, text, C, use_cuda, ap, speaker_id, style_wav=False,
+        truncated=False, enable_eos_bos_chars=C.enable_eos_bos_chars,
+        use_griffin_lim=(not use_vocoder_model), do_trim_silence=True)
+
    if C.model == "Tacotron" and use_vocoder_model:
        postnet_output = ap.out_linear_to_mel(postnet_output.T).T
    # correct if there is a scale difference b/w two models
-    postnet_output = ap._denormalize(postnet_output)
-    postnet_output = ap_vocoder._normalize(postnet_output)
    if use_vocoder_model:
+        postnet_output = ap._denormalize(postnet_output)
+        postnet_output = ap_vocoder._normalize(postnet_output)
        vocoder_input = torch.FloatTensor(postnet_output.T).unsqueeze(0)
        waveform = vocoder_model.generate(
            vocoder_input.cuda() if use_cuda else vocoder_input,
@@ -58,7 +60,7 @@ if __name__ == "__main__":
    parser.add_argument(
        'out_path',
        type=str,
-        help='Path to save final wav file.',
+        help='Path to save final wav file. Wav file will be names as the text given.',
    )
    parser.add_argument('--use_cuda',
                        type=bool,