From 6eaecab0ca543b92b7bc23c3d51d2619448a6120 Mon Sep 17 00:00:00 2001 From: Aya Jafari Date: Tue, 10 Oct 2023 23:02:31 -0300 Subject: [PATCH] Fix FastPitch synthesis: cast g to long, squeeze o_en --- TTS/tts/models/forward_tts.py | 3 +++ 1 file changed, 3 insertions(+) diff --git a/TTS/tts/models/forward_tts.py b/TTS/tts/models/forward_tts.py index 6d1e90ca..8dfc6c03 100644 --- a/TTS/tts/models/forward_tts.py +++ b/TTS/tts/models/forward_tts.py @@ -395,6 +395,7 @@ class ForwardTTS(BaseTTS): - x_mask: :math:`(B, 1, T_{en})` - g: :math:`(B, C)` """ + g = g.type(torch.LongTensor) if hasattr(self, "emb_g"): g = self.emb_g(g) # [B, C, 1] if g is not None: @@ -683,9 +684,11 @@ class ForwardTTS(BaseTTS): # encoder pass o_en, x_mask, g, _ = self._forward_encoder(x, x_mask, g) # duration predictor pass + o_en = o_en.squeeze() o_dr_log = self.duration_predictor(o_en, x_mask) o_dr = self.format_durations(o_dr_log, x_mask).squeeze(1) y_lengths = o_dr.sum(1) + # pitch predictor pass o_pitch = None if self.args.use_pitch: