Update capacitron_layers.py (#1664)

crashing because of dimension miss match at line no. 57 [batch, 256] vs [batch , 1, 512] enc_out = torch.cat([enc_out, speaker_embedding], dim=-1)
2022-08-15 14:38:50 +05:30 · 2022-08-15 14:38:50 +05:30 · e4db7c51b5
parent bfc63829ac
commit e4db7c51b5
1 changed files with 1 additions and 0 deletions
--- a/TTS/tts/layers/tacotron/capacitron_layers.py
+++ b/TTS/tts/layers/tacotron/capacitron_layers.py
@ -53,6 +53,7 @@ class CapacitronVAE(nn.Module):
                text_summary_out = self.text_summary_net(text_inputs, input_lengths).to(reference_mels.device)
                enc_out = torch.cat([enc_out, text_summary_out], dim=-1)
            if speaker_embedding is not None:
+                speaker_embedding = torch.squeeze(speaker_embedding)
                enc_out = torch.cat([enc_out, speaker_embedding], dim=-1)

            # Feed the output of the ref encoder and information about text/speaker into