diff --git a/models/tacotron.py b/models/tacotron.py index c27656da..532db6b8 100644 --- a/models/tacotron.py +++ b/models/tacotron.py @@ -14,10 +14,11 @@ class Tacotron(nn.Module): self.linear_dim = linear_dim self.embedding = nn.Embedding(len(symbols), embedding_dim, padding_idx=padding_idx) - print(" | > Number of characted : {}".format(len(symbols))) + print(" | > Number of characters : {}".format(len(symbols))) self.embedding.weight.data.normal_(0, 0.3) self.encoder = Encoder(embedding_dim) self.decoder = Decoder(256, mel_dim, r) + self.stopnet = nn.Sequential(nn.Linear(80, 1), nn.Sigmoid()) self.postnet = CBHG(mel_dim, K=8, projections=[256, mel_dim]) self.last_linear = nn.Linear(mel_dim * 2, linear_dim) @@ -32,6 +33,7 @@ class Tacotron(nn.Module): # Reshape # batch x time x dim mel_outputs = mel_outputs.view(B, -1, self.mel_dim) + stop_tokens = self.stopnet(mel_outputs) linear_outputs = self.postnet(mel_outputs) linear_outputs = self.last_linear(linear_outputs) - return mel_outputs, linear_outputs, alignments + return mel_outputs, linear_outputs, alignments, stop_tokens