mirror of https://github.com/coqui-ai/TTS.git
Update comments
This commit is contained in:
parent 7c2cb7cc30
commit 0e768dd4c5
@@ -410,11 +410,6 @@ class TacotronLoss(torch.nn.Module):
             return_dict["postnet_ssim_loss"] = postnet_ssim_loss
 
         return_dict["loss"] = loss
-
-        # check if any loss is NaN
-        for key, loss in return_dict.items():
-            if torch.isnan(loss):
-                raise RuntimeError(f" [!] NaN loss with {key}.")
         return return_dict
 
 
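For context, the lines removed above guarded against NaN loss terms. Below is a minimal standalone sketch of the same guard, applied from a training loop instead of inside TacotronLoss.forward(); check_finite_losses is a hypothetical helper name, not part of this repository.

import torch


def check_finite_losses(return_dict):
    # Hypothetical helper mirroring the removed guard: raise as soon as
    # any reported loss term contains NaN.
    for key, loss in return_dict.items():
        if torch.is_tensor(loss) and torch.isnan(loss).any():
            raise RuntimeError(f" [!] NaN loss with {key}.")
    return return_dict

With the check gone from the loss module, a caller that still wants the fail-fast behaviour can wrap the criterion output this way.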
@@ -126,27 +126,24 @@ class GravesAttention(nn.Module):
 
 
 class OriginalAttention(nn.Module):
-    """Bahdanau Attention with various optional modifications. Proposed below.
+    """Bahdanau Attention with various optional modifications.
     - Location sensitive attnetion: https://arxiv.org/abs/1712.05884
     - Forward Attention: https://arxiv.org/abs/1807.06736 + state masking at inference
     - Using sigmoid instead of softmax normalization
     - Attention windowing at inference time
 
     Note:
-        Location Sensitive Attention is an attention mechanism that extends the additive attention mechanism
-        to use cumulative attention weights from previous decoder time steps as an additional feature.
+        Location Sensitive Attention extends the additive attention mechanism
+        to use cumulative attention weights from previous decoder time steps with the current time step features.
 
-        Forward attention considers only the alignment paths that satisfy the monotonic condition at each
-        decoder timestep. The modified attention probabilities at each timestep are computed recursively
-        using a forward algorithm.
+        Forward attention computes most probable monotonic alignment. The modified attention probabilities at each
+        timestep are computed recursively by the forward algorithm.
 
-        Transition agent for forward attention is further proposed, which helps the attention mechanism
-        to make decisions whether to move forward or stay at each decoder timestep.
+        Transition agent in the forward attention explicitly gates the attention mechanism whether to move forward or
+        stay at each decoder timestep.
 
-        Attention windowing applies a sliding windows to time steps of the input tensor centering at the last
-        time step with the largest attention weight. It is especially useful at inference to keep the attention
-        alignment diagonal.
+        Attention windowing is a inductive prior that prevents the model from attending to previous and future timesteps
+        beyond a certain window.
 
     Args:
         query_dim (int): number of channels in the query tensor.
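To make the docstring's "computed recursively by the forward algorithm" note concrete, here is a minimal PyTorch sketch of one forward-attention update with a transition agent, loosely following the paper linked in the docstring (https://arxiv.org/abs/1807.06736). Shapes and names are illustrative only, not the exact implementation in this class.

import torch
import torch.nn.functional as F


def forward_attention_step(alignment, prev_alpha, transition_p):
    # alignment:    (B, T_in) normalized attention weights for the current decoder step
    # prev_alpha:   (B, T_in) forward variables from the previous decoder step
    # transition_p: (B, 1)    transition-agent probability of advancing one input step
    # "move forward" path: shift the previous forward variables right by one position
    shifted = F.pad(prev_alpha, (1, 0))[:, :-1]
    # monotonic recursion: either stay at the same input step or advance by exactly one
    alpha = ((1.0 - transition_p) * prev_alpha + transition_p * shifted + 1e-8) * alignment
    # renormalize so the forward variables remain a valid distribution
    return alpha / alpha.sum(dim=1, keepdim=True)

The windowing described above can be sketched the same way: mask the alignment to a fixed band around the previous argmax before normalization, which keeps inference alignments near-diagonal.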
@@ -2,7 +2,7 @@ from TTS.tts.utils.text.symbols import make_symbols, parse_symbols
 from TTS.utils.generic_utils import find_module
 
 
-def setup_model(config):
+def setup_model(config, speaker_manager: "SpeakerManager" = None):
     print(" > Using model: {}".format(config.model))
     # fetch the right model implementation.
     if "base_model" in config and config["base_model"] is not None:
@@ -31,7 +31,7 @@ def setup_model(config):
         config.model_params.num_chars = num_chars
     if "model_args" in config:
         config.model_args.num_chars = num_chars
-    model = MyModel(config)
+    model = MyModel(config, speaker_manager=speaker_manager)
     return model
 
 
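A hedged usage sketch for the new signature. The import paths and constructor call below are assumptions for illustration and may differ from the actual codebase; since the new argument defaults to None, existing setup_model(config) calls keep working unchanged.

# illustrative only; import paths and SpeakerManager arguments are assumptions
from TTS.tts.utils.speakers import SpeakerManager  # assumed location of SpeakerManager
from TTS.tts.models import setup_model             # assumed location of setup_model

# config: a loaded TTS config object, prepared elsewhere
speaker_manager = SpeakerManager()                            # optionally load speaker ids / d-vectors here
model = setup_model(config, speaker_manager=speaker_manager)  # multi-speaker path
model = setup_model(config)                                   # single-speaker path; speaker_manager defaults to None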