modify according to PR reviews

2021-02-16 17:25:18 +01:00 · 2021-02-16 17:25:18 +01:00 · 9ab07f94e2
parent 42ba30eb8f
commit 9ab07f94e2
4 changed files with 10 additions and 6 deletions
--- a/TTS/tts/datasets/preprocess.py
+++ b/TTS/tts/datasets/preprocess.py
@@ -372,10 +372,15 @@ def _voxcel_x(root_path, meta_file, voxcel_idx):
 def baker(root_path: str, meta_file: str) ->  List[List[str]]:
    """Normalizes the Baker meta data file to TTS format
-# ======================================== Baker (chinese mandarin single speaker) ===========================================
+    Args:
-def baker(root_path, meta_file):
+        root_path (str): path to the baker dataset
-    """Normalizes the Baker meta data file to TTS format"""
+        meta_file (str): name of the meta dataset containing names of wav to select and the transcript of the sentence  
    Returns:
        List[List[str]]: List of (text, wav_path, speaker_name) associated with each sentences
    """
    txt_file = os.path.join(root_path, meta_file)
    items = []
    speaker_name = "baker"
--- a/TTS/tts/utils/chinese_mandarin/numbers.py
+++ b/TTS/tts/utils/chinese_mandarin/numbers.py
@@ -105,7 +105,7 @@ def _num2chinese(num :str, big=False, simp=True, o=False, twoalt=False) -> str:
-def _number_replace(match) -> str:
+def _number_replace(match: re.Match) -> str:
    """function to apply in a match, transform all numbers in a match by chinese characters
    Args:
--- a/TTS/tts/utils/synthesis.py
+++ b/TTS/tts/utils/synthesis.py
@@ -220,7 +220,6 @@ def synthesis(model,
                model outputs.
            speaker_id (int): id of speaker
            style_wav (str | Dict[str, float]): Uses for style embedding of GST.
            style_wav (str): Uses for style embedding of GST.
            truncated (bool): keep model states after inference. It can be used
                for continuous inference at long texts.
            enable_eos_bos_chars (bool): enable special chars for end of sentence and start of sentence.
--- a/TTS/utils/synthesizer.py
+++ b/TTS/utils/synthesizer.py
@@ -127,7 +127,7 @@ class Synthesizer(object):
        gst_style_input = None
        if self.tts_config.use_gst:
            if self.tts_config.gst["gst_style_input"] not in ["", {}]:
-                style_wav = self.tts_config.gst["gst_style_input"]
+                gst_style_input = self.tts_config.gst["gst_style_input"]
        for sen in sens:
            # synthesize voice