Add RMS based norm in save_wav method

2022-04-21 08:26:27 -03:00 · 2022-04-21 08:26:27 -03:00 · 21cbfe964e
parent bb7a645e7a
commit 21cbfe964e
2 changed files with 7 additions and 2 deletions
--- a/TTS/server/server.py
+++ b/TTS/server/server.py
@ -111,7 +111,8 @@ synthesizer = Synthesizer(
    use_cuda=args.use_cuda,
 )

-use_multi_speaker = hasattr(synthesizer.tts_model, "num_speakers") and synthesizer.tts_model.num_speakers > 1
+use_multi_speaker = hasattr(synthesizer.tts_model, "num_speakers") and (synthesizer.tts_model.num_speakers > 1 or synthesizer.tts_speakers_file is not None)
+print("Multispeaker?", use_multi_speaker, synthesizer.tts_model.num_speakers)
 speaker_manager = getattr(synthesizer.tts_model, "speaker_manager", None)
 # TODO: set this from SpeakerManager
 use_gst = synthesizer.tts_config.get("use_gst", False)
--- a/TTS/utils/audio.py
+++ b/TTS/utils/audio.py
@ -859,7 +859,11 @@ class AudioProcessor(object):
            path (str): Path to a output file.
            sr (int, optional): Sampling rate used for saving to the file. Defaults to None.
        """
-        wav_norm = wav * (32767 / max(0.01, np.max(np.abs(wav))))
+        if self.do_rms_norm:
+            wav_norm = self.rms_volume_norm(wav, self.db_level) * 32767
+        else:
+            wav_norm = wav * (32767 / max(0.01, np.max(np.abs(wav))))
+
        scipy.io.wavfile.write(path, sr if sr else self.sample_rate, wav_norm.astype(np.int16))

    def get_duration(self, filename: str) -> float: