From 92fa988aecc2937ac11927e7f0758bc94ee79ded Mon Sep 17 00:00:00 2001 From: Eren Gölge Date: Mon, 13 Nov 2023 13:44:06 +0100 Subject: [PATCH] Fixup --- TTS/tts/models/xtts.py | 3 --- 1 file changed, 3 deletions(-) diff --git a/TTS/tts/models/xtts.py b/TTS/tts/models/xtts.py index 0f79ad69..b277c3ac 100644 --- a/TTS/tts/models/xtts.py +++ b/TTS/tts/models/xtts.py @@ -369,11 +369,8 @@ class Xtts(BaseTTS): audios = [] speaker_embedding = None for file_path in audio_paths: - # load the audio in 24khz to avoid issued with multiple sr references audio = load_audio(file_path, load_sr) audio = audio[:, : load_sr * max_ref_length].to(self.device) - if audio.shape[0] > 1: - audio = audio.mean(0, keepdim=True) if sound_norm_refs: audio = (audio / torch.abs(audio).max()) * 0.75 if librosa_trim_db is not None: