From 7dfd753d91689888e660b1ca596649faca530090 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Eren=20G=C3=B6lge?= Date: Sat, 5 Feb 2022 20:34:17 +0100 Subject: [PATCH] Add a cheap trick to avoid short audio clips --- TTS/tts/datasets/dataset.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/TTS/tts/datasets/dataset.py b/TTS/tts/datasets/dataset.py index 499e6b7b..af726818 100644 --- a/TTS/tts/datasets/dataset.py +++ b/TTS/tts/datasets/dataset.py @@ -229,7 +229,8 @@ class TTSDataset(Dataset): # after phonemization the text length may change # this is a shareful 🤭 hack to prevent longer phonemes # TODO: find a better fix - if len(token_ids) > self.max_text_len: + if len(token_ids) > self.max_text_len or len(wav) < self.min_audio_len: + self.rescue_item_idx += 1 return self.load_data(self.rescue_item_idx) # get f0 values