From 3b6ce04332245e4c87bfec1896b26e403882f887 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Eren=20G=C3=B6lge?=
Date: Mon, 15 Feb 2021 13:02:29 +0100
Subject: [PATCH] Update TTS/bin/find_unique_chars.py
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Co-authored-by: Jörg Thalheim
---
 TTS/bin/find_unique_chars.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/TTS/bin/find_unique_chars.py b/TTS/bin/find_unique_chars.py
index 654a3ff9..f9b6827b 100644
--- a/TTS/bin/find_unique_chars.py
+++ b/TTS/bin/find_unique_chars.py
@@ -35,13 +35,13 @@ def main():
     preprocessor = get_preprocessor_by_name(args.dataset)
     items = preprocessor(os.path.dirname(args.meta_file), os.path.basename(args.meta_file))
 
-    texts = " ".join([item[0] for item in items])
+    texts = "".join(item[0] for item in items)
     chars = set(texts)
-    lower_chars = set(texts.lower())
+    lower_chars = filter(lambda c: c.islower(), chars)
     print(f" > Number of unique characters: {len(chars)}")
     print(f" > Unique characters: {''.join(sorted(chars))}")
     print(f" > Unique lower characters: {''.join(sorted(lower_chars))}")
 
 
 if __name__ == "__main__":
-    main()
\ No newline at end of file
+    main()