Update TTS/bin/find_unique_chars.py

Co-authored-by: Jörg Thalheim <Mic92@users.noreply.github.com>
This commit is contained in:
Eren Gölge 2021-02-15 13:02:29 +01:00 committed by Eren Gölge
parent 19e2193c40
commit 39fbf2fe84
1 changed file with 3 additions and 3 deletions

View File

@@ -35,13 +35,13 @@ def main():
preprocessor = get_preprocessor_by_name(args.dataset)
items = preprocessor(os.path.dirname(args.meta_file), os.path.basename(args.meta_file))
texts = " ".join([item[0] for item in items])
texts = "".join(item[0] for item in items)
chars = set(texts)
lower_chars = set(texts.lower())
lower_chars = filter(lambda c: c.islower(), chars)
print(f" > Number of unique characters: {len(chars)}")
print(f" > Unique characters: {''.join(sorted(chars))}")
print(f" > Unique lower characters: {''.join(sorted(lower_chars))}")
if __name__ == "__main__":
main()
main()