From 78c3897599d415d9312f57d61fde715feacef595 Mon Sep 17 00:00:00 2001 From: Thomas Werkmeister Date: Tue, 23 Jul 2019 09:47:52 +0200 Subject: [PATCH] root path speaker matching added data root path in speaker matching for mailabs, this way you don't need to start at the very bottom of the folder hierarchy if you want to explicitly define metafiles. --- datasets/preprocess.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/datasets/preprocess.py b/datasets/preprocess.py index 9dd7a610..a3701c4d 100644 --- a/datasets/preprocess.py +++ b/datasets/preprocess.py @@ -82,14 +82,14 @@ def mailabs(root_path, meta_files=None): # meta_files = [f.strip() for f in meta_files.split(",")] items = [] for idx, csv_file in enumerate(csv_files): + txt_file = os.path.join(root_path, csv_file) # determine speaker based on folder structure... - speaker_name_match = speaker_regex.search(csv_file) + speaker_name_match = speaker_regex.search(txt_file) if speaker_name_match is None: continue speaker_name = speaker_name_match.group("speaker_name") print(" | > {}".format(csv_file)) folder = folders[idx] - txt_file = os.path.join(root_path, csv_file) with open(txt_file, 'r') as ttf: for line in ttf: cols = line.split('|')