mirror of https://github.com/coqui-ai/TTS.git
add mozilla preprocessor
This commit is contained in:
parent
5a91db56cc
commit
a60c9ee47d
|
@ -42,6 +42,30 @@ def tweb(root_path, meta_file):
|
||||||
# return {'text': texts, 'wavs': wavs}
|
# return {'text': texts, 'wavs': wavs}
|
||||||
|
|
||||||
|
|
||||||
|
def mozilla(root_path, meta_files):
    """Normalizes Mozilla meta data files to TTS format

    Every ``batch*.txt`` file found at any depth below ``root_path`` is read
    line by line. Each line is expected to look like ``<text>|<wav name>``;
    the wav file is looked up in the ``wavs_no_processing`` folder that sits
    next to the batch file. Lines whose wav file does not exist, or that do
    not contain a ``|`` separator, are reported on stdout and skipped.

    Args:
        root_path (str): Dataset root. May be absolute or relative and may
            or may not end with a path separator.
        meta_files: Ignored. The batch files are always discovered by
            globbing ``root_path``; the parameter is kept so the signature
            stays the same as the sibling preprocessors.

    Returns:
        list: ``[text, wav_file]`` pairs in random order.
    """
    # Local import: `glob` is only needed by this preprocessor.
    import glob

    # Build the pattern with os.path.join so that "**" is always its own path
    # component; otherwise a root without a trailing separator turns the
    # pattern into "<root>**/..." which glob does not treat as recursive.
    pattern = os.path.join(root_path, "**", "batch*.txt")
    batch_files = glob.glob(pattern, recursive=True)

    items = []
    for batch_file in batch_files:
        print(" | > {}".format(batch_file))
        # Paths returned by glob already start with root_path, so it must not
        # be joined in a second time (that breaks relative roots).
        wav_dir = os.path.join(os.path.dirname(batch_file), 'wavs_no_processing')
        with open(batch_file, 'r', encoding='utf-8') as ttf:
            for line in ttf:
                if not line.strip():
                    # Blank lines carry no entry; nothing to report.
                    continue
                cols = line.split('|')
                if len(cols) < 2:
                    # No separator: there is no wav column to look up.
                    print(" > Error: {}".format(line.strip()))
                    continue
                wav_file = os.path.join(wav_dir, cols[1].strip())
                if os.path.isfile(wav_file):
                    items.append([cols[0].strip(), wav_file])
                else:
                    print(" > Error: {}".format(line.strip()))
    random.shuffle(items)
    return items
|
||||||
|
|
||||||
|
|
||||||
def mailabs(root_path, meta_files):
|
def mailabs(root_path, meta_files):
|
||||||
"""Normalizes M-AI-Labs meta data files to TTS format"""
|
"""Normalizes M-AI-Labs meta data files to TTS format"""
|
||||||
folders = [os.path.dirname(f.strip()) for f in meta_files.split(",")]
|
folders = [os.path.dirname(f.strip()) for f in meta_files.split(",")]
|
||||||
|
|
Loading…
Reference in New Issue