mirror of https://github.com/coqui-ai/TTS.git
Add preprocessor for TWEB dataset
This commit is contained in:
parent
d38872a4d0
commit
4587c72a03
|
@ -13,10 +13,20 @@ def tts_cache(root_path, meta_file):
|
||||||
return items
|
return items
|
||||||
|
|
||||||
|
|
||||||
# def tweb(root_path, meta_file):
|
def tweb(root_path, meta_file):
    """Normalize TWEB dataset.

    https://www.kaggle.com/bryanpark/the-world-english-bible-speech-dataset

    Reads the tab-separated transcript at ``root_path/meta_file``. The first
    column of each line is a wav path relative to ``root_path`` without the
    ``.wav`` extension; the second column is the spoken text. Any further
    columns are ignored.

    Args:
        root_path: Directory that contains the transcript and the wav files.
        meta_file: Transcript file name, relative to ``root_path``.

    Returns:
        A randomly shuffled list of ``[text, wav_file]`` pairs.

    Raises:
        IndexError: If a non-blank line contains no tab separator.
    """
    txt_file = os.path.join(root_path, meta_file)
    items = []
    # Explicit encoding so decoding does not depend on the platform locale.
    # NOTE(review): assumes the transcript is UTF-8 -- confirm against the
    # dataset.
    with open(txt_file, 'r', encoding='utf-8') as ttf:
        for line in ttf:
            # Drop the line terminator so it cannot leak into the text
            # column when the text is the last field on the line.
            line = line.rstrip('\r\n')
            # Blank lines (e.g. a trailing one) carry no entry; skip them
            # instead of failing on the missing text column.
            if not line.strip():
                continue
            cols = line.split('\t')
            wav_file = os.path.join(root_path, cols[0] + '.wav')
            text = cols[1]
            items.append([text, wav_file])
    random.shuffle(items)
    return items
|
||||||
|
|
||||||
|
|
||||||
# def kusal(root_path, meta_file):
|
# def kusal(root_path, meta_file):
|
||||||
|
|
Loading…
Reference in New Issue