css10 dataset preprocessor

2021-02-09 15:11:26 +00:00 · 2021-02-09 15:11:26 +00:00 · 29d928d531
parent a2e7403ae8
commit 29d928d531
1 changed files with 14 additions and 0 deletions
--- a/TTS/tts/datasets/preprocess.py
+++ b/TTS/tts/datasets/preprocess.py
@@ -166,6 +166,20 @@ def ljspeech(root_path, meta_file):
    return items


+def css10(root_path, meta_file):
+    """Normalizes the CSS10 dataset file to TTS format.
+
+    Every non-blank line of the metadata file is split on ``|``. The first
+    column is used as the wav path (relative to ``root_path``) and the
+    second column as the text; any further columns are ignored.
+
+    Args:
+        root_path (str): dataset root directory. It is joined with
+            ``meta_file`` and with the wav path of every entry.
+        meta_file (str): metadata file name, relative to ``root_path``.
+
+    Returns:
+        list: one ``[text, wav_file, speaker_name]`` entry per metadata line.
+
+    Raises:
+        IndexError: if a non-blank line has no ``|`` separator.
+    """
+    txt_file = os.path.join(root_path, meta_file)
+    items = []
+    # Label the samples with this dataset's own name, not "ljspeech".
+    speaker_name = "css10"
+    # Decode explicitly as UTF-8 so that non-ASCII transcripts do not depend
+    # on the platform's default encoding.
+    with open(txt_file, 'r', encoding='utf-8') as ttf:
+        for line in ttf:
+            # Tolerate blank lines (e.g. a trailing empty line) in the file.
+            if not line.strip():
+                continue
+            # Drop the line terminator so it cannot end up inside the text
+            # when the text is the last column of the line.
+            cols = line.rstrip('\n').split('|')
+            wav_file = os.path.join(root_path, cols[0])
+            text = cols[1]
+            items.append([text, wav_file, speaker_name])
+    return items
+
+
 def nancy(root_path, meta_file):
    """Normalizes the Nancy meta data file to TTS format"""
    txt_file = os.path.join(root_path, meta_file)