sam-accenture model preprocessor

2021-04-01 03:41:41 +02:00 · 2021-04-01 03:41:41 +02:00 · e84f120a04
parent e3c052382b
commit e84f120a04
1 changed files with 19 additions and 2 deletions
--- a/TTS/tts/datasets/preprocess.py
+++ b/TTS/tts/datasets/preprocess.py
@ -1,12 +1,12 @@
 import os
-from glob import glob
 import re
 import sys
+import xml.etree.ElementTree as ET
+from glob import glob
 from pathlib import Path
 from typing import List

 from tqdm import tqdm
-
 from TTS.tts.utils.generic_utils import split_dataset

 ####################
@ -168,6 +168,23 @@ def ljspeech(root_path, meta_file):
    return items


+def sam_accenture(root_path, meta_file):
+    """Normalizes the sam-accenture meta data file to TTS format
+    https://github.com/Sam-Accenture-Non-Binary-Voice/non-binary-voice-files"""
+    xml_file = os.path.join(root_path, 'voice_over_recordings', meta_file)
+    xml_root = ET.parse(xml_file).getroot()
+    items = []
+    speaker_name = "sam_accenture"
+    for item in xml_root.findall('./fileid'):
+        text = item.text
+        wav_file = os.path.join(root_path, 'vo_voice_quality_transformation', item.get('id')+'.wav')
+        if not os.path.exists(wav_file):
+            print(f' [!] {wav_file} in metafile does not exist. Skipping...')
+            continue
+        items.append([text, wav_file, speaker_name])
+    return items
+
+
 def ruslan(root_path, meta_file):
    """Normalizes the RUSLAN meta data file to TTS format
    https://ruslan-corpus.github.io/"""