refactor(xtts): use existing cleaners

This commit is contained in:
Enno Hermann 2024-11-22 22:08:05 +01:00
parent b45a7a4220
commit 54f4228a46
1 changed files with 1 additions and 17 deletions

View File

@ -15,6 +15,7 @@ from spacy.lang.zh import Chinese
from tokenizers import Tokenizer
from TTS.tts.layers.xtts.zh_num2words import TextNorm as zh_num2words
from TTS.tts.utils.text.cleaners import collapse_whitespace, lowercase
logger = logging.getLogger(__name__)
@ -72,8 +73,6 @@ def split_sentence(text, lang, text_split_length=250):
return text_splits
_whitespace_re = re.compile(r"\s+")
# List of (regular expression, replacement) pairs for abbreviations:
_abbreviations = {
"en": [
@ -564,14 +563,6 @@ def expand_numbers_multilingual(text, lang="en"):
return text
def lowercase(text):
return text.lower()
def collapse_whitespace(text):
return re.sub(_whitespace_re, " ", text)
def multilingual_cleaners(text, lang):
text = text.replace('"', "")
if lang == "tr":
@ -586,13 +577,6 @@ def multilingual_cleaners(text, lang):
return text
def basic_cleaners(text):
"""Basic pipeline that lowercases and collapses whitespace without transliteration."""
text = lowercase(text)
text = collapse_whitespace(text)
return text
def chinese_transliterate(text):
try:
import pypinyin