From c59b3f75b8c5b5e2f5588c7cdc0bc8958928e6ac Mon Sep 17 00:00:00 2001 From: Gerard Sant Muniesa <90964413+GerrySant@users.noreply.github.com> Date: Mon, 23 Jan 2023 11:56:30 +0100 Subject: [PATCH] Add Catalan text cleaners for Catalan support (#2295) --- TTS/tts/utils/text/cleaners.py | 22 +++++++++++++++++++++- 1 file changed, 21 insertions(+), 1 deletion(-) diff --git a/TTS/tts/utils/text/cleaners.py b/TTS/tts/utils/text/cleaners.py index f02f8fb4..a9261ecb 100644 --- a/TTS/tts/utils/text/cleaners.py +++ b/TTS/tts/utils/text/cleaners.py @@ -44,8 +44,25 @@ def remove_aux_symbols(text): def replace_symbols(text, lang="en"): + """Replace symbols based on the language tag. + + Args: + text: + Input text. + lang: + Language identifier. ex: "en", "fr", "pt", "ca". + + Returns: + The modified text + example: + input args: + text: "si l'avi cau, diguem-ho" + lang: "ca" + Output: + text: "si lavi cau, diguemho" + """ text = text.replace(";", ",") - text = text.replace("-", " ") + text = text.replace("-", " ") if lang != "ca" else text.replace("-", "") text = text.replace(":", ",") if lang == "en": text = text.replace("&", " and ") @@ -53,6 +70,9 @@ def replace_symbols(text, lang="en"): text = text.replace("&", " et ") elif lang == "pt": text = text.replace("&", " e ") + elif lang == "ca": + text = text.replace("&", " i ") + text = text.replace("'", "") return text