set use_phonemes false

This commit is contained in:
Eren Gölge 2021-05-19 01:27:26 +02:00
parent faedea4b60
commit 8a7c40736c
8 changed files with 17 additions and 15 deletions

View File

@ -25,7 +25,7 @@ class MyDataset(Dataset):
batch_group_size=0, batch_group_size=0,
min_seq_len=0, min_seq_len=0,
max_seq_len=float("inf"), max_seq_len=float("inf"),
use_phonemes=True, use_phonemes=False,
phoneme_cache_path=None, phoneme_cache_path=None,
phoneme_language="en-us", phoneme_language="en-us",
enable_eos_bos=False, enable_eos_bos=False,

View File

@ -4,8 +4,8 @@ import re
from packaging import version from packaging import version
from TTS.tts.utils.text.chinese_mandarin.phonemizer import chinese_text_to_phonemes
from TTS.tts.utils.text import cleaners from TTS.tts.utils.text import cleaners
from TTS.tts.utils.text.chinese_mandarin.phonemizer import chinese_text_to_phonemes
from TTS.tts.utils.text.symbols import _bos, _eos, _punctuations, make_symbols, phonemes, symbols from TTS.tts.utils.text.symbols import _bos, _eos, _punctuations, make_symbols, phonemes, symbols
# pylint: disable=unnecessary-comprehension # pylint: disable=unnecessary-comprehension
@ -27,12 +27,12 @@ PHONEME_PUNCTUATION_PATTERN = r"[" + _punctuations.replace(" ", "") + "]+"
def text2phone(text, language): def text2phone(text, language):
"""Convert graphemes to phonemes. """Convert graphemes to phonemes.
Parameters: Parameters:
text (str): text to phonemize text (str): text to phonemize
language (str): language of the text language (str): language of the text
Returns: Returns:
ph (str): phonemes as a string separated by "|" ph (str): phonemes as a string separated by "|"
ph = "ɪ|g|ˈ|z|æ|m|p|ə|l" ph = "ɪ|g|ˈ|z|æ|m|p|ə|l"
""" """
# TO REVIEW : How to have a good implementation for this? # TO REVIEW : How to have a good implementation for this?

View File

@ -102,8 +102,10 @@ class ModelManager(object):
output_model_path = os.path.join(output_path, "model_file.pth.tar") output_model_path = os.path.join(output_path, "model_file.pth.tar")
output_config_path = os.path.join(output_path, "config.json") output_config_path = os.path.join(output_path, "config.json")
# NOTE : band-aid for removing phoneme support # NOTE : band-aid for removing phoneme support
if 'needs_phonemizer' in model_item and model_item['needs_phonemizer']: if "needs_phonemizer" in model_item and model_item["needs_phonemizer"]:
raise RuntimeError(' [!] Use 🐸TTS <= v0.0.13 for this model. Current version does not support phoneme based models.') raise RuntimeError(
" [!] Use 🐸TTS <= v0.0.13 for this model. Current version does not support phoneme based models."
)
if os.path.exists(output_path): if os.path.exists(output_path):
print(f" > {model_name} is already downloaded.") print(f" > {model_name} is already downloaded.")
else: else:

View File

@ -15,7 +15,7 @@ config = AlignTTSConfig(
num_loader_workers=0, num_loader_workers=0,
num_val_loader_workers=0, num_val_loader_workers=0,
text_cleaner="english_cleaners", text_cleaner="english_cleaners",
use_phonemes=True, use_phonemes=False,
phoneme_language="en-us", phoneme_language="en-us",
phoneme_cache_path=os.path.join(get_tests_output_path(), "train_outputs/phoneme_cache/"), phoneme_cache_path=os.path.join(get_tests_output_path(), "train_outputs/phoneme_cache/"),
run_eval=True, run_eval=True,

View File

@ -15,7 +15,7 @@ config = GlowTTSConfig(
num_loader_workers=0, num_loader_workers=0,
num_val_loader_workers=0, num_val_loader_workers=0,
text_cleaner="english_cleaners", text_cleaner="english_cleaners",
use_phonemes=True, use_phonemes=False,
phoneme_language="en-us", phoneme_language="en-us",
phoneme_cache_path=os.path.join(get_tests_output_path(), "train_outputs/phoneme_cache/"), phoneme_cache_path=os.path.join(get_tests_output_path(), "train_outputs/phoneme_cache/"),
run_eval=True, run_eval=True,

View File

@ -15,7 +15,7 @@ config = SpeedySpeechConfig(
num_loader_workers=0, num_loader_workers=0,
num_val_loader_workers=0, num_val_loader_workers=0,
text_cleaner="english_cleaners", text_cleaner="english_cleaners",
use_phonemes=True, use_phonemes=False,
phoneme_language="en-us", phoneme_language="en-us",
phoneme_cache_path=os.path.join(get_tests_output_path(), "train_outputs/phoneme_cache/"), phoneme_cache_path=os.path.join(get_tests_output_path(), "train_outputs/phoneme_cache/"),
run_eval=True, run_eval=True,

View File

@ -16,7 +16,7 @@ config = Tacotron2Config(
num_loader_workers=0, num_loader_workers=0,
num_val_loader_workers=0, num_val_loader_workers=0,
text_cleaner="english_cleaners", text_cleaner="english_cleaners",
use_phonemes=True, use_phonemes=False,
phoneme_language="en-us", phoneme_language="en-us",
phoneme_cache_path=os.path.join(get_tests_output_path(), "train_outputs/phoneme_cache/"), phoneme_cache_path=os.path.join(get_tests_output_path(), "train_outputs/phoneme_cache/"),
run_eval=True, run_eval=True,

View File

@ -15,7 +15,7 @@ config = TacotronConfig(
num_loader_workers=0, num_loader_workers=0,
num_val_loader_workers=0, num_val_loader_workers=0,
text_cleaner="english_cleaners", text_cleaner="english_cleaners",
use_phonemes=True, use_phonemes=False,
phoneme_language="en-us", phoneme_language="en-us",
phoneme_cache_path=os.path.join(get_tests_output_path(), "train_outputs/phoneme_cache/"), phoneme_cache_path=os.path.join(get_tests_output_path(), "train_outputs/phoneme_cache/"),
run_eval=True, run_eval=True,