Update VITS LJSpeech recipe

This commit is contained in:
Eren Gölge 2022-05-03 13:43:40 +02:00 committed by Eren G??lge
parent 0ef6bf2c28
commit 463d6f1b22
1 changed files with 5 additions and 13 deletions

View File

@ -2,11 +2,10 @@ import os
from trainer import Trainer, TrainerArgs
from TTS.config.shared_configs import BaseAudioConfig
from TTS.tts.configs.shared_configs import BaseDatasetConfig
from TTS.tts.configs.vits_config import VitsConfig
from TTS.tts.datasets import load_tts_samples
from TTS.tts.models.vits import Vits
from TTS.tts.models.vits import Vits, VitsAudioConfig
from TTS.tts.utils.text.tokenizer import TTSTokenizer
from TTS.utils.audio import AudioProcessor
@ -14,21 +13,13 @@ output_path = os.path.dirname(os.path.abspath(__file__))
dataset_config = BaseDatasetConfig(
name="ljspeech", meta_file_train="metadata.csv", path=os.path.join(output_path, "../LJSpeech-1.1/")
)
audio_config = BaseAudioConfig(
audio_config = VitsAudioConfig(
sample_rate=22050,
win_length=1024,
hop_length=256,
num_mels=80,
preemphasis=0.0,
ref_level_db=20,
log_func="np.log",
do_trim_silence=True,
trim_db=45,
mel_fmin=0,
mel_fmax=None,
spec_gain=1.0,
signal_norm=False,
do_amp_to_db_linear=False,
mel_fmax=None
)
config = VitsConfig(
@ -37,7 +28,7 @@ config = VitsConfig(
batch_size=32,
eval_batch_size=16,
batch_group_size=5,
num_loader_workers=0,
num_loader_workers=8,
num_eval_loader_workers=4,
run_eval=True,
test_delay_epochs=-1,
@ -52,6 +43,7 @@ config = VitsConfig(
mixed_precision=True,
output_path=output_path,
datasets=[dataset_config],
cudnn_benchmark=False
)
# INITIALIZE THE AUDIO PROCESSOR