From d495e4581f218435fa4117c11d23baef478d7932 Mon Sep 17 00:00:00 2001 From: Edresson Casanova Date: Thu, 21 Apr 2022 16:57:36 -0300 Subject: [PATCH] Add docs for VITS upsampling --- TTS/tts/models/vits.py | 12 ++++++++++++ 1 file changed, 12 insertions(+) diff --git a/TTS/tts/models/vits.py b/TTS/tts/models/vits.py index 6251d3ff..31d057cd 100644 --- a/TTS/tts/models/vits.py +++ b/TTS/tts/models/vits.py @@ -454,6 +454,18 @@ class VitsArgs(Coqpit): freeze_waveform_decoder (bool): Freeze the waveform decoder weigths during training. Defaults to False. + + TTS_part_sample_rate (int): + If not None this sample rate will be used for training the Posterior Encoder, + flow, text_encoder and duration predictor. The decoder part (vocoder) will be + trained with the `config.audio.audio.sample_rate`. Defaults to None. + + interpolate_z (bool): + If `TTS_part_sample_rate` not None and this parameter True the nearest interpolation + will be used to upsampling the latent variable z with the sampling rate `TTS_part_sample_rate` + to the `config.audio.audio.sample_rate`. If it is False you will need to add extra + `upsample_rates_decoder` to match the shape. Defaults to True. + """ num_chars: int = 100