mirror of https://github.com/coqui-ai/TTS.git
Make style
This commit is contained in:
parent
46940cb64b
commit
b702b39b52
|
@ -252,7 +252,12 @@ class BaseTacotron(BaseTTS):
|
||||||
|
|
||||||
def compute_capacitron_VAE_embedding(self, inputs, reference_mel_info, text_info=None, speaker_embedding=None):
|
def compute_capacitron_VAE_embedding(self, inputs, reference_mel_info, text_info=None, speaker_embedding=None):
|
||||||
"""Capacitron Variational Autoencoder"""
|
"""Capacitron Variational Autoencoder"""
|
||||||
(VAE_outputs, posterior_distribution, prior_distribution, capacitron_beta,) = self.capacitron_vae_layer(
|
(
|
||||||
|
VAE_outputs,
|
||||||
|
posterior_distribution,
|
||||||
|
prior_distribution,
|
||||||
|
capacitron_beta,
|
||||||
|
) = self.capacitron_vae_layer(
|
||||||
reference_mel_info,
|
reference_mel_info,
|
||||||
text_info,
|
text_info,
|
||||||
speaker_embedding, # pylint: disable=not-callable
|
speaker_embedding, # pylint: disable=not-callable
|
||||||
|
|
|
@ -676,7 +676,12 @@ class Tortoise(BaseTTS):
|
||||||
), "Too much text provided. Break the text up into separate segments and re-try inference."
|
), "Too much text provided. Break the text up into separate segments and re-try inference."
|
||||||
|
|
||||||
if voice_samples is not None:
|
if voice_samples is not None:
|
||||||
(auto_conditioning, diffusion_conditioning, _, _,) = self.get_conditioning_latents(
|
(
|
||||||
|
auto_conditioning,
|
||||||
|
diffusion_conditioning,
|
||||||
|
_,
|
||||||
|
_,
|
||||||
|
) = self.get_conditioning_latents(
|
||||||
voice_samples,
|
voice_samples,
|
||||||
return_mels=True,
|
return_mels=True,
|
||||||
latent_averaging_mode=latent_averaging_mode,
|
latent_averaging_mode=latent_averaging_mode,
|
||||||
|
|
|
@ -97,9 +97,7 @@ def main():
|
||||||
use_ne_hifigan=True, # if it is true it will keep the non-enhanced keys on the output checkpoint
|
use_ne_hifigan=True, # if it is true it will keep the non-enhanced keys on the output checkpoint
|
||||||
)
|
)
|
||||||
# define audio config
|
# define audio config
|
||||||
audio_config = XttsAudioConfig(
|
audio_config = XttsAudioConfig(sample_rate=22050, dvae_sample_rate=22050, output_sample_rate=24000)
|
||||||
sample_rate=22050, dvae_sample_rate=22050, output_sample_rate=24000
|
|
||||||
)
|
|
||||||
# training parameters config
|
# training parameters config
|
||||||
config = GPTTrainerConfig(
|
config = GPTTrainerConfig(
|
||||||
output_path=OUT_PATH,
|
output_path=OUT_PATH,
|
||||||
|
|
|
@ -98,9 +98,7 @@ def main():
|
||||||
gpt_use_perceiver_resampler=True,
|
gpt_use_perceiver_resampler=True,
|
||||||
)
|
)
|
||||||
# define audio config
|
# define audio config
|
||||||
audio_config = XttsAudioConfig(
|
audio_config = XttsAudioConfig(sample_rate=22050, dvae_sample_rate=22050, output_sample_rate=24000)
|
||||||
sample_rate=22050, dvae_sample_rate=22050, output_sample_rate=24000
|
|
||||||
)
|
|
||||||
# training parameters config
|
# training parameters config
|
||||||
config = GPTTrainerConfig(
|
config = GPTTrainerConfig(
|
||||||
output_path=OUT_PATH,
|
output_path=OUT_PATH,
|
||||||
|
|
|
@ -88,9 +88,7 @@ model_args = GPTArgs(
|
||||||
gpt_stop_audio_token=8193,
|
gpt_stop_audio_token=8193,
|
||||||
use_ne_hifigan=True,
|
use_ne_hifigan=True,
|
||||||
)
|
)
|
||||||
audio_config = XttsAudioConfig(
|
audio_config = XttsAudioConfig(sample_rate=22050, dvae_sample_rate=22050, output_sample_rate=24000)
|
||||||
sample_rate=22050, dvae_sample_rate=22050, output_sample_rate=24000
|
|
||||||
)
|
|
||||||
config = GPTTrainerConfig(
|
config = GPTTrainerConfig(
|
||||||
epochs=1,
|
epochs=1,
|
||||||
output_path=OUT_PATH,
|
output_path=OUT_PATH,
|
||||||
|
|
|
@ -88,9 +88,7 @@ model_args = GPTArgs(
|
||||||
gpt_use_perceiver_resampler=True,
|
gpt_use_perceiver_resampler=True,
|
||||||
use_ne_hifigan=True,
|
use_ne_hifigan=True,
|
||||||
)
|
)
|
||||||
audio_config = XttsAudioConfig(
|
audio_config = XttsAudioConfig(sample_rate=22050, dvae_sample_rate=22050, output_sample_rate=24000)
|
||||||
sample_rate=22050, dvae_sample_rate=22050, output_sample_rate=24000
|
|
||||||
)
|
|
||||||
config = GPTTrainerConfig(
|
config = GPTTrainerConfig(
|
||||||
epochs=1,
|
epochs=1,
|
||||||
output_path=OUT_PATH,
|
output_path=OUT_PATH,
|
||||||
|
|
Loading…
Reference in New Issue