mirror of https://github.com/coqui-ai/TTS.git
interpolate spectrogram in vocoder generic utils for matching sample
rates
This commit is contained in:
parent
ca3743539a
commit
5bd7238153
|
@ -7,6 +7,29 @@ from matplotlib import pyplot as plt
|
||||||
from TTS.tts.utils.visual import plot_spectrogram
|
from TTS.tts.utils.visual import plot_spectrogram
|
||||||
|
|
||||||
|
|
||||||
|
def interpolate_vocoder_input(scale_factor, spec):
    """Interpolate a spectrogram by the given scale factor.

    It is mainly used to match the sampling rates of the tts and
    vocoder models.

    Args:
        scale_factor (float or sequence of 2 floats): scale factor passed to
            ``torch.nn.functional.interpolate``. A sequence gives one factor
            per axis of ``spec``; a single float rescales BOTH axes.
        spec (np.array or torch.Tensor): 2D spectrogram to be interpolated.
            Non floating-point inputs are converted to float32 because
            bilinear interpolation is only defined for floating dtypes.

    Returns:
        torch.Tensor: interpolated spectrogram with a leading dimension of
            size 1, i.e. shape ``[1, new_dim0, new_dim1]``.
    """
    print(" > before interpolation :", spec.shape)
    if isinstance(spec, torch.Tensor):
        # Same result as torch.tensor(spec) but without the copy-construct
        # UserWarning that torch emits for tensor inputs.
        spec = spec.detach().clone()
    else:
        spec = torch.tensor(spec)
    if not spec.is_floating_point():
        # Integer/bool spectrograms would make bilinear interpolation raise.
        spec = spec.float()
    # Bilinear mode expects a 4D [batch, channel, dim0, dim1] input.
    spec = spec.unsqueeze(0).unsqueeze(0)
    spec = torch.nn.functional.interpolate(
        spec,
        scale_factor=scale_factor,
        recompute_scale_factor=True,
        mode='bilinear',
        align_corners=False,
    )
    # Drop only the batch dimension; the channel dimension of size 1 is kept.
    spec = spec.squeeze(0)
    print(" > after interpolation :", spec.shape)
    return spec
|
||||||
|
|
||||||
|
|
||||||
def plot_results(y_hat, y, ap, global_step, name_prefix):
|
def plot_results(y_hat, y, ap, global_step, name_prefix):
|
||||||
""" Plot vocoder model results """
|
""" Plot vocoder model results """
|
||||||
|
|
||||||
|
|
Loading…
Reference in New Issue