Merge pull request #4 from eginhard/fix-is-multilingual

fix(api): handle missing attribute in is_multi_lingual
This commit is contained in:
Enno Hermann 2024-03-07 07:59:02 +01:00 committed by GitHub
commit 7f83dea000
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
2 changed files with 5 additions and 4 deletions

View File

@ -97,7 +97,7 @@ class TTS(nn.Module):
isinstance(self.model_name, str)
and "xtts" in self.model_name
or self.config
and ("xtts" in self.config.model or len(self.config.languages) > 1)
and ("xtts" in self.config.model or "languages" in self.config and len(self.config.languages) > 1)
):
return True
if hasattr(self.synthesizer.tts_model, "language_manager") and self.synthesizer.tts_model.language_manager:

View File

@ -4,6 +4,7 @@ import os
import random
from typing import Dict, List, Union
import mutagen
import numpy as np
import torch
import tqdm
@ -13,8 +14,6 @@ from TTS.tts.utils.data import prepare_data, prepare_stop_target, prepare_tensor
from TTS.utils.audio import AudioProcessor
from TTS.utils.audio.numpy_transforms import compute_energy as calculate_energy
import mutagen
# to prevent too many open files error as suggested here
# https://github.com/pytorch/pytorch/issues/11201#issuecomment-421146936
torch.multiprocessing.set_sharing_strategy("file_system")
@ -47,7 +46,9 @@ def string2filename(string):
def get_audio_size(audiopath):
    """Return the length of an audio file in samples, based on its metadata.

    The value is the duration reported by ``mutagen`` multiplied by the
    reported sample rate.

    Args:
        audiopath (str): Path to the audio file. The format is taken from the
            text after the last "." in the path (case-insensitive).

    Returns:
        int: ``length * sample_rate``, truncated to an integer.

    Raises:
        RuntimeError: If the extension is not mp3, wav, or flac, or if mutagen
            cannot identify the file.
    """
    extension = audiopath.rpartition(".")[-1].lower()
    if extension not in {"mp3", "wav", "flac"}:
        raise RuntimeError(
            f"The audio format {extension} is not supported, please convert the audio files to mp3, flac, or wav format!"
        )

    # mutagen.File returns None (rather than raising) when it cannot determine
    # the file type, e.g. for a corrupt or mislabeled file. Fail with a clear
    # message instead of an AttributeError on `None.info`.
    audio_file = mutagen.File(audiopath)
    if audio_file is None:
        raise RuntimeError(f"Could not read audio metadata from {audiopath}, the file may be corrupt or mislabeled!")

    audio_info = audio_file.info
    return int(audio_info.length * audio_info.sample_rate)