mirror of https://github.com/coqui-ai/TTS.git
add ```unique``` param to keep scglow models compatible (there are duplicate symbols in the character set)
This commit is contained in:
parent
d9612a4351
commit
d2fa8add1f
|
@ -8,16 +8,17 @@ through Unidecode. For other data, you can modify _characters. See TRAINING_DATA
|
|||
|
||||
|
||||
def make_symbols(
|
||||
characters, phonemes=None, punctuations="!'(),-.:;? ", pad="_", eos="~", bos="^"
|
||||
characters, phonemes=None, punctuations="!'(),-.:;? ", pad="_", eos="~", bos="^", unique=True,
|
||||
): # pylint: disable=redefined-outer-name
|
||||
""" Function to create symbols and phonemes """
|
||||
""" Function to create symbols and phonemes
|
||||
TODO: create phonemes_to_id and symbols_to_id dicts here."""
|
||||
_symbols = list(characters)
|
||||
_symbols = [bos] + _symbols if len(bos) > 0 and bos is not None else _symbols
|
||||
_symbols = [eos] + _symbols if len(bos) > 0 and eos is not None else _symbols
|
||||
_symbols = [pad] + _symbols if len(bos) > 0 and pad is not None else _symbols
|
||||
_phonemes = None
|
||||
if phonemes is not None:
|
||||
_phonemes_sorted = sorted(list(set(phonemes)))
|
||||
_phonemes_sorted = sorted(list(set(phonemes))) if unique else sorted(list(phonemes)) # this is to keep previous models compatible.
|
||||
# Prepend "@" to ARPAbet symbols to ensure uniqueness (some are the same as uppercase letters):
|
||||
_arpabet = ["@" + s for s in _phonemes_sorted]
|
||||
# Export all symbols:
|
||||
|
|
Loading…
Reference in New Issue