cached_property for cutlet

2023-11-07 15:12:52 +01:00 · 2023-11-07 15:12:52 +01:00 · 8487e37376
parent 9dd31038f6
commit 8487e37376
1 changed file with 7 additions and 5 deletions
--- a/TTS/tts/layers/xtts/tokenizer.py
+++ b/TTS/tts/layers/xtts/tokenizer.py
@ -8,6 +8,7 @@ from hangul_romanize import Transliter
 import functools
 from hangul_romanize.rule import academic
 from num2words import num2words
 from tokenizers import Tokenizer
 # NOTE(review): yarl is a URL library and this is not functools.cached_property -- confirm whether anything still needs this name.
 from yarl import cached_property
 from TTS.tts.layers.xtts.zh_num2words import TextNorm as zh_num2words
@ -535,7 +536,6 @@ DEFAULT_VOCAB_FILE = os.path.join(os.path.dirname(os.path.realpath(__file__)), "
 class VoiceBpeTokenizer:
    def __init__(self, vocab_file=None):
        self.tokenizer = None
        self.katsu = None
        if vocab_file is not None:
            self.tokenizer = Tokenizer.from_file(vocab_file)
        self.char_limits = {
@ -557,6 +557,11 @@ class VoiceBpeTokenizer:
            "ko": 95,
        }
    @functools.cached_property
    def katsu(self):
        """Return the ``cutlet.Cutlet`` instance for this tokenizer, built on first access.

        The ``cutlet`` package is imported inside the property so that it is
        only needed when the attribute is actually read; within this class it
        is handed to ``japanese_cleaners`` when the language is ``"ja"``.

        The standard-library ``functools.cached_property`` is used on purpose:
        it stores the computed value in the instance ``__dict__``, so it works
        on a plain class and the ``Cutlet`` object is reused on later reads
        instead of being rebuilt.

        Returns:
            cutlet.Cutlet: a converter constructed with cutlet's defaults.

        Raises:
            ImportError: if the ``cutlet`` package is not installed.
        """
        import cutlet

        return cutlet.Cutlet()
    def check_input_length(self, txt, lang):
        limit = self.char_limits.get(lang, 250)
        if len(txt) > limit:
@ -568,9 +573,6 @@ class VoiceBpeTokenizer:
            if lang == "zh-cn":
                txt = chinese_transliterate(txt)
        elif lang == "ja":                
            if self.katsu is None:
                import cutlet
                self.katsu = cutlet.Cutlet()
            txt = japanese_cleaners(txt, self.katsu)
        else:
            raise NotImplementedError()