diff --git a/egs/vctk/TTS/vits/train.py b/egs/vctk/TTS/vits/train.py index 300b9a8a1..9b2f2b246 100755 --- a/egs/vctk/TTS/vits/train.py +++ b/egs/vctk/TTS/vits/train.py @@ -342,7 +342,7 @@ def prepare_input( torch.Tensor([speaker_map[sid] for sid in batch["speakers"]]).int().to(device) ) - tokens = tokenizer.texts_to_token_ids( + tokens = tokenizer.tokens_to_token_ids( tokens, intersperse_blank=True, add_sos=True, add_eos=True ) tokens = k2.RaggedTensor(tokens)