diff --git a/egs/baker_zh/TTS/matcha/export_onnx.py b/egs/baker_zh/TTS/matcha/export_onnx.py index 6133cc4db..6e4e6c237 100755 --- a/egs/baker_zh/TTS/matcha/export_onnx.py +++ b/egs/baker_zh/TTS/matcha/export_onnx.py @@ -5,6 +5,13 @@ This script exports a Matcha-TTS model to ONNX. Note that the model outputs fbank. You need to use a vocoder to convert it to audio. See also ./export_onnx_hifigan.py + +python3 ./matcha/export_onnx.py \ + --exp-dir ./matcha/exp-1 \ + --epoch 2000 \ + --tokens ./data/tokens.txt \ + --cmvn ./data/fbank/cmvn.json + """ import argparse diff --git a/egs/baker_zh/TTS/matcha/onnx_pretrained.py b/egs/baker_zh/TTS/matcha/onnx_pretrained.py index 615a3a0c8..9711fe052 100755 --- a/egs/baker_zh/TTS/matcha/onnx_pretrained.py +++ b/egs/baker_zh/TTS/matcha/onnx_pretrained.py @@ -1,6 +1,16 @@ #!/usr/bin/env python3 # Copyright 2024 Xiaomi Corp. (authors: Fangjun Kuang) +""" +python3 ./matcha/onnx_pretrained.py \ + --acoustic-model ./model-steps-4.onnx \ + --vocoder ./hifigan_v2.onnx \ + --tokens ./data/tokens.txt \ + --lexicon ./lexicon.txt \ + --input-text "当夜幕降临,星光点点,伴随着微风拂面,我在静谧中感受着时光的流转,思念如涟漪荡漾,梦境如画卷展开,我与自然融为一体,沉静在这片宁静的美丽之中,感受着生命的奇迹与温柔。" \ + --output-wav ./b.wav +""" + import argparse import datetime as dt import re