diff --git a/egs/bengaliai_speech/ASR/local/preprocess_bengaliai_speech.py b/egs/bengaliai_speech/ASR/local/preprocess_bengaliai_speech.py index fbcfa3ce5..1d3cd5772 100755 --- a/egs/bengaliai_speech/ASR/local/preprocess_bengaliai_speech.py +++ b/egs/bengaliai_speech/ASR/local/preprocess_bengaliai_speech.py @@ -38,7 +38,7 @@ def get_args(): def normalize_text(utt: str) -> str: - punc = '~`!#$%^&*()_+-=|\';":/.,?><~·!@#¥%……&*()——+-=“:’;、。,?》《{}' + punc = "~`!#$%^&*()_+-=|';\":/.,?><~·!@#¥%……&*()——+-=“:’;、。,?》《{}" return re.sub(r"[{0}]+".format(punc), "", utt).upper()