diff --git a/egs/multi_zh-hans/ASR/local/preprocess_kespeech.py b/egs/multi_zh-hans/ASR/local/preprocess_kespeech.py index af689c9d1..6f29aff4a 100644 --- a/egs/multi_zh-hans/ASR/local/preprocess_kespeech.py +++ b/egs/multi_zh-hans/ASR/local/preprocess_kespeech.py @@ -40,7 +40,7 @@ def normalize_text( def has_no_oov( sup: SupervisionSegment, - oov_pattern=re.compile(r"<(SIL|MUSIC|NOISE|OTHER)>"), + oov_pattern=re.compile(r"<(SIL|MUSIC|NOISE|OTHER|SPOKEN_NOISE)>"), ) -> bool: return oov_pattern.search(sup.text) is None