diff --git a/egs/mdcc/ASR/local/preprocess_mdcc.py b/egs/mdcc/ASR/local/preprocess_mdcc.py index f068425e7..86efd1f57 100755 --- a/egs/mdcc/ASR/local/preprocess_mdcc.py +++ b/egs/mdcc/ASR/local/preprocess_mdcc.py @@ -92,6 +92,8 @@ def get_word_segments(lines: List[str]) -> List[str]: if len(line.strip().split(" ")) > 1: segments = [] for segment in line.strip().split(" "): + if segment.strip() == "": + continue try: if not is_cjk(segment[0]): # en segment segments.append(segment)