Update preprocess_gigaspeech2.py

This commit is contained in:
Yifan Yang 2024-04-02 15:49:03 +08:00 committed by GitHub
parent aa17542e9e
commit f5b8d5dad2
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -75,12 +75,12 @@ def normalize_text(
text = re.sub(r"\u00B0", "องศา", text) # °
# Remove blank symbols
-text = re.sub(r"\s", "", utt)
+text = re.sub(r"\s", "", text)
else:
text = re.sub(r"\s+", " ", text).strip()
-return utt
+return text
def preprocess_gigaspeech2(args):