mirror of
https://github.com/k2-fsa/icefall.git
synced 2025-08-08 09:32:20 +00:00
Update preprocess_commonvoice.py to fix text normalization bug. (#1181)
This commit is contained in:
parent
1dbbd7759e
commit
80d922c158
@ -45,7 +45,7 @@ def get_args():
|
||||
|
||||
def normalize_text(utt: str) -> str:
    """Normalize a transcript to upper-case letters, whitespace and apostrophes.

    Each run of hyphens is replaced by a single space, so hyphenated
    compounds split into separate words. Every character that is not an
    ASCII letter, whitespace, or an apostrophe is then removed, and the
    result is upper-cased.

    Apostrophes are kept on purpose so that contractions ("don't", "it's")
    survive normalization. Whitespace is not collapsed, so removing a token
    such as a digit can leave consecutive spaces behind.

    Args:
        utt: Raw transcript text.

    Returns:
        The normalized, upper-cased transcript.
    """
    # Hyphens become word separators rather than being deleted outright.
    utt = re.sub(r"-+", " ", utt)
    # Keep the apostrophe in the allowed set; dropping it mangles contractions.
    return re.sub(r"[^a-zA-Z\s']", "", utt).upper()
|
||||
|
||||
|
||||
def preprocess_commonvoice(
|
||||
|
Loading…
x
Reference in New Issue
Block a user