diff --git a/egs/gigaspeech/ASR/local/compute_fbank_gigaspeech_splits.py b/egs/gigaspeech/ASR/local/compute_fbank_gigaspeech_splits.py index 429168e5c..6e7241cc5 100755 --- a/egs/gigaspeech/ASR/local/compute_fbank_gigaspeech_splits.py +++ b/egs/gigaspeech/ASR/local/compute_fbank_gigaspeech_splits.py @@ -27,6 +27,7 @@ from lhotse import ( CutSet, KaldifeatFbank, KaldifeatFbankConfig, + set_audio_duration_mismatch_tolerance, ) # Torch's multithreaded behavior needs to be disabled or @@ -100,6 +101,8 @@ def compute_fbank_gigaspeech_splits(args): extractor = KaldifeatFbank(KaldifeatFbankConfig(device=device)) logging.info(f"device: {device}") + set_audio_duration_mismatch_tolerance(0.01) # 10ms tolerance + for i in range(start, stop): idx = f"{i + 1}".zfill(num_digits) logging.info(f"Processing {idx}/{num_splits}")