From 64bd3f7df4762484d3b996c80a7f8b1e71fd2ba1 Mon Sep 17 00:00:00 2001 From: wgb14 Date: Wed, 1 Dec 2021 17:49:46 -0500 Subject: [PATCH] set audio duration mismatch tolerance to 0.01 --- egs/gigaspeech/ASR/local/compute_fbank_gigaspeech_splits.py | 3 +++ 1 file changed, 3 insertions(+) diff --git a/egs/gigaspeech/ASR/local/compute_fbank_gigaspeech_splits.py b/egs/gigaspeech/ASR/local/compute_fbank_gigaspeech_splits.py index 429168e5c..6e7241cc5 100755 --- a/egs/gigaspeech/ASR/local/compute_fbank_gigaspeech_splits.py +++ b/egs/gigaspeech/ASR/local/compute_fbank_gigaspeech_splits.py @@ -27,6 +27,7 @@ from lhotse import ( CutSet, KaldifeatFbank, KaldifeatFbankConfig, + set_audio_duration_mismatch_tolerance, ) # Torch's multithreaded behavior needs to be disabled or @@ -100,6 +101,8 @@ def compute_fbank_gigaspeech_splits(args): extractor = KaldifeatFbank(KaldifeatFbankConfig(device=device)) logging.info(f"device: {device}") + set_audio_duration_mismatch_tolerance(0.01) # 10ms tolerance + for i in range(start, stop): idx = f"{i + 1}".zfill(num_digits) logging.info(f"Processing {idx}/{num_splits}")