Set audio duration mismatch tolerance to 0.01 s (10 ms)

This commit is contained in:
wgb14 2021-12-01 17:49:46 -05:00
parent b8beb00ecc
commit 64bd3f7df4

View File

@@ -27,6 +27,7 @@ from lhotse import (
CutSet, CutSet,
KaldifeatFbank, KaldifeatFbank,
KaldifeatFbankConfig, KaldifeatFbankConfig,
set_audio_duration_mismatch_tolerance,
) )
# Torch's multithreaded behavior needs to be disabled or # Torch's multithreaded behavior needs to be disabled or
@@ -100,6 +101,8 @@ def compute_fbank_gigaspeech_splits(args):
extractor = KaldifeatFbank(KaldifeatFbankConfig(device=device)) extractor = KaldifeatFbank(KaldifeatFbankConfig(device=device))
logging.info(f"device: {device}") logging.info(f"device: {device}")
set_audio_duration_mismatch_tolerance(0.01) # 10ms tolerance
for i in range(start, stop): for i in range(start, stop):
idx = f"{i + 1}".zfill(num_digits) idx = f"{i + 1}".zfill(num_digits)
logging.info(f"Processing {idx}/{num_splits}") logging.info(f"Processing {idx}/{num_splits}")