From c19891ee8e1c5b699e214a1910da32b889c3e31e Mon Sep 17 00:00:00 2001 From: Yuekai Zhang Date: Fri, 26 Jan 2024 10:23:26 +0800 Subject: [PATCH] add remove long short --- egs/wenetspeech/ASR/whisper/train.py | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/egs/wenetspeech/ASR/whisper/train.py b/egs/wenetspeech/ASR/whisper/train.py index 8e55200e1..2316a3c3b 100644 --- a/egs/wenetspeech/ASR/whisper/train.py +++ b/egs/wenetspeech/ASR/whisper/train.py @@ -834,8 +834,9 @@ def run(rank, world_size, args): # ) return False return True - - train_dl = wenetspeech.train_dataloaders(wenetspeech.train_cuts(remove_short_and_long_utt)) + train_cuts = wenetspeech.train_cuts() + train_cuts = train_cuts.filter(remove_short_and_long_utt) + train_dl = wenetspeech.train_dataloaders(train_cuts) valid_dl = wenetspeech.valid_dataloaders(wenetspeech.valid_cuts()) scaler = GradScaler(enabled=params.use_fp16, init_scale=1.0)