Fix bug in streaming_conformer_ctc egs (#862)

* Update train.py: fix the transducer LSTM egs bug mentioned in issue #579
* Update train.py: fix the dataloader bug
2025-08-09 10:02:22 +00:00 · 2023-01-31 15:19:50 +08:00 · 2023-01-31 15:19:50 +08:00 · e9019511eb
commit e9019511eb
parent e277e31e37
1 changed files with 18 additions and 3 deletions
--- a/egs/librispeech/ASR/streaming_conformer_ctc/train.py
+++ b/egs/librispeech/ASR/streaming_conformer_ctc/train.py
@@ -50,7 +50,7 @@ from icefall.utils import (
    setup_logger,
    str2bool,
 )
-
+from lhotse.cut import Cut

 def get_parser():
    parser = argparse.ArgumentParser(
@@ -645,8 +645,23 @@ def run(rank, world_size, args):
        optimizer.load_state_dict(checkpoints["optimizer"])

    librispeech = LibriSpeechAsrDataModule(args)
-    train_dl = librispeech.train_dataloaders()
-    valid_dl = librispeech.valid_dataloaders()
+
+    if params.full_libri:
+        train_cuts = librispeech.train_all_shuf_cuts()
+    else:
+        train_cuts = librispeech.train_clean_100_cuts()
+
+    def remove_short_and_long_utt(c: Cut):
+        # Keep only utterances with duration between 1 second and 20 seconds
+        return 1.0 <= c.duration <= 20.0
+
+    train_cuts = train_cuts.filter(remove_short_and_long_utt)
+
+    train_dl = librispeech.train_dataloaders(train_cuts)
+
+    valid_cuts = librispeech.dev_clean_cuts()
+    valid_cuts += librispeech.dev_other_cuts()
+    valid_dl = librispeech.valid_dataloaders(valid_cuts)

    scan_pessimistic_batches_for_oom(
        model=model,