Update train.py (#773)

Fix transducer lstm egs bug as mentioned in issue 579
2025-12-11 06:55:27 +00:00 · 2022-12-23 11:38:22 +08:00 · 2022-12-23 11:38:22 +08:00 · 7eb2d0edb6
commit 7eb2d0edb6
parent 070c77e724
1 changed files with 0 additions and 10 deletions
--- a/egs/librispeech/ASR/transducer_lstm/train.py
+++ b/egs/librispeech/ASR/transducer_lstm/train.py
@ -629,18 +629,8 @@ def run(rank, world_size, args):
        # Keep only utterances with duration between 1 second and 20 seconds
        return 1.0 <= c.duration <= 20.0
    num_in_total = len(train_cuts)
    train_cuts = train_cuts.filter(remove_short_and_long_utt)
    num_left = len(train_cuts)
    num_removed = num_in_total - num_left
    removed_percent = num_removed / num_in_total * 100
    logging.info(f"Before removing short and long utterances: {num_in_total}")
    logging.info(f"After removing short and long utterances: {num_left}")
    logging.info(f"Removed {num_removed} utterances ({removed_percent:.5f}%)")
    train_dl = librispeech.train_dataloaders(train_cuts)
    valid_cuts = librispeech.dev_clean_cuts()