shuffle full Librispeech for zipformer recipes (#869)

* shuffle libri
2025-12-11 06:55:27 +00:00 · 2023-02-03 11:54:57 +08:00 · 2023-02-03 11:54:57 +08:00 · 1e6d6f8160
commit 1e6d6f8160
parent e36ea89112
6 changed files with 18 additions and 17 deletions
--- a/egs/librispeech/ASR/pruned_transducer_stateless7/train.py
+++ b/egs/librispeech/ASR/pruned_transducer_stateless7/train.py
@@ -1043,10 +1043,10 @@ def run(rank, world_size, args):
    librispeech = LibriSpeechAsrDataModule(args)
-    train_cuts = librispeech.train_clean_100_cuts()
    if params.full_libri:
-        train_cuts += librispeech.train_clean_360_cuts()
+        train_cuts = librispeech.train_all_shuf_cuts()
-        train_cuts += librispeech.train_other_500_cuts()
+    else:
+        train_cuts = librispeech.train_clean_100_cuts()
    def remove_short_and_long_utt(c: Cut):
        # Keep only utterances with duration between 1 second and 20 seconds
--- a/egs/librispeech/ASR/pruned_transducer_stateless7_ctc/train.py
+++ b/egs/librispeech/ASR/pruned_transducer_stateless7_ctc/train.py
@@ -1072,10 +1072,10 @@ def run(rank, world_size, args):
    librispeech = LibriSpeechAsrDataModule(args)
-    train_cuts = librispeech.train_clean_100_cuts()
    if params.full_libri:
-        train_cuts += librispeech.train_clean_360_cuts()
+        train_cuts = librispeech.train_all_shuf_cuts()
-        train_cuts += librispeech.train_other_500_cuts()
+    else:
+        train_cuts = librispeech.train_clean_100_cuts()
    def remove_short_and_long_utt(c: Cut):
        # Keep only utterances with duration between 1 second and 20 seconds
--- a/egs/librispeech/ASR/pruned_transducer_stateless7_ctc_bs/train.py
+++ b/egs/librispeech/ASR/pruned_transducer_stateless7_ctc_bs/train.py
@@ -55,9 +55,9 @@ import torch.multiprocessing as mp
 import torch.nn as nn
 from asr_datamodule import LibriSpeechAsrDataModule
 from decoder import Decoder
+from frame_reducer import FrameReducer
 from joiner import Joiner
 from lconv import LConv
-from frame_reducer import FrameReducer
 from lhotse.cut import Cut
 from lhotse.dataset.sampling.base import CutSampler
 from lhotse.utils import fix_random_seed
@@ -1063,10 +1063,10 @@ def run(rank, world_size, args):
    librispeech = LibriSpeechAsrDataModule(args)
-    train_cuts = librispeech.train_clean_100_cuts()
    if params.full_libri:
-        train_cuts += librispeech.train_clean_360_cuts()
+        train_cuts = librispeech.train_all_shuf_cuts()
-        train_cuts += librispeech.train_other_500_cuts()
+    else:
+        train_cuts = librispeech.train_clean_100_cuts()
    def remove_short_and_long_utt(c: Cut):
        # Keep only utterances with duration between 1 second and 20 seconds
--- a/egs/librispeech/ASR/pruned_transducer_stateless7_streaming/train.py
+++ b/egs/librispeech/ASR/pruned_transducer_stateless7_streaming/train.py
@@ -1049,10 +1049,10 @@ def run(rank, world_size, args):
    librispeech = LibriSpeechAsrDataModule(args)
-    train_cuts = librispeech.train_clean_100_cuts()
    if params.full_libri:
-        train_cuts += librispeech.train_clean_360_cuts()
+        train_cuts = librispeech.train_all_shuf_cuts()
-        train_cuts += librispeech.train_other_500_cuts()
+    else:
+        train_cuts = librispeech.train_clean_100_cuts()
    def remove_short_and_long_utt(c: Cut):
        # Keep only utterances with duration between 1 second and 20 seconds
--- a/egs/librispeech/ASR/pruned_transducer_stateless8/train.py
+++ b/egs/librispeech/ASR/pruned_transducer_stateless8/train.py
@@ -1154,10 +1154,10 @@ def run(rank, world_size, args):
    librispeech = LibriSpeech(manifest_dir=args.manifest_dir)
-    train_cuts = librispeech.train_clean_100_cuts()
    if params.full_libri:
-        train_cuts += librispeech.train_clean_360_cuts()
+        train_cuts = librispeech.train_all_shuf_cuts()
-        train_cuts += librispeech.train_other_500_cuts()
+    else:
+        train_cuts = librispeech.train_clean_100_cuts()
    train_cuts = filter_short_and_long_utterances(train_cuts, sp)
--- a/egs/librispeech/ASR/streaming_conformer_ctc/train.py
+++ b/egs/librispeech/ASR/streaming_conformer_ctc/train.py
@@ -30,6 +30,7 @@ import torch.multiprocessing as mp
 import torch.nn as nn
 from asr_datamodule import LibriSpeechAsrDataModule
 from conformer import Conformer
+from lhotse.cut import Cut
 from lhotse.utils import fix_random_seed
 from torch import Tensor
 from torch.nn.parallel import DistributedDataParallel as DDP
@@ -50,7 +51,7 @@ from icefall.utils import (
    setup_logger,
    str2bool,
 )
-from lhotse.cut import Cut
+
 def get_parser():
    parser = argparse.ArgumentParser(