revert asr data module

2025-12-11 06:55:27 +00:00 · 2024-01-15 19:59:48 +08:00 · 2024-01-15 19:59:48 +08:00 · eea46458c5
commit eea46458c5
parent e883bb60d4
3 changed files with 6 additions and 1179 deletions
--- a/egs/aishell/ASR/tdnn_lstm_ctc/asr_datamodule.py
+++ b/egs/aishell/ASR/tdnn_lstm_ctc/asr_datamodule.py
@@ -30,7 +30,7 @@ from lhotse.dataset import (
    DynamicBucketingSampler,
    K2SpeechRecognitionDataset,
    PrecomputedFeatures,
-    SingleCutSampler,
+    SimpleCutSampler,
    SpecAugment,
 )
 from lhotse.dataset.input_strategies import OnTheFlyFeatures
@@ -198,7 +198,7 @@ class AishellAsrDataModule:
        if self.args.enable_musan:
            logging.info("Enable MUSAN")
            transforms.append(
-                CutMix(cuts=cuts_musan, prob=0.5, snr=(10, 20), preserve_id=True)
+                CutMix(cuts=cuts_musan, p=0.5, snr=(10, 20), preserve_id=True)
            )
        else:
            logging.info("Disable MUSAN")
@@ -278,8 +278,8 @@ class AishellAsrDataModule:
                drop_last=self.args.drop_last,
            )
        else:
-            logging.info("Using SingleCutSampler.")
-            train_sampler = SingleCutSampler(
+            logging.info("Using SimpleCutSampler.")
+            train_sampler = SimpleCutSampler(
                cuts_train,
                max_duration=self.args.max_duration,
                shuffle=self.args.shuffle,
--- a/egs/aishell/ASR/whisper/optim.py
+++ b/egs/aishell/ASR/whisper/optim.py
--- a/egs/aishell/ASR/whisper/optim.py
+++ b/egs/aishell/ASR/whisper/optim.py
@@ -0,0 +1 @@
+../../../librispeech/ASR/zipformer/optim.py
--- a/egs/aishell/ASR/whisper/requirements.txt
+++ b/egs/aishell/ASR/whisper/requirements.txt
@@ -1,6 +1,5 @@
 k2
 kaldialign
-#lhotse==1.18
 git+https://github.com/lhotse-speech/lhotse
 sentencepiece
 tensorboard
@@ -8,4 +7,4 @@ librosa
 openai-whisper==20231117
 zhconv
 WeTextProcessing
-deepspeed
+deepspeed