Revert ASR data module

This commit is contained in:
Yuekai Zhang 2024-01-15 19:59:48 +08:00
parent e883bb60d4
commit eea46458c5
3 changed files with 6 additions and 1179 deletions

View File

@@ -30,7 +30,7 @@ from lhotse.dataset import (
DynamicBucketingSampler,
K2SpeechRecognitionDataset,
PrecomputedFeatures,
-SingleCutSampler,
+SimpleCutSampler,
SpecAugment,
)
from lhotse.dataset.input_strategies import OnTheFlyFeatures
@@ -198,7 +198,7 @@ class AishellAsrDataModule:
if self.args.enable_musan:
logging.info("Enable MUSAN")
transforms.append(
-CutMix(cuts=cuts_musan, prob=0.5, snr=(10, 20), preserve_id=True)
+CutMix(cuts=cuts_musan, p=0.5, snr=(10, 20), preserve_id=True)
)
else:
logging.info("Disable MUSAN")
@@ -278,8 +278,8 @@ class AishellAsrDataModule:
drop_last=self.args.drop_last,
)
else:
-logging.info("Using SingleCutSampler.")
-train_sampler = SingleCutSampler(
+logging.info("Using SimpleCutSampler.")
+train_sampler = SimpleCutSampler(
cuts_train,
max_duration=self.args.max_duration,
shuffle=self.args.shuffle,

File diff suppressed because it is too large Load Diff

View File

@@ -0,0 +1 @@
+../../../librispeech/ASR/zipformer/optim.py

3
egs/aishell/ASR/whisper/requirements.txt Normal file → Executable file
View File

@@ -1,6 +1,5 @@
k2
kaldialign
-#lhotse==1.18
git+https://github.com/lhotse-speech/lhotse
sentencepiece
tensorboard
@@ -8,4 +7,4 @@ librosa
openai-whisper==20231117
zhconv
WeTextProcessing
deepspeed
deepspeed