diff --git a/egs/libriheavy/ASR/zipformer_prompt_asr/asr_datamodule.py b/egs/libriheavy/ASR/zipformer_prompt_asr/asr_datamodule.py index 7a2a61a30..690003377 100644 --- a/egs/libriheavy/ASR/zipformer_prompt_asr/asr_datamodule.py +++ b/egs/libriheavy/ASR/zipformer_prompt_asr/asr_datamodule.py @@ -25,14 +25,13 @@ from typing import Any, Callable, Dict, List, Optional import torch from dataset import PromptASRDataset from lhotse import CutSet, Fbank, FbankConfig, load_manifest, load_manifest_lazy -from lhotse.dataset import ( +from lhotse.dataset import ( # SingleCutSampler, CutConcatenate, CutMix, DynamicBucketingSampler, ExtraPadding, K2SpeechRecognitionDataset, PrecomputedFeatures, - SingleCutSampler, SpecAugment, ) from lhotse.dataset.input_strategies import OnTheFlyFeatures @@ -211,7 +210,7 @@ class LibriHeavyAsrDataModule: ) group.add_argument( - "--topk-k", + "--top-k", type=int, default=10000, help="""The top-k words are identified as common words, @@ -261,7 +260,7 @@ class LibriHeavyAsrDataModule: logging.info("About to get Musan cuts") cuts_musan = load_manifest(self.args.manifest_dir / "musan_cuts.jsonl.gz") transforms.append( - CutMix(cuts=cuts_musan, prob=0.5, snr=(10, 20), preserve_id=True) + CutMix(cuts=cuts_musan, p=0.5, snr=(10, 20), preserve_id=True) ) else: logging.info("Disable MUSAN") @@ -345,11 +344,8 @@ class LibriHeavyAsrDataModule: drop_last=True, ) else: - logging.info("Using SingleCutSampler.") - train_sampler = SingleCutSampler( - cuts_train, - max_duration=self.args.max_duration, - shuffle=self.args.shuffle, + raise NotImplementedError( + "SingleCutSampler is no longer supported by lhotse" ) logging.info("About to create train dataloader") diff --git a/egs/libriheavy/ASR/zipformer_prompt_asr/dataset.py b/egs/libriheavy/ASR/zipformer_prompt_asr/dataset.py index 9602e9270..fa508ba58 100644 --- a/egs/libriheavy/ASR/zipformer_prompt_asr/dataset.py +++ b/egs/libriheavy/ASR/zipformer_prompt_asr/dataset.py @@ -205,7 +205,7 @@ def triplet_text_sampling( rare_word_list: Optional[List[str]] = None, transforms: Optional[List[Callable[[str], str]]] = None, min_len_style: Optional[int] = 80, -) -> Dict[str, str, str]: +) -> Dict[str, str]: """This function generates a triplet of (pre_text, style_text, ref_text). The style of style_text and ref_text should **always** match, whereas the style of pre_text is arbitrary.