From e9f86df7d52519f9d4b47f66dbdc514bc8525873 Mon Sep 17 00:00:00 2001
From: jinzr
Date: Thu, 14 Mar 2024 09:47:04 +0800
Subject: [PATCH] Update asr_datamodule.py

---
 .../ASR/pruned_transducer_stateless7/asr_datamodule.py | 8 ++++++++
 1 file changed, 8 insertions(+)

diff --git a/egs/commonvoice/ASR/pruned_transducer_stateless7/asr_datamodule.py b/egs/commonvoice/ASR/pruned_transducer_stateless7/asr_datamodule.py
index 41009831c..bf0a3e245 100644
--- a/egs/commonvoice/ASR/pruned_transducer_stateless7/asr_datamodule.py
+++ b/egs/commonvoice/ASR/pruned_transducer_stateless7/asr_datamodule.py
@@ -409,6 +409,14 @@ class CommonVoiceAsrDataModule:
             self.args.cv_manifest_dir / f"cv-{self.args.language}_cuts_train.jsonl.gz"
         )
 
+    @lru_cache()
+    def validated_cuts(self) -> CutSet:
+        logging.info("About to get validated cuts (with dev/test removed)")
+        return load_manifest_lazy(
+            self.args.cv_manifest_dir
+            / f"cv-{self.args.language}_cuts_validated.jsonl.gz"
+        )
+
     @lru_cache()
     def dev_cuts(self) -> CutSet:
         logging.info("About to get dev cuts")