From 8515d92f47170b24c94b76684494f6a0aca516d9 Mon Sep 17 00:00:00 2001 From: Yifan Yang <64255737+yfyeung@users.noreply.github.com> Date: Tue, 27 Feb 2024 10:54:54 +0800 Subject: [PATCH] Update ssl_datamodule.py --- egs/librispeech/SSL/hubert/ssl_datamodule.py | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/egs/librispeech/SSL/hubert/ssl_datamodule.py b/egs/librispeech/SSL/hubert/ssl_datamodule.py index d58014ceb..07e903600 100644 --- a/egs/librispeech/SSL/hubert/ssl_datamodule.py +++ b/egs/librispeech/SSL/hubert/ssl_datamodule.py @@ -42,17 +42,17 @@ class _SeedWorkers: class LibriSpeechDataModule: """ - DataModule for ASR experiments. + DataModule for SSL experiments. It assumes there is always one train and valid dataloader, but there can be multiple test dataloaders (e.g. LibriSpeech test-clean and test-other). - It contains all the common data pipeline modules used in ASR + It contains all the common data pipeline modules used in SSL experiments, e.g.: - dynamic batch size, - bucketing samplers, - This class should be derived for specific corpora used in ASR tasks. + This class should be derived for specific corpora used in SSL tasks. """ def __init__(self, args: argparse.Namespace): @@ -61,7 +61,7 @@ class LibriSpeechDataModule: @classmethod def add_arguments(cls, parser: argparse.ArgumentParser): group = parser.add_argument_group( - title="ASR data related options", + title="SSL data related options", description="These options are used for the preparation of " "PyTorch DataLoaders from Lhotse CutSet's -- they control the " "effective batch sizes, sampling strategies.",