Speed up yesno training to finish in ~10s on CPU

Setting `persistent_workers=True` when creating the DataLoader keeps the worker processes alive between iterations, which removes a significant startup overhead at the beginning of each epoch and each validation run.
This commit is contained in:
Piotr Żelasko 2023-08-12 20:46:25 -04:00 committed by GitHub
parent dfccadc6b6
commit 6f2128a511
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

View File

@@ -209,7 +209,7 @@ class YesNoAsrDataModule(DataModule):
sampler=train_sampler,
batch_size=None,
num_workers=self.args.num_workers,
-persistent_workers=False,
+persistent_workers=True,
)
return train_dl
@@ -236,6 +236,7 @@ class YesNoAsrDataModule(DataModule):
batch_size=None,
sampler=sampler,
num_workers=self.args.num_workers,
+persistent_workers=True,
)
return test_dl