diff --git a/egs/grid/AVSR/lipnet_ctc_vsr/decode.py b/egs/grid/AVSR/lipnet_ctc_vsr/decode.py index 4e63e53c7..d4f3910a3 100644 --- a/egs/grid/AVSR/lipnet_ctc_vsr/decode.py +++ b/egs/grid/AVSR/lipnet_ctc_vsr/decode.py @@ -142,7 +142,7 @@ def get_params() -> AttributeDict: "anno_path": Path("download/GRID/GRID_align_txt"), "val_list": Path("download/GRID/unseen_val.txt"), "vid_padding": 75, - "num_workers": 1, + "num_workers": 16, "batch_size": 120, } ) diff --git a/egs/grid/AVSR/lipnet_ctc_vsr/train.py b/egs/grid/AVSR/lipnet_ctc_vsr/train.py index 6eb985832..9caa9b55a 100644 --- a/egs/grid/AVSR/lipnet_ctc_vsr/train.py +++ b/egs/grid/AVSR/lipnet_ctc_vsr/train.py @@ -181,7 +181,7 @@ def get_params() -> AttributeDict: "train_list": Path("download/GRID/unseen_train.txt"), "vid_padding": 75, "aud_padding": 200, - "num_workers": 1, + "num_workers": 16, "batch_size": 120, } ) diff --git a/egs/grid/AVSR/local/dataset_av.py b/egs/grid/AVSR/local/dataset_av.py index 70957c14b..2f023b080 100644 --- a/egs/grid/AVSR/local/dataset_av.py +++ b/egs/grid/AVSR/local/dataset_av.py @@ -8,7 +8,7 @@ import torch import torchaudio from torch.utils.data import Dataset -from cvtransforms import HorizontalFlip, ColorNormalize +from .cvtransforms import HorizontalFlip, ColorNormalize class dataset_av(Dataset): diff --git a/egs/grid/AVSR/local/dataset_visual.py b/egs/grid/AVSR/local/dataset_visual.py index 557e8aec0..6fb826b48 100644 --- a/egs/grid/AVSR/local/dataset_visual.py +++ b/egs/grid/AVSR/local/dataset_visual.py @@ -4,7 +4,7 @@ import os import numpy as np import torch from torch.utils.data import Dataset -from cvtransforms import HorizontalFlip, ColorNormalize +from .cvtransforms import HorizontalFlip, ColorNormalize class dataset_visual(Dataset):