diff --git a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.data2vec_audio.py.swp b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.data2vec_audio.py.swp index 639b70d50..aa2aae245 100644 Binary files a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.data2vec_audio.py.swp and b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.data2vec_audio.py.swp differ diff --git a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.data2vec_encoder.py.swp b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.data2vec_encoder.py.swp index c1eb94c56..96a8c318b 100644 Binary files a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.data2vec_encoder.py.swp and b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.data2vec_encoder.py.swp differ diff --git a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/data2vec_encoder.py b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/data2vec_encoder.py index 3732bcc2a..b1975cec6 100644 --- a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/data2vec_encoder.py +++ b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/data2vec_encoder.py @@ -128,6 +128,7 @@ class FairSeqData2VecEncoder(EncoderInterface): mask = ft, features_only=True, prompt=prompt, + sid=sid, ) xs_pad = enc_outputs["x"] # (B,T,C),