diff --git a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.data2vec_encoder.py.swp b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.data2vec_encoder.py.swp index 30a6bc658..5db563cbf 100644 Binary files a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.data2vec_encoder.py.swp and b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.data2vec_encoder.py.swp differ diff --git a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/data2vec_encoder.py b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/data2vec_encoder.py index 8c79c0f75..37ad7edf1 100644 --- a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/data2vec_encoder.py +++ b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/data2vec_encoder.py @@ -73,15 +73,6 @@ class FairSeqData2VecEncoder(EncoderInterface): model.feature_grad_mult = 0.0 ## for conv network freeze model.mask_prob = 0.5 ## for conv network freeze - if not isinstance(model, Wav2Vec2Model): - try: - model = model.w2v_encoder.w2v_model - - except: - print( - "using data2vec ..." - ) - self.encoders = model self.pretrained_params = copy.deepcopy(model.state_dict())