diff --git a/egs/librispeech/ASR/.run_v3.sh.swp b/egs/librispeech/ASR/.run_v3.sh.swp index 9b0e1b66d..cccf26bf7 100644 Binary files a/egs/librispeech/ASR/.run_v3.sh.swp and b/egs/librispeech/ASR/.run_v3.sh.swp differ diff --git a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.train.py.swp b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.train.py.swp index b5563203e..ba895242c 100644 Binary files a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.train.py.swp and b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.train.py.swp differ diff --git a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/train.py b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/train.py index cc97dd06f..a700a5c66 100755 --- a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/train.py +++ b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/train.py @@ -550,13 +550,14 @@ def get_encoder_model(params: AttributeDict) -> nn.Module: num_encoder_layers=to_int_tuple(params.num_encoder_layers), ) ''' - encoder = FairSeqData2VecEncoder( - input_size=768, #params.encoder_dim, - w2v_url='None', - output_size=768, #params.encoder_dim, - freeze_finetune_updates=0, #params.freeze_finetune_updates*params.accum_grads, - additional_block=True, #params.additional_block, - ) + if params.encoder_type == 'd2v': + encoder = FairSeqData2VecEncoder( + input_size=params.encoder_dim, + w2v_url='None', + output_size=params.encoder_dim, + freeze_finetune_updates=params.freeze_finetune_updates*params.accum_grads, + additional_block=True, #params.additional_block, + ) return encoder