From 04c11b8fdbbc4e240a9056295d990e28c57df8dd Mon Sep 17 00:00:00 2001 From: dohe0342 Date: Wed, 26 Apr 2023 12:24:15 +0900 Subject: [PATCH] from local --- .../.data2vec_audio.py.swp | Bin 40960 -> 40960 bytes .../data2vec_audio.py | 4 +--- 2 files changed, 1 insertion(+), 3 deletions(-) diff --git a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.data2vec_audio.py.swp b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.data2vec_audio.py.swp index 42cec984ae3abc821f3789d09db19939f3487285..77bce7b5ecd90a8e6ee8f2527bdf9a748dce3640 100644 GIT binary patch delta 395 zcmY+=!7GDt9LMqRvo_Dep4mg5%Su*raL`N+iyWR^m;)Cz8ncqiM3dxT2U{)5ji)3x zf5Q6ZY$tYbbRxnoYLZ&w##_7asaO5J_5FQ*^($6A#j3|%j-{ri!=urd5KE+Sl3XcO z?1H5^?xEGE#Z|?c9SWFjA_IDB#Zg_3uK9WxUsZ47#^=73b@yQ+WQYGHx4x0z+zPu- zWm}C;){NZ-H|j>KB>wvzX$D1(k;Z+e$Ud@I!Z2bmQ45HaFovc{51ye=zz$Lv#Ft;> z6IZyzIrjXLmo*MEh~T9|AuA_$}iBJ46dFAs}4jEcx1$SII( zXftdG+T{BW9MRBRHnh1!5JWb#HS~l_4}9Pq9vF8Ok4SIc~DE&dB;bW&#k diff --git a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/data2vec_audio.py b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/data2vec_audio.py index 3ac294b3d..d99a29aa0 100644 --- a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/data2vec_audio.py +++ b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/data2vec_audio.py @@ -500,9 +500,7 @@ class Data2VecAudioModel(BaseFairseqModel): except: length += features.size()[1] conv_feat_all = torch.cat([conv_feat_all, features[i]]) - print(length) - print(conv_feat_all.size()) - exit() + prompt = prompt.expand((features.size()[0], prompt.size()[0], prompt.size()[1])) features = torch.cat([prompt, features], dim=1) prompt_padding_mask = torch.zeros(prompt.size()[0], prompt.size()[1]).type(torch.BoolTensor).to(features.device)