From d05ffc1294869db692b5e4065105da272f130b38 Mon Sep 17 00:00:00 2001 From: dohe0342 Date: Tue, 11 Apr 2023 16:50:13 +0900 Subject: [PATCH] from local --- .../.data2vec_audio.py.swp | Bin 40960 -> 40960 bytes .../.model.py.swp | Bin 28672 -> 28672 bytes .../data2vec_audio.py | 1 + 3 files changed, 1 insertion(+) diff --git a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.data2vec_audio.py.swp b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.data2vec_audio.py.swp index ea84c5876661113ccde97747db1f0f219fd8d0f4..a39ab45e25c204dc0b5d25f73a385ccb455ea019 100644 GIT binary patch delta 106 zcmZoTz|?SnX~P5oMwiVK1&Z}~53w*XyklixU=UznaG5OV@L4g6oq-_|h;@Ki8;IF~ z_%Is-Lk$p{0`a@es*V>}HjBCyF$xuB=9Op^B&MWf=B3ByCKhLFPBv7N+&sxWF9HB% C-5ZYp delta 91 zcmZoTz|?SnX~P5oM(52F1&Z}~pRq77@Uby4FbFU(I8PRI_^epT&cNUU#NI%x4#bav mvU7kq6o^48-)>fQyudQ~o2%sJcdnI;lkL^GH&1fUivR%c5f>-` diff --git a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.model.py.swp b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.model.py.swp index 258053f5a4376d5c1b3159b275378fa6b503a22d..2aaae08de44bb619c129b3e970699651fadcb3a9 100644 GIT binary patch delta 32 mcmZp8z}WDBQ8dXQ%+puFQqO<^2m}}yVg*c73^t0s&IbUJtq5}f delta 32 mcmZp8z}WDBQ8dXQ%+puFQqO<^2m}}y0tHM{7&eN&&IbUIQ3y8x diff --git a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/data2vec_audio.py b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/data2vec_audio.py index 383a98a00..491bb6b35 100644 --- a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/data2vec_audio.py +++ b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/data2vec_audio.py @@ -495,6 +495,7 @@ class Data2VecAudioModel(BaseFairseqModel): features = torch.cat([prompt, features], dim=1) prompt_padding_mask = torch.zeros(prompt.size()[0], prompt.size()[1]).type(torch.BoolTensor).to(features.device) padding_mask = torch.cat([prompt_padding_mask, padding_mask], dim=1) + print(padding_mask) features = self.layer_norm(features)