From 942e813915ce6d6e590bcefd9e992f5cba33ef00 Mon Sep 17 00:00:00 2001 From: dohe0342 Date: Wed, 26 Apr 2023 12:21:40 +0900 Subject: [PATCH] from local --- .../.data2vec_audio.py.swp | Bin 40960 -> 40960 bytes .../data2vec_audio.py | 5 +++-- 2 files changed, 3 insertions(+), 2 deletions(-) diff --git a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.data2vec_audio.py.swp b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.data2vec_audio.py.swp index 3afcbcb3d98b4439abb3fdac4785ec2ee8f418f8..10f14087137de00c96d901f27c1978e8e2f7ca16 100644 GIT binary patch delta 203 zcmZoTz|?SnNi@kI%+puFQqO<^2m}}yGG}Li><8j*APxs&Cm@yt;=Sw)3`>Ey1c)_&_&-qBo6WM0w^=9mx(QDlRv|4lv81#pwOFq>vno|XGukkA@@)4`5rl%g{Jg5vqWoxs*vY0I aUEEL!TLlA#$$Q+DCSUbX-z@L>Fbn|0Z8{THUn`z5PJi$84wEq@fM(}IY1l$#Ogo{()D?>tmAFg$?sd(C-=GuPkz_J zG5LWe8<@@QUO9QIdj)?%QD$C=MqYkiRccXww87*;cj3uF9+i`A+{GsU@KBdj00M}b YwA93s(xTL2z2eNOR1M9|qMonA0GNh33jhEB diff --git a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/data2vec_audio.py b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/data2vec_audio.py index a6e92adec..b7b015142 100644 --- a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/data2vec_audio.py +++ b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/data2vec_audio.py @@ -490,14 +490,15 @@ class Data2VecAudioModel(BaseFairseqModel): ## for prompt tuning if prompt is not None: - print(features.size()) conv_feat_all = torch.tensor([]).to(features.device) + length = 0 for i in range(padding_mask.size()[0]): nonzero = padding_mask[i].nonzero() try: - print(nonzero[0]) + length += nonzero[0] conv_feat_all = torch.cat([conv_feat_all, features[i, :nonzero[0], :]]) except: + length += features.size()[1] conv_feat_all = torch.cat([conv_feat_all, features[i]]) print(conv_feat_all.size()) exit()