From cdaa455848e66209272135262df6f5a0816c99c5 Mon Sep 17 00:00:00 2001 From: dohe0342 Date: Mon, 26 Dec 2022 13:27:21 +0900 Subject: [PATCH] from local --- egs/librispeech/ASR/.run_v3.sh.swp | Bin 12288 -> 12288 bytes .../.data2vec_audio.py.swp | Bin 36864 -> 40960 bytes .../data2vec_audio.py | 3 ++- 3 files changed, 2 insertions(+), 1 deletion(-) diff --git a/egs/librispeech/ASR/.run_v3.sh.swp b/egs/librispeech/ASR/.run_v3.sh.swp index 85e1973ad17a64feb2e3bed9ea14be5eec73f88e..1cd626763cd703218116b3a4c04380ed4c518c5d 100644 GIT binary patch delta 32 mcmZojXh;xGG6?hZRj|}EU;qLE28L#(mB}9t|Jf-1QXc@44hmfW delta 32 mcmZojXh;xGG6?hZRj|}EU;qLE28JUa7AHTn`n6H~r9J?e1`5mo diff --git a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.data2vec_audio.py.swp b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/.data2vec_audio.py.swp index 0c4c90ff218c567171e693f74a2ac91dccff7f28..fec41979dd044848d2a6bc5620557b6963a7737f 100644 GIT binary patch delta 808 zcmXxiO-K}R7{~EvcE?;d*Byn{mrGM?&F-5~6?0hYbf(41#s1$bEDp06)r*=F?A+z!WACh94F1 z;+sR{5e!^(NL&uE_?j!SfEh$k3l}!`h@_A}6m|HO!%OfS&k#d3s!)gzs>pl1z%pVu zhZ+>&i(TX;`q5`U%_&&y$Bs=Tiw&$}6_2ri8H}P8K?LAORuNfJOtU%UH0s+9c}{hN z`Uk?%!|k12M@0WuUbC?+RUHp?FeMIP9oU-x|9oD%MOHA58|c9m)T11K3Pe65jU`MY z3@@@Skqpwfg+a8S0cW8jL$X`>O!^axSwzu@Qfv@s0#?jHSTX-5$~U-&UbNsiR6HQU zSqx(cmH0t|+jxs9OyU|wPzen`b1(335$PR_;uwyi6d#Fo5lP&}G_GR+5d`7KJ`^C! T1T#n?mSZZau9{DpZ#s7Yu9kd- delta 414 zcmXBQze@sf7{~GFduM5C-Bn6wpAIn%o X0uDO-vZ1`qqjJzSQls8ZsuceNE$u~h diff --git a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/data2vec_audio.py b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/data2vec_audio.py index 4c9f531e4..3cc958659 100644 --- a/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/data2vec_audio.py +++ b/egs/librispeech/ASR/pruned_transducer_stateless_d2v_v2/data2vec_audio.py @@ -274,7 +274,8 @@ class Data2VecAudioModel(BaseFairseqModel): torch.FloatTensor(cfg.encoder_embed_dim).uniform_() ) - self.encoder = TransformerEncoder(cfg) + #self.encoder = TransformerEncoder(cfg) + self.encoder = TransformerEncoderAdapter(cfg) self.layer_norm = LayerNorm(self.extractor_embed) self.final_proj = nn.Linear(self.embed, self.embed)