diff --git a/egs/librispeech/ASR/incremental_transf/.conformer.py.swp b/egs/librispeech/ASR/incremental_transf/.conformer.py.swp index 4f9620246..6aa342984 100644 Binary files a/egs/librispeech/ASR/incremental_transf/.conformer.py.swp and b/egs/librispeech/ASR/incremental_transf/.conformer.py.swp differ diff --git a/egs/librispeech/ASR/incremental_transf/.model.py.swp b/egs/librispeech/ASR/incremental_transf/.model.py.swp index 4c51a9134..0342b02ce 100644 Binary files a/egs/librispeech/ASR/incremental_transf/.model.py.swp and b/egs/librispeech/ASR/incremental_transf/.model.py.swp differ diff --git a/egs/librispeech/ASR/incremental_transf/conformer.py b/egs/librispeech/ASR/incremental_transf/conformer.py index ca1137f31..bc697ccbb 100644 --- a/egs/librispeech/ASR/incremental_transf/conformer.py +++ b/egs/librispeech/ASR/incremental_transf/conformer.py @@ -512,7 +512,10 @@ class Tempformer(EncoderInterface): ): layer_outputs = [] for enum, encoder in enumerate(self.encoder_layers): - layer_outputs.append(encoder(x[enum])) + x_ = x[enum].permute(1, 0, 2) + encoder_output = encoder(x_) + encoder_output = encoder_output.permute(1, 0, 2) + layer_outputs.append(encoder(x_)) return layer_outputs