diff --git a/egs/librispeech/ASR/conformer_ctc2/.decode.py.swp b/egs/librispeech/ASR/conformer_ctc2/.decode.py.swp index ae84f40a1..c7871579f 100644 Binary files a/egs/librispeech/ASR/conformer_ctc2/.decode.py.swp and b/egs/librispeech/ASR/conformer_ctc2/.decode.py.swp differ diff --git a/egs/librispeech/ASR/conformer_ctc2/decode.py b/egs/librispeech/ASR/conformer_ctc2/decode.py index 2c72b1187..7c4dc7ec9 100755 --- a/egs/librispeech/ASR/conformer_ctc2/decode.py +++ b/egs/librispeech/ASR/conformer_ctc2/decode.py @@ -342,6 +342,8 @@ def decode_one_batch( supervisions = batch["supervisions"] nnet_output, memory, memory_key_padding_mask = model(feature, supervisions) + if type(nnet_output) == tuple: + nnet_output = nnet_output[0] supervision_segments = torch.stack( (