diff --git a/egs/librispeech/ASR/pruned_transducer_stateless7_ctc_bs/frame_reducer.py b/egs/librispeech/ASR/pruned_transducer_stateless7_ctc_bs/frame_reducer.py index d48887426..671b7565f 100644 --- a/egs/librispeech/ASR/pruned_transducer_stateless7_ctc_bs/frame_reducer.py +++ b/egs/librispeech/ASR/pruned_transducer_stateless7_ctc_bs/frame_reducer.py @@ -80,7 +80,7 @@ class FrameReducer(nn.Module): limit_lens = T - y_lens else: # In eval mode, ensure audio that is completely silent does not make any errors - limit_lens = torch.ones_like(x_lens) + limit_lens = T - torch.ones_like(x_lens) max_limit_len = limit_lens.max().int() fake_limit_indexes = torch.topk( ctc_output[:, :, blank_id], max_limit_len