Minor fixes after review.

This commit is contained in:
Fangjun Kuang 2022-01-25 18:46:35 +08:00
parent dd2acd89fd
commit 4749619e5a

View File

@ -785,13 +785,9 @@ class RelPositionMultiheadAttention(nn.Module):
     matrix_ac + matrix_bd
 ) * scaling  # (batch, head, time1, time2)
-attn_output_weights = attn_output_weights.view(
-    bsz * num_heads, tgt_len, -1
-)
-attn_output_weights = attn_output_weights.view(
-    bsz, num_heads, tgt_len, -1
-).permute(0, 2, 3, 1)
+# attn_output_weights is of shape (bsz, num_heads, tgt_len, src_len)
+attn_output_weights = attn_output_weights.permute(0, 2, 3, 1)
 # now attn_output_weights is of shape (bsz, tgt_len, src_len, num_heads)
 attn_output_weights = torch.matmul(