Initial drafts/work on bidirectional conformer

This commit is contained in:
Daniel Povey 2021-09-17 13:47:54 +08:00
parent 2b0370eb18
commit cfdfcf657d
2 changed files with 883 additions and 95 deletions

File diff suppressed because it is too large Load Diff

View File

@@ -939,7 +939,7 @@ def decoder_padding_mask(
     return ys_mask
-def generate_square_subsequent_mask(sz: int) -> torch.Tensor:
+def generate_square_subsequent_mask(sz: int, device: torch.device = torch.device('cpu')) -> torch.Tensor:
     """Generate a square mask for the sequence. The masked positions are
     filled with float('-inf'). Unmasked positions are filled with float(0.0).
     The mask can be used for masked self-attention.
@@ -956,7 +956,7 @@ def generate_square_subsequent_mask(sz: int) -> torch.Tensor:
     Returns:
       A square mask of dimension (sz, sz)
     """
-    mask = (torch.triu(torch.ones(sz, sz)) == 1).transpose(0, 1)
+    mask = (torch.triu(torch.ones(sz, sz, device=device)) == 1).transpose(0, 1)
     mask = (
         mask.float()
         .masked_fill(mask == 0, float("-inf"))