diff --git a/egs/librispeech/ASR/conformer_ctc2/.conformer.py.swp b/egs/librispeech/ASR/conformer_ctc2/.conformer.py.swp index cf13a0034..613353d33 100644 Binary files a/egs/librispeech/ASR/conformer_ctc2/.conformer.py.swp and b/egs/librispeech/ASR/conformer_ctc2/.conformer.py.swp differ diff --git a/egs/librispeech/ASR/conformer_ctc2/conformer.py b/egs/librispeech/ASR/conformer_ctc2/conformer.py index e3e9ce522..e4fbc8fa7 100644 --- a/egs/librispeech/ASR/conformer_ctc2/conformer.py +++ b/egs/librispeech/ASR/conformer_ctc2/conformer.py @@ -138,8 +138,9 @@ class Conformer(Transformer): if self.group_num != 0: self.learnable_alpha = learnable_alpha self.group_layer_num = int(num_encoder_layers // self.group_num) - self.alpha = nn.Parameter(torch.rand(self.group_num)) - self.sigmoid = nn.Sigmoid() + if self.learnable_alpha: + self.alpha = nn.Parameter(torch.rand(self.group_num)) + self.sigmoid = nn.Sigmoid() self.layer_norm = nn.LayerNorm(d_model) self.interctc = interctc