diff --git a/egs/librispeech/ASR/pruned_transducer_stateless2/conformer.py b/egs/librispeech/ASR/pruned_transducer_stateless2/conformer.py index 85a3b4575..9c8302926 100644 --- a/egs/librispeech/ASR/pruned_transducer_stateless2/conformer.py +++ b/egs/librispeech/ASR/pruned_transducer_stateless2/conformer.py @@ -231,7 +231,7 @@ class ConformerEncoderLayer(nn.Module): # compensate for the small scale by just producing larger output. warmup = max(warmup, 0.1) if self.training: - warmup = min(warmup, 0.99) # effectively, layer-drop with 1-in-100 prob. + warmup = min(warmup, 0.95) # effectively, layer-drop with 1-in-20 prob. alpha = 1.0 if torch.rand(()).item() <= warmup else 0.1 # macaron style feed forward module