diff --git a/egs/librispeech/ASR/pruned_transducer_stateless2/scaling.py b/egs/librispeech/ASR/pruned_transducer_stateless2/scaling.py index e490ca20d..81e49ae23 100644 --- a/egs/librispeech/ASR/pruned_transducer_stateless2/scaling.py +++ b/egs/librispeech/ASR/pruned_transducer_stateless2/scaling.py @@ -179,7 +179,7 @@ class ScaledLinear(nn.Linear): with torch.no_grad(): self.weight[:] *= initial_scale if self.bias is not None: - self.bias[:] *= initial_scale * 4.0 + self.bias[:] *= 2.0 * initial_scale def get_weight(self): # not needed any more but kept for back compatibility return self.weight