diff --git a/egs/librispeech/ASR/pruned_transducer_stateless2/scaling.py b/egs/librispeech/ASR/pruned_transducer_stateless2/scaling.py index c0a0cb2c2..cd7faba8a 100644 --- a/egs/librispeech/ASR/pruned_transducer_stateless2/scaling.py +++ b/egs/librispeech/ASR/pruned_transducer_stateless2/scaling.py @@ -801,7 +801,6 @@ class DecorrelateFunction(torch.autograd.Function): loss.backward() decorr_x_grad = x.grad - assert x.grad is not None # Now, normalize the magnitudes of the rows of the new grad # contribution, to have magnitudes equals to ctx.scale times