diff --git a/egs/librispeech/ASR/pruned_transducer_stateless2/scaling.py b/egs/librispeech/ASR/pruned_transducer_stateless2/scaling.py
index c0a0cb2c2..cd7faba8a 100644
--- a/egs/librispeech/ASR/pruned_transducer_stateless2/scaling.py
+++ b/egs/librispeech/ASR/pruned_transducer_stateless2/scaling.py
@@ -801,7 +801,6 @@ class DecorrelateFunction(torch.autograd.Function):
             loss.backward()
 
         decorr_x_grad = x.grad
-        assert x.grad is not None
 
         # Now, normalize the magnitudes of the rows of the new grad
         # contribution, to have magnitudes equals to ctx.scale times